Final_Assignment_Template

Paused

martinsu committed on May 4

Commit

61feb08

1 Parent(s): c589af7

Enhance app.py to validate and format SPACE_ID at startup, ensuring proper username/repo structure; update requirements.txt to add pandas dependency.

Files changed (3) hide show

app.py CHANGED Viewed

@@ -283,7 +283,21 @@ if __name__ == "__main__":
     print("\n" + "-"*30 + " App Starting " + "-"*30)
     # Check for SPACE_HOST and SPACE_ID at startup for information
     space_host_startup = os.getenv("SPACE_HOST")
-    space_id_startup = os.getenv("SPACE_ID") # Get SPACE_ID at startup
     if space_host_startup:
         print(f"✅ SPACE_HOST found: {space_host_startup}")

     print("\n" + "-"*30 + " App Starting " + "-"*30)
     # Check for SPACE_HOST and SPACE_ID at startup for information
     space_host_startup = os.getenv("SPACE_HOST")
+    space_id_raw = os.getenv("SPACE_ID", "")
+    # Ensure proper SPACE_ID format with username/repo
+    if not space_id_raw:
+        # Default if completely missing
+        space_id_startup = "martinsu/Final_Assignment_Template"
+    elif "/" in space_id_raw and not space_id_raw.startswith("/"):
+        # Already has proper username/repo format
+        space_id_startup = space_id_raw
+    elif space_id_raw.startswith("/"):
+        # Has a leading slash but missing username
+        space_id_startup = f"martinsu{space_id_raw}"
+    else:
+        # Just repo name without username
+        space_id_startup = f"martinsu/{space_id_raw}"
     if space_host_startup:
         print(f"✅ SPACE_HOST found: {space_host_startup}")

requirements.txt CHANGED Viewed

@@ -10,4 +10,5 @@ daytona_sdk
 yt_dlp
 tavily-python
 langfuse
-langchain

 yt_dlp
 tavily-python
 langfuse
+langchain
+pandas

result_dataset.py ADDED Viewed

+from datasets import load_dataset
+import duckdb
+# Login using e.g. `huggingface-cli login` to access this dataset
+ds = load_dataset("agents-course/unit4-students-scores")
+# Convert the dataset to a Pandas DataFrame
+df = ds["train"].to_pandas()
+# Initialize DuckDB connection
+con = duckdb.connect(":memory:")
+# Register the DataFrame as a table
+con.register("train", df)
+# SQL query: rank of user 'martinsu' by score (descending) among the filtered rows
+query = """
+WITH FilteredTrains AS (
+    SELECT *
+    FROM train
+    WHERE (code LIKE '%' || username || '%') or username = 'martinsu'
+),
+RankedTrains AS (
+    SELECT
+        code,
+        username,
+        score,
+        RANK() OVER (ORDER BY score DESC) AS rank
+    FROM
+        FilteredTrains
+)
+SELECT
+    rank
+FROM
+    RankedTrains
+WHERE
+    username = 'martinsu';
+"""
+result = con.execute(query).fetchdf()
+print(result)