Spaces:

MLE-Dojo
/

Leaderboard

Running

App Files Community

Jerrycool committed on Apr 26

Commit

c13e962

verified ·

1 Parent(s): 3dd92ec

Update app.py

Browse files

Files changed (1) hide show

app.py +64 -141

app.py CHANGED Viewed

@@ -3,55 +3,49 @@ import pandas as pd
 from apscheduler.schedulers.background import BackgroundScheduler
 """
-MLE‑Dojo Benchmark Leaderboard — Polished Edition
--------------------------------------------------
-This version focuses on premium typography, elegant color palette, and richer
-UI controls (including ascending/descending sort) while remaining completely
-self‑contained.
-*️⃣  HOW TO USE
--------------------------------------------------
-1. Install deps →  `pip install gradio pandas apscheduler`
-2. Launch         →  `python mle_dojo_leaderboard_app.py`
-3. Tailor any of the placeholder values (TITLE, INTRODUCTION_TEXT, etc.) to your
-   project or import them from your own `src` package — the try/except block at
-   the top handles either workflow gracefully.
 """
 # ---------------------------------------------------------------------------
-#  Placeholder fall‑back imports (remove once your own src/ is in PYTHONPATH)
 # ---------------------------------------------------------------------------
 try:
     from src.about import (
         CITATION_BUTTON_LABEL,
         CITATION_BUTTON_TEXT,
-        EVALUATION_QUEUE_TEXT,
         INTRODUCTION_TEXT,
         LLM_BENCHMARKS_TEXT,
         TITLE,
     )
-    from src.display.css_html_js import custom_css  # optional
     from src.envs import REPO_ID
     from src.submission.submit import add_new_eval
-    print("✅ Imported UI copy & helpers from src package.")
 except ImportError:
-    print("⚠️  Falling back to local placeholders — customise as needed.")
     CITATION_BUTTON_LABEL = "Citation"
     CITATION_BUTTON_TEXT  = "Please cite us if you use this benchmark…"
-    EVALUATION_QUEUE_TEXT = "Current evaluation queue:"
-    INTRODUCTION_TEXT     = "Welcome to the **MLE‑Dojo Benchmark Leaderboard** — compare LLM agents across real‑world ML engineering tasks."
-    LLM_BENCHMARKS_TEXT   = "Further details about tasks, metrics, and evaluation pipelines."
     TITLE = (
-        "<h1 class='hero-title gradient-text'>\U0001F3C6 MLE‑Dojo Benchmark Leaderboard</h1>"
-        "<p class='subtitle'>Interactive, reproducible &amp; community‑driven ML agent benchmarking</p>"
     )
-    custom_css = ""  # will be extended below
     REPO_ID = "your/space-id"
     def add_new_eval(*_):
         return "Submission placeholder."
 # ---------------------------------------------------------------------------
-#  Data — extend / refresh as new checkpoints are evaluated
 # ---------------------------------------------------------------------------
 data = [
     {"model_name": "gpt-4o-mini",     "url": "https://openai.com/index/gpt-4o-mini-advancing-cost-efficient-intelligence/", "organizer": "OpenAI",  "license": "Proprietary", "MLE-Lite_Elo": 753,  "Tabular_Elo": 839,  "NLP_Elo": 758,  "CV_Elo": 754,  "Overall": 778},
@@ -66,7 +60,7 @@ data = [
 master_df = pd.DataFrame(data)
 # ---------------------------------------------------------------------------
-#  Category helpers
 # ---------------------------------------------------------------------------
 CATEGORIES = ["Overall", "MLE-Lite", "Tabular", "NLP", "CV"]
 DEFAULT_CATEGORY = "Overall"
@@ -78,130 +72,75 @@ CATEGORY_MAP = {
     "CV": "CV_Elo",
 }
-# ---------------------------------------------------------------------------
-#  Leaderboard Update Routine
-# ---------------------------------------------------------------------------
 def update_leaderboard(category: str, ascending: bool):
-    """Return a fresh, nicely formatted DataFrame based on user selections."""
-    score_col = CATEGORY_MAP.get(category, CATEGORY_MAP[DEFAULT_CATEGORY])
     df = (
-        master_df[["model_name", "url", "organizer", "license", score_col]].copy()
-        .sort_values(by=score_col, ascending=ascending)
         .reset_index(drop=True)
     )
-    # Add Rank & hyperlink the model name
     df.insert(0, "Rank", df.index + 1)
-    df["Model"] = (
-        df.apply(lambda r: f"<a href='{r.url}' target='_blank'>{r.model_name}</a>", axis=1)
-    )
-    df.rename(columns={
-        "organizer": "Organizer",
-        "license": "License",
-        score_col: "Elo Score",
-    }, inplace=True)
     return df[["Rank", "Model", "Organizer", "License", "Elo Score"]]
 # ---------------------------------------------------------------------------
-#  Custom CSS — premium typography & subtle surfaces
 # ---------------------------------------------------------------------------
 custom_css += """
 @import url('https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700;800&display=swap');
-html, body {
-    font-family: 'Inter', 'Helvetica Neue', Arial, sans-serif !important;
-    font-size: 17px !important;   /* slightly larger default */
-    color: #1f2937;
-    background-color: #f9fafb;
     line-height: 1.55;
 }
-/* Gradient text utility */
 .gradient-text {
-    background: linear-gradient(90deg, #0284c7 0%, #6366f1 100%);
-    -webkit-background-clip: text;
-    -webkit-text-fill-color: transparent;
 }
-/* Markdown tweaks */
-.markdown-text h2 {
-    font-weight: 600;
-    margin-top: 1.2em;
-}
-/* Radio buttons & checkboxes */
-.gr-radio, .gr-checkbox {
-    padding: 0.35em 0.75em;
-    border-radius: 0.5rem;
-    background-color: #ffffff;
-    box-shadow: 0 1px 2px rgba(0,0,0,0.06);
-}
-/* Data table */
-#leaderboard-table table {
-    width: 100%;
-    border-collapse: collapse;
-}
-#leaderboard-table th {
-    background-color: #e2e8f0;
-    font-weight: 600;
-    text-transform: uppercase;
-    font-size: 0.85rem;
-    letter-spacing: 0.03em;
-    padding: 0.6em;
-}
-#leaderboard-table td {
-    padding: 0.55em 0.6em;
-    vertical-align: top;
-}
-#leaderboard-table tr:nth-child(even) { background-color: #f8fafc; }
-#leaderboard-table tr:hover          { background-color: #eef2ff; }
 /* Links */
-a { color: #2563eb; text-decoration: none; }
-a:hover { text-decoration: underline; }
-/* Accordion style tweak */
-.gr-accordion .label {
-    font-weight: 600;
-    font-size: 1rem;
-}
 """
 # ---------------------------------------------------------------------------
-#  Gradio App  ✨
 # ---------------------------------------------------------------------------
-demo = gr.Blocks(css=custom_css, theme=gr.themes.Soft(
-    primary_hue="indigo",
-    neutral_hue="slate",
-    font=["Inter", "Helvetica Neue", "Arial", "sans-serif"],
-))
-with demo:
     gr.HTML(TITLE)
     gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
     with gr.Tabs():
-        # ---------- Leaderboard Tab ----------
-        with gr.TabItem("🏅 Leaderboard"):
-            gr.Markdown("### Model Elo Rankings by Category")
             with gr.Row():
-                category_selector = gr.Radio(
-                    choices=CATEGORIES,
-                    value=DEFAULT_CATEGORY,
-                    label="Category",
-                    interactive=True,
-                )
-                order_checkbox = gr.Checkbox(
-                    label="⬆️ Ascending order (lower Elo first)",
-                    value=False,
-                )
-            leaderboard_table = gr.Dataframe(
                 value=update_leaderboard(DEFAULT_CATEGORY, False),
                 headers=["Rank", "Model", "Organizer", "License", "Elo Score"],
                 datatype=["number", "html", "str", "str", "number"],
@@ -210,42 +149,26 @@ with demo:
                 interactive=False,
                 elem_id="leaderboard-table",
             )
-            # wire‑up events
-            category_selector.change(update_leaderboard, [category_selector, order_checkbox], leaderboard_table)
-            order_checkbox.change(update_leaderboard, [category_selector, order_checkbox], leaderboard_table)
-        # ---------- About Tab ----------
         with gr.TabItem("ℹ️ About"):
             gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
-        # ---------- (Optional) Submit Tab ----------
-        # You can re‑enable this section when your `add_new_eval()` & REPO_ID are ready.
-        # with gr.TabItem("🚀 Submit"):
-        #     pass
-    # ---------- Citation Accordion ----------
     with gr.Accordion("📖 Citation", open=False):
-        gr.Textbox(
-            value=CITATION_BUTTON_TEXT,
-            label=CITATION_BUTTON_LABEL,
-            lines=10,
-            show_copy_button=True,
-        )
 # ---------------------------------------------------------------------------
-#  Scheduler (optional) — restart the HF Space every 30 min to free memory
 # ---------------------------------------------------------------------------
 def restart_space():
-    print(f"🔄 Restarting Space → {REPO_ID}")
-    # Example:  `HfApi().restart_space(repo_id=REPO_ID)`
 if __name__ == "__main__":
     if REPO_ID != "your/space-id":
         scheduler = BackgroundScheduler()
         scheduler.add_job(restart_space, "interval", seconds=1800)
         scheduler.start()
-        print("🗓️ Background scheduler active (30 min restart).")
-    print("🚀 Launching Gradio app…")
-    demo.launch()

 from apscheduler.schedulers.background import BackgroundScheduler
 """
+MLE‑Dojo Benchmark Leaderboard — Dark Elegance Edition
+=====================================================
+A refined, low‑glare UI with larger table text, richer surface layering, and a
+subtle neon accent that pops on dark slate backgrounds.
+HOW TO
+------
+* `pip install gradio pandas apscheduler`
+* `python mle_dojo_leaderboard_app.py`
+* Replace placeholder copy (TITLE …) with your own or keep the try/except.
 """
 # ---------------------------------------------------------------------------
+#  Import app copy (falls back to placeholders if src/ is absent)
 # ---------------------------------------------------------------------------
 try:
     from src.about import (
         CITATION_BUTTON_LABEL,
         CITATION_BUTTON_TEXT,
         INTRODUCTION_TEXT,
         LLM_BENCHMARKS_TEXT,
         TITLE,
     )
+    from src.display.css_html_js import custom_css  # optional extra rules
     from src.envs import REPO_ID
     from src.submission.submit import add_new_eval
 except ImportError:
+    # ── Placeholders ───────────────────────────────────────────────────────────
     CITATION_BUTTON_LABEL = "Citation"
     CITATION_BUTTON_TEXT  = "Please cite us if you use this benchmark…"
+    INTRODUCTION_TEXT     = "Welcome to the **MLE‑Dojo Benchmark Leaderboard** — compare LLM agents across realistic ML engineering tasks."
+    LLM_BENCHMARKS_TEXT   = "Further details about tasks, metrics and evaluation pipelines."
     TITLE = (
+        "<h1 class='hero-title gradient-text'>🏆 MLE‑Dojo Benchmark Leaderboard</h1>"
+        "<p class='subtitle'>Interactive, reproducible &amp; community‑driven ML‑agent benchmarking</p>"
     )
+    custom_css = ""
     REPO_ID = "your/space-id"
     def add_new_eval(*_):
         return "Submission placeholder."
 # ---------------------------------------------------------------------------
+#  Data
 # ---------------------------------------------------------------------------
 data = [
     {"model_name": "gpt-4o-mini",     "url": "https://openai.com/index/gpt-4o-mini-advancing-cost-efficient-intelligence/", "organizer": "OpenAI",  "license": "Proprietary", "MLE-Lite_Elo": 753,  "Tabular_Elo": 839,  "NLP_Elo": 758,  "CV_Elo": 754,  "Overall": 778},
 master_df = pd.DataFrame(data)
 # ---------------------------------------------------------------------------
+#  Helpers
 # ---------------------------------------------------------------------------
 CATEGORIES = ["Overall", "MLE-Lite", "Tabular", "NLP", "CV"]
 DEFAULT_CATEGORY = "Overall"
     "CV": "CV_Elo",
 }
 def update_leaderboard(category: str, ascending: bool):
+    col = CATEGORY_MAP.get(category, CATEGORY_MAP[DEFAULT_CATEGORY])
     df = (
+        master_df[["model_name", "url", "organizer", "license", col]]
+        .sort_values(by=col, ascending=ascending)
         .reset_index(drop=True)
     )
     df.insert(0, "Rank", df.index + 1)
+    df["Model"] = df.apply(lambda r: f"<a href='{r.url}' target='_blank'>{r.model_name}</a>", axis=1)
+    df.rename(columns={"organizer": "Organizer", "license": "License", col: "Elo Score"}, inplace=True)
     return df[["Rank", "Model", "Organizer", "License", "Elo Score"]]
 # ---------------------------------------------------------------------------
+#  Dark‑mode CSS & Larger Table Fonts
 # ---------------------------------------------------------------------------
 custom_css += """
+/* —————  Core Typography ————— */
 @import url('https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700;800&display=swap');
+html,body {
+    font-family: 'Inter', sans-serif !important;
+    font-size: 18px !important;
     line-height: 1.55;
+    color: #e2e8f0;
+    background:#0f172a;
 }
+/* Accent gradient for titles */
 .gradient-text {
+    background:linear-gradient(90deg,#6366f1 0%,#06b6d4 100%);
+    -webkit-background-clip:text; -webkit-text-fill-color:transparent;
 }
+/* Markdown headings */
+.markdown-text h2{font-weight:600;margin-top:1.3em;color:#f1f5f9;}
+/* Radio & checkbox containers */
+.gr-radio, .gr-checkbox{background:#1e293b;border-radius:8px;padding:6px 12px;box-shadow:0 1px 3px rgba(0,0,0,.4);}
+.gr-radio input:checked+label, .gr-checkbox input:checked+label{color:#38bdf8;}
+/* Table Styling */
+#leaderboard-table table{width:100%;border-collapse:collapse;background:#1e293b;border-radius:8px;overflow:hidden;}
+#leaderboard-table th{background:#334155;font-size:0.9rem;font-weight:600;padding:0.7em;color:#f1f5f9;text-transform:uppercase;letter-spacing:.04em;}
+#leaderboard-table td{padding:0.6em;font-size:1.05rem;border-top:1px solid #334155;}
+#leaderboard-table tr:nth-child(even){background:#1c2431;}
+#leaderboard-table tr:hover{background:#475569;}
 /* Links */
+a{color:#38bdf8;} a:hover{text-decoration:underline;}
+/* Accordion */
+.gr-accordion .label{font-weight:600;font-size:1rem;color:#f1f5f9;}
 """
 # ---------------------------------------------------------------------------
+#  Gradio App
 # ---------------------------------------------------------------------------
+app = gr.Blocks(css=custom_css, theme=gr.themes.Soft(primary_hue="sky", neutral_hue="slate", font=["Inter",]))
+with app:
     gr.HTML(TITLE)
     gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
     with gr.Tabs():
+        with gr.TabItem("🏅 Leaderboard"):
+            gr.Markdown("### Model Elo Rankings by Category", elem_classes="markdown-text")
             with gr.Row():
+                category_radio = gr.Radio(CATEGORIES, value=DEFAULT_CATEGORY, label="Category")
+                asc_check      = gr.Checkbox(label="⬆️ Ascending order", value=False)
+            board = gr.Dataframe(
                 value=update_leaderboard(DEFAULT_CATEGORY, False),
                 headers=["Rank", "Model", "Organizer", "License", "Elo Score"],
                 datatype=["number", "html", "str", "str", "number"],
                 interactive=False,
                 elem_id="leaderboard-table",
             )
+            category_radio.change(update_leaderboard, [category_radio, asc_check], board)
+            asc_check.change(update_leaderboard, [category_radio, asc_check], board)
         with gr.TabItem("ℹ️ About"):
             gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
     with gr.Accordion("📖 Citation", open=False):
+        gr.Textbox(value=CITATION_BUTTON_TEXT, label=CITATION_BUTTON_LABEL, lines=10, show_copy_button=True)
 # ---------------------------------------------------------------------------
+#  Optional scheduler (HF Space restarts)
 # ---------------------------------------------------------------------------
 def restart_space():
+    print(f"Restarting space → {REPO_ID}")
 if __name__ == "__main__":
     if REPO_ID != "your/space-id":
         scheduler = BackgroundScheduler()
         scheduler.add_job(restart_space, "interval", seconds=1800)
         scheduler.start()
+    print("Launching app…")
+    app.launch()