Spaces:
Running
Running
benediktstroebl
committed on
Commit
·
f5fc72d
1
Parent(s):
e10e28c
Update app.py
Browse files
app.py
CHANGED
@@ -228,13 +228,13 @@ with gr.Blocks() as demo:
|
|
228 |
print(parse_json_files(os.path.join(abs_path, "evals_live"), 'mlagentbench').columns)
|
229 |
Leaderboard(
|
230 |
value=parse_json_files(os.path.join(abs_path, "evals_live"), 'usaco'),
|
231 |
-
|
232 |
-
|
233 |
-
|
234 |
-
|
235 |
-
|
236 |
-
|
237 |
-
|
238 |
)
|
239 |
with gr.Row():
|
240 |
scatter_plot = gr.Plot(create_scatter_plot(parse_json_files(os.path.join(abs_path, "evals_live"), 'usaco'), "Total Cost", "Accuracy", "Total Cost (in USD)", "Accuracy", ["Agent Name"]))
|
@@ -363,7 +363,7 @@ with gr.Blocks() as demo:
|
|
363 |
label="Select Columns to Display:",
|
364 |
),
|
365 |
hide_columns=config.SWEBENCH_HIDE_COLUMNS,
|
366 |
-
|
367 |
)
|
368 |
with gr.Row():
|
369 |
scatter_plot = gr.Plot(create_scatter_plot(parse_json_files(os.path.join(abs_path, "evals_live"), 'swebench_verified'), "Total Cost", "Accuracy", "Total Cost (in USD)", "Accuracy", ["Agent Name"]))
|
@@ -490,7 +490,7 @@ with gr.Blocks() as demo:
|
|
490 |
cant_deselect=["Agent Name"],
|
491 |
label="Select Columns to Display:",
|
492 |
),
|
493 |
-
|
494 |
hide_columns=config.SWEBENCH_HIDE_COLUMNS
|
495 |
)
|
496 |
with gr.Row():
|
@@ -618,7 +618,7 @@ with gr.Blocks() as demo:
|
|
618 |
cant_deselect=["Agent Name"],
|
619 |
label="Select Columns to Display:",
|
620 |
),
|
621 |
-
|
622 |
hide_columns=config.MLAGENTBENCH_HIDE_COLUMNS,
|
623 |
)
|
624 |
with gr.Row():
|
|
|
228 |
print(parse_json_files(os.path.join(abs_path, "evals_live"), 'mlagentbench').columns)
|
229 |
Leaderboard(
|
230 |
value=parse_json_files(os.path.join(abs_path, "evals_live"), 'usaco'),
|
231 |
+
select_columns=SelectColumns(
|
232 |
+
default_selection=config.USACO_ON_LOAD_COLUMNS + ["Verified"],
|
233 |
+
cant_deselect=["Agent Name"],
|
234 |
+
label="Select Columns to Display:",
|
235 |
+
),
|
236 |
+
hide_columns=config.USACO_HIDE_COLUMNS,
|
237 |
+
search_columns=config.USACO_SEARCH_COLUMNS,
|
238 |
)
|
239 |
with gr.Row():
|
240 |
scatter_plot = gr.Plot(create_scatter_plot(parse_json_files(os.path.join(abs_path, "evals_live"), 'usaco'), "Total Cost", "Accuracy", "Total Cost (in USD)", "Accuracy", ["Agent Name"]))
|
|
|
363 |
label="Select Columns to Display:",
|
364 |
),
|
365 |
hide_columns=config.SWEBENCH_HIDE_COLUMNS,
|
366 |
+
search_columns=config.SWEBENCH_SEARCH_COLUMNS
|
367 |
)
|
368 |
with gr.Row():
|
369 |
scatter_plot = gr.Plot(create_scatter_plot(parse_json_files(os.path.join(abs_path, "evals_live"), 'swebench_verified'), "Total Cost", "Accuracy", "Total Cost (in USD)", "Accuracy", ["Agent Name"]))
|
|
|
490 |
cant_deselect=["Agent Name"],
|
491 |
label="Select Columns to Display:",
|
492 |
),
|
493 |
+
search_columns=config.SWEBENCH_SEARCH_COLUMNS,
|
494 |
hide_columns=config.SWEBENCH_HIDE_COLUMNS
|
495 |
)
|
496 |
with gr.Row():
|
|
|
618 |
cant_deselect=["Agent Name"],
|
619 |
label="Select Columns to Display:",
|
620 |
),
|
621 |
+
search_columns=config.MLAGENTBENCH_SEARCH_COLUMNS,
|
622 |
hide_columns=config.MLAGENTBENCH_HIDE_COLUMNS,
|
623 |
)
|
624 |
with gr.Row():
|