Spaces:
Running
Running
jasonshaoshun
committed on
Commit
·
ea7f09a
1
Parent(s):
2490332
debug
Browse files
- src/display/utils.py +0 -3
- src/leaderboard/read_evals.py +1 -1
src/display/utils.py
CHANGED
@@ -157,9 +157,6 @@ for field in auto_eval_column_dict_mib_subgraph:
|
|
157 |
|
158 |
|
159 |
|
160 |
-
|
161 |
-
|
162 |
-
|
163 |
# Create the dataclass for MIB columns
|
164 |
AutoEvalColumn_mib_subgraph = make_dataclass("AutoEvalColumn_mib_subgraph", auto_eval_column_dict_mib_subgraph, frozen=True)
|
165 |
|
|
|
157 |
|
158 |
|
159 |
|
|
|
|
|
|
|
160 |
# Create the dataclass for MIB columns
|
161 |
AutoEvalColumn_mib_subgraph = make_dataclass("AutoEvalColumn_mib_subgraph", auto_eval_column_dict_mib_subgraph, frozen=True)
|
162 |
|
src/leaderboard/read_evals.py
CHANGED
@@ -110,7 +110,7 @@ class EvalResult_MIB_SUBGRAPH:
|
|
110 |
expected_models = TasksMib_Subgraph.get_all_models()
|
111 |
expected_tasks = TasksMib_Subgraph.get_all_tasks()
|
112 |
for task in expected_tasks:
|
113 |
-
for model in
|
114 |
# if model == "gpt2" and task != "ioi":
|
115 |
# continue
|
116 |
# if model == "qwen2_5" and task.startswith(("arithmetic", "arc")):
|
|
|
110 |
expected_models = TasksMib_Subgraph.get_all_models()
|
111 |
expected_tasks = TasksMib_Subgraph.get_all_tasks()
|
112 |
for task in expected_tasks:
|
113 |
+
for model in task.value.models::
|
114 |
# if model == "gpt2" and task != "ioi":
|
115 |
# continue
|
116 |
# if model == "qwen2_5" and task.startswith(("arithmetic", "arc")):
|