jasonshaoshun committed on
Commit
ea7f09a
·
1 Parent(s): 2490332
src/display/utils.py CHANGED
@@ -157,9 +157,6 @@ for field in auto_eval_column_dict_mib_subgraph:
157
 
158
 
159
 
160
-
161
-
162
-
163
  # Create the dataclass for MIB columns
164
  AutoEvalColumn_mib_subgraph = make_dataclass("AutoEvalColumn_mib_subgraph", auto_eval_column_dict_mib_subgraph, frozen=True)
165
 
 
157
 
158
 
159
 
 
 
 
160
  # Create the dataclass for MIB columns
161
  AutoEvalColumn_mib_subgraph = make_dataclass("AutoEvalColumn_mib_subgraph", auto_eval_column_dict_mib_subgraph, frozen=True)
162
 
src/leaderboard/read_evals.py CHANGED
@@ -110,7 +110,7 @@ class EvalResult_MIB_SUBGRAPH:
110
  expected_models = TasksMib_Subgraph.get_all_models()
111
  expected_tasks = TasksMib_Subgraph.get_all_tasks()
112
  for task in expected_tasks:
113
- for model in expected_models:
114
  # if model == "gpt2" and task != "ioi":
115
  # continue
116
  # if model == "qwen2_5" and task.startswith(("arithmetic", "arc")):
 
110
  expected_models = TasksMib_Subgraph.get_all_models()
111
  expected_tasks = TasksMib_Subgraph.get_all_tasks()
112
  for task in expected_tasks:
113
+ for model in task.value.models:
114
  # if model == "gpt2" and task != "ioi":
115
  # continue
116
  # if model == "qwen2_5" and task.startswith(("arithmetic", "arc")):