Spaces:
Running
Running
jasonshaoshun
committed on
Commit
·
2490332
1
Parent(s):
b7ce23f
debug
Browse files
- src/leaderboard/read_evals.py +16 -15
src/leaderboard/read_evals.py
CHANGED
@@ -141,22 +141,23 @@ class EvalResult_MIB_SUBGRAPH:
|
|
141 |
all_scores.append(score)
|
142 |
|
143 |
# All entries must be present for average
|
144 |
-
required_entries = [
|
145 |
-
|
146 |
-
|
147 |
-
|
148 |
-
|
149 |
-
|
150 |
-
|
151 |
-
|
152 |
-
|
153 |
-
|
154 |
-
|
155 |
-
|
156 |
-
|
157 |
-
]
|
158 |
|
159 |
-
data_dict["Average"] = round(np.mean(all_scores), 2) if all(required_entries) else '-'
|
|
|
160 |
return data_dict
|
161 |
|
162 |
|
|
|
141 |
all_scores.append(score)
|
142 |
|
143 |
# All entries must be present for average
|
144 |
+
# required_entries = [
|
145 |
+
# data_dict['ioi_llama3'] != '-',
|
146 |
+
# data_dict['ioi_qwen2_5'] != '-',
|
147 |
+
# data_dict['ioi_gpt2'] != '-',
|
148 |
+
# data_dict['ioi_gemma2'] != '-',
|
149 |
+
# data_dict['mcqa_llama3'] != '-',
|
150 |
+
# data_dict['mcqa_qwen2_5'] != '-',
|
151 |
+
# data_dict['mcqa_gemma2'] != '-',
|
152 |
+
# data_dict['arithmetic_addition_llama3'] != '-',
|
153 |
+
# data_dict['arithmetic_subtraction_llama3'] != '-',
|
154 |
+
# data_dict['arc_easy_gemma2'] != '-',
|
155 |
+
# data_dict['arc_easy_llama3'] != '-',
|
156 |
+
# data_dict['arc_challenge_llama3'] != '-'
|
157 |
+
# ]
|
158 |
|
159 |
+
# data_dict["Average"] = round(np.mean(all_scores), 2) if all(required_entries) else '-'
|
160 |
+
data_dict["Average"] = round(np.mean(all_scores), 2) if '-' not in data_dict.values() else '-'
|
161 |
return data_dict
|
162 |
|
163 |
|