Commit
·
ec0f651
1
Parent(s):
2402663
add
Browse files
src/leaderboard/read_evals.py
CHANGED
@@ -130,6 +130,7 @@ class EvalResult:
|
|
130 |
try:
|
131 |
data_dict[task.value.col_name] = self.results[task.value.benchmark]
|
132 |
except KeyError as e:
|
|
|
133 |
print(self.results.keys())
|
134 |
|
135 |
return data_dict
|
@@ -189,12 +190,12 @@ def get_raw_eval_results(results_path: str, requests_path: str) -> list[EvalResu
|
|
189 |
eval_results[eval_name].results.update({k: v for k, v in eval_result.results.items() if v is not None})
|
190 |
else:
|
191 |
eval_results[eval_name] = eval_result
|
192 |
-
print(eval_results)
|
193 |
|
194 |
results = []
|
195 |
for v in eval_results.values():
|
196 |
try:
|
197 |
-
|
198 |
results.append(v)
|
199 |
except KeyError as e: # not all eval values present
|
200 |
print(e)
|
|
|
130 |
try:
|
131 |
data_dict[task.value.col_name] = self.results[task.value.benchmark]
|
132 |
except KeyError as e:
|
133 |
+
print(e)
|
134 |
print(self.results.keys())
|
135 |
|
136 |
return data_dict
|
|
|
190 |
eval_results[eval_name].results.update({k: v for k, v in eval_result.results.items() if v is not None})
|
191 |
else:
|
192 |
eval_results[eval_name] = eval_result
|
193 |
+
# print(eval_results)
|
194 |
|
195 |
results = []
|
196 |
for v in eval_results.values():
|
197 |
try:
|
198 |
+
v.to_dict() # we test if the dict version is complete
|
199 |
results.append(v)
|
200 |
except KeyError as e: # not all eval values present
|
201 |
print(e)
|