Spaces:
Running
Running
lixuejing
committed on
Commit
·
56d2f27
1
Parent(s):
654e2b1
update
Browse files
src/leaderboard/read_evals.py
CHANGED
@@ -88,6 +88,12 @@ class EvalResult:
|
|
88 |
print("task", task, "task.metric",task.metric, "task.benchmark", task.benchmark)
|
89 |
# We average all scores of a given metric (not all metrics are present in all files)
|
90 |
accs = np.array([v.get(task.metric, None) for k, v in data["results"].items() if task.benchmark == k])
|
|
|
|
|
|
|
|
|
|
|
|
|
91 |
if accs.size == 0 or any([acc is None for acc in accs]):
|
92 |
continue
|
93 |
|
|
|
88 |
print("task", task, "task.metric",task.metric, "task.benchmark", task.benchmark)
|
89 |
# We average all scores of a given metric (not all metrics are present in all files)
|
90 |
accs = np.array([v.get(task.metric, None) for k, v in data["results"].items() if task.benchmark == k])
|
91 |
+
|
92 |
+
for k, v in data["results"].items():
|
93 |
+
print("k,v,benchmark,metic",k,v, task.benchmark,task.metric)
|
94 |
+
if task.benchmark == k:
|
95 |
+
print(v.get(task.metric, None))
|
96 |
+
print("accs", accs)
|
97 |
if accs.size == 0 or any([acc is None for acc in accs]):
|
98 |
continue
|
99 |
|