Spaces:
Running
Running
lixuejing
committed on
Commit
·
70172bf
1
Parent(s):
ff262aa
update
Browse files
src/leaderboard/read_evals.py
CHANGED
@@ -92,12 +92,13 @@ class EvalResult:
|
|
92 |
for k, v in data["results"].items():
|
93 |
print("k,v,benchmark,metic",k,v, task.benchmark,task.metric)
|
94 |
if task.benchmark == k:
|
95 |
-
print(v.get(task.metric, None))
|
96 |
print("accs", accs)
|
97 |
if accs.size == 0 or any([acc is None for acc in accs]):
|
98 |
continue
|
99 |
|
100 |
mean_acc = np.mean(accs) if len(accs) > 0 else 0
|
|
|
101 |
results[task.metric] = mean_acc
|
102 |
|
103 |
return self(
|
@@ -183,14 +184,14 @@ class EvalResult:
|
|
183 |
data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.benchmark, 0)
|
184 |
|
185 |
for task in Quotas:
|
186 |
-
#data_dict[task.value.col_name] = self.results.get(task.value.
|
187 |
if task.value.col_name != "CLCC-H":
|
188 |
-
data_dict[task.value.col_name] = self.results.get(task.value.
|
189 |
else:
|
190 |
if self.results.get(task.value.metric, 0) == 0:
|
191 |
data_dict[task.value.col_name] = "-"
|
192 |
else:
|
193 |
-
data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.
|
194 |
|
195 |
return data_dict
|
196 |
|
|
|
92 |
for k, v in data["results"].items():
|
93 |
print("k,v,benchmark,metic",k,v, task.benchmark,task.metric)
|
94 |
if task.benchmark == k:
|
95 |
+
print("task.benchmark == k get metic",v.get(task.metric, None))
|
96 |
print("accs", accs)
|
97 |
if accs.size == 0 or any([acc is None for acc in accs]):
|
98 |
continue
|
99 |
|
100 |
mean_acc = np.mean(accs) if len(accs) > 0 else 0
|
101 |
+
print("mean_acc", task.metric, mean_acc)
|
102 |
results[task.metric] = mean_acc
|
103 |
|
104 |
return self(
|
|
|
184 |
data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.benchmark, 0)
|
185 |
|
186 |
for task in Quotas:
|
187 |
+
#data_dict[task.value.col_name] = self.results.get(task.value.metric, 0)
|
188 |
if task.value.col_name != "CLCC-H":
|
189 |
+
data_dict[task.value.col_name] = self.results.get(task.value.metric, 0)
|
190 |
else:
|
191 |
if self.results.get(task.value.metric, 0) == 0:
|
192 |
data_dict[task.value.col_name] = "-"
|
193 |
else:
|
194 |
+
data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.metric, 0)
|
195 |
|
196 |
return data_dict
|
197 |
|