lixuejing committed on
Commit
70172bf
·
1 Parent(s): ff262aa
Files changed (1) hide show
  1. src/leaderboard/read_evals.py +5 -4
src/leaderboard/read_evals.py CHANGED
@@ -92,12 +92,13 @@ class EvalResult:
92
  for k, v in data["results"].items():
93
  print("k,v,benchmark,metic",k,v, task.benchmark,task.metric)
94
  if task.benchmark == k:
95
- print(v.get(task.metric, None))
96
  print("accs", accs)
97
  if accs.size == 0 or any([acc is None for acc in accs]):
98
  continue
99
 
100
  mean_acc = np.mean(accs) if len(accs) > 0 else 0
 
101
  results[task.metric] = mean_acc
102
 
103
  return self(
@@ -183,14 +184,14 @@ class EvalResult:
183
  data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.benchmark, 0)
184
 
185
  for task in Quotas:
186
- #data_dict[task.value.col_name] = self.results.get(task.value.benchmark, 0)
187
  if task.value.col_name != "CLCC-H":
188
- data_dict[task.value.col_name] = self.results.get(task.value.benchmark, 0)
189
  else:
190
  if self.results.get(task.value.metric, 0) == 0:
191
  data_dict[task.value.col_name] = "-"
192
  else:
193
- data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.benchmark, 0)
194
 
195
  return data_dict
196
 
 
92
  for k, v in data["results"].items():
93
  print("k,v,benchmark,metic",k,v, task.benchmark,task.metric)
94
  if task.benchmark == k:
95
+ print("task.benchmark == k get metic",v.get(task.metric, None))
96
  print("accs", accs)
97
  if accs.size == 0 or any([acc is None for acc in accs]):
98
  continue
99
 
100
  mean_acc = np.mean(accs) if len(accs) > 0 else 0
101
+ print("mean_acc", task.metric, mean_acc)
102
  results[task.metric] = mean_acc
103
 
104
  return self(
 
184
  data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.benchmark, 0)
185
 
186
  for task in Quotas:
187
+ #data_dict[task.value.col_name] = self.results.get(task.value.metric, 0)
188
  if task.value.col_name != "CLCC-H":
189
+ data_dict[task.value.col_name] = self.results.get(task.value.metric, 0)
190
  else:
191
  if self.results.get(task.value.metric, 0) == 0:
192
  data_dict[task.value.col_name] = "-"
193
  else:
194
+ data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.metric, 0)
195
 
196
  return data_dict
197