Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Update src/leaderboard/read_evals.py
Browse files
src/leaderboard/read_evals.py
CHANGED
@@ -73,10 +73,8 @@ class EvalResult:
|
|
73 |
|
74 |
scores = data["scores"]
|
75 |
results = {}
|
76 |
-
for
|
77 |
-
|
78 |
-
if task_value.metric in scores:
|
79 |
-
results[task_value.benchmark] = Decimal(scores[task_value.metric])
|
80 |
|
81 |
|
82 |
return self(
|
@@ -109,7 +107,6 @@ class EvalResult:
|
|
109 |
|
110 |
def to_dict(self):
|
111 |
"""Converts the Eval Result to a dict compatible with our dataframe display"""
|
112 |
-
average = sum([v for v in self.results.values() if v is not None]) / len(Tasks)
|
113 |
data_dict = {
|
114 |
"eval_name": self.eval_name, # not a column, just a save name,
|
115 |
AutoEvalColumn.precision.name: self.precision.value.name,
|
@@ -127,8 +124,8 @@ class EvalResult:
|
|
127 |
}
|
128 |
|
129 |
for task in Tasks:
|
130 |
-
|
131 |
-
data_dict[
|
132 |
|
133 |
return data_dict
|
134 |
|
|
|
73 |
|
74 |
scores = data["scores"]
|
75 |
results = {}
|
76 |
+
for key, value in scores.items():
|
77 |
+
results[key] = Decimal(value)
|
|
|
|
|
78 |
|
79 |
|
80 |
return self(
|
|
|
107 |
|
108 |
def to_dict(self):
|
109 |
"""Converts the Eval Result to a dict compatible with our dataframe display"""
|
|
|
110 |
data_dict = {
|
111 |
"eval_name": self.eval_name, # not a column, just a save name,
|
112 |
AutoEvalColumn.precision.name: self.precision.value.name,
|
|
|
124 |
}
|
125 |
|
126 |
for task in Tasks:
|
127 |
+
task_value = task.value
|
128 |
+
data_dict[task_value.col_name] = self.results[task_value.metric]
|
129 |
|
130 |
return data_dict
|
131 |
|