Spaces:
Runtime error
Runtime error
jasonshaoshun
committed on
Commit
·
55ba7bd
1
Parent(s):
eaedb33
debug
Browse files
- src/leaderboard/read_evals.py +26 -10
src/leaderboard/read_evals.py
CHANGED
@@ -286,10 +286,30 @@ class EvalResult_MIB_CAUSALGRAPH:
|
|
286 |
|
287 |
# return data_dict
|
288 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
289 |
def to_dict(self):
|
290 |
"""Converts the Eval Result to a dict for dataframe display"""
|
291 |
-
print(f"Results in to_dict: {self.results}") # Debug print
|
292 |
-
|
293 |
data_dict = {
|
294 |
"eval_name": self.eval_name,
|
295 |
"Method": self.method_name,
|
@@ -298,14 +318,10 @@ class EvalResult_MIB_CAUSALGRAPH:
|
|
298 |
# Process each model's results
|
299 |
for model_id, scores in self.results.items():
|
300 |
model_name = model_id.lower()
|
301 |
-
|
302 |
-
|
303 |
-
|
304 |
-
|
305 |
-
|
306 |
-
for intervention_data in intervention_scores:
|
307 |
-
col_name = f"{model_name}_layer{layer}_{intervention_data['intervention']}".lower()
|
308 |
-
data_dict[col_name] = intervention_data['score']
|
309 |
|
310 |
return data_dict
|
311 |
|
|
|
286 |
|
287 |
# return data_dict
|
288 |
|
289 |
+
# def to_dict(self):
|
290 |
+
# """Converts the Eval Result to a dict for dataframe display"""
|
291 |
+
# print(f"Results in to_dict: {self.results}") # Debug print
|
292 |
+
|
293 |
+
# data_dict = {
|
294 |
+
# "eval_name": self.eval_name,
|
295 |
+
# "Method": self.method_name,
|
296 |
+
# }
|
297 |
+
|
298 |
+
# # Process each model's results
|
299 |
+
# for model_id, scores in self.results.items():
|
300 |
+
# model_name = model_id.lower()
|
301 |
+
# for task, layer_scores in scores.items():
|
302 |
+
# for layer_data in layer_scores:
|
303 |
+
# layer = layer_data.get("layer")
|
304 |
+
# intervention_scores = layer_data.get("scores", [])
|
305 |
+
|
306 |
+
# for intervention_data in intervention_scores:
|
307 |
+
# col_name = f"{model_name}_layer{layer}_{intervention_data['intervention']}".lower()
|
308 |
+
# data_dict[col_name] = intervention_data['score']
|
309 |
+
|
310 |
+
# return data_dict
|
311 |
def to_dict(self):
|
312 |
"""Converts the Eval Result to a dict for dataframe display"""
|
|
|
|
|
313 |
data_dict = {
|
314 |
"eval_name": self.eval_name,
|
315 |
"Method": self.method_name,
|
|
|
318 |
# Process each model's results
|
319 |
for model_id, scores in self.results.items():
|
320 |
model_name = model_id.lower()
|
321 |
+
# The scores are already in the format we want
|
322 |
+
for key, value in scores.items():
|
323 |
+
col_name = f"{model_name}_{key}"
|
324 |
+
data_dict[col_name] = value
|
|
|
|
|
|
|
|
|
325 |
|
326 |
return data_dict
|
327 |
|