Update
Browse files
- src/display/utils.py +1 -0
- src/leaderboard/read_evals.py +1 -0
src/display/utils.py
CHANGED
@@ -29,6 +29,7 @@ auto_eval_column_dict.append(
|
|
29 |
auto_eval_column_dict.append(["model_name", ColumnContent, ColumnContent("Base Model", "markdown", True)])
|
30 |
# Scores
|
31 |
auto_eval_column_dict.append(["score", ColumnContent, ColumnContent("Score", "number", True)])
|
|
|
32 |
auto_eval_column_dict.append(["full_pass_count", ColumnContent, ColumnContent("Repaired", "number", True)])
|
33 |
auto_eval_column_dict.append(["fast_pass_count", ColumnContent, ColumnContent("Repaired (Fast)", "number", False)])
|
34 |
auto_eval_column_dict.append(["with_hint", ColumnContent, ColumnContent("Hint", "str", True)])
|
|
|
29 |
auto_eval_column_dict.append(["model_name", ColumnContent, ColumnContent("Base Model", "markdown", True)])
|
30 |
# Scores
|
31 |
auto_eval_column_dict.append(["score", ColumnContent, ColumnContent("Score", "number", True)])
|
32 |
+
auto_eval_column_dict.append(["ratio", ColumnContent, ColumnContent("Repair Rate (Repaired/Attempts %)", "number", False)])
|
33 |
auto_eval_column_dict.append(["full_pass_count", ColumnContent, ColumnContent("Repaired", "number", True)])
|
34 |
auto_eval_column_dict.append(["fast_pass_count", ColumnContent, ColumnContent("Repaired (Fast)", "number", False)])
|
35 |
auto_eval_column_dict.append(["with_hint", ColumnContent, ColumnContent("Hint", "str", True)])
|
src/leaderboard/read_evals.py
CHANGED
@@ -101,6 +101,7 @@ class EvalResult:
|
|
101 |
AutoEvalColumn.model_name.name: make_hyperlink(self.model_url, self.model_name),
|
102 |
AutoEvalColumn.with_hint.name: "w/ hint" if self.with_hint else "w/o hint",
|
103 |
AutoEvalColumn.score.name: round(self.full_pass_count * 100.0 / total_issues, 1),
|
|
|
104 |
AutoEvalColumn.attempts.name: self.attempts,
|
105 |
AutoEvalColumn.fast_pass_count.name: self.fast_pass_count,
|
106 |
AutoEvalColumn.full_pass_count.name: self.full_pass_count,
|
|
|
101 |
AutoEvalColumn.model_name.name: make_hyperlink(self.model_url, self.model_name),
|
102 |
AutoEvalColumn.with_hint.name: "w/ hint" if self.with_hint else "w/o hint",
|
103 |
AutoEvalColumn.score.name: round(self.full_pass_count * 100.0 / total_issues, 1),
|
104 |
+
AutoEvalColumn.ratio.name: round(self.full_pass_count * 100.0 / self.attempts, 1),
|
105 |
AutoEvalColumn.attempts.name: self.attempts,
|
106 |
AutoEvalColumn.fast_pass_count.name: self.fast_pass_count,
|
107 |
AutoEvalColumn.full_pass_count.name: self.full_pass_count,
|