dtcxzyw committed on
Commit
d7f5feb
·
unverified ·
1 Parent(s): 58e7ea9
src/display/utils.py CHANGED
@@ -29,6 +29,7 @@ auto_eval_column_dict.append(
29
  auto_eval_column_dict.append(["model_name", ColumnContent, ColumnContent("Base Model", "markdown", True)])
30
  # Scores
31
  auto_eval_column_dict.append(["score", ColumnContent, ColumnContent("Score", "number", True)])
 
32
  auto_eval_column_dict.append(["full_pass_count", ColumnContent, ColumnContent("Repaired", "number", True)])
33
  auto_eval_column_dict.append(["fast_pass_count", ColumnContent, ColumnContent("Repaired (Fast)", "number", False)])
34
  auto_eval_column_dict.append(["with_hint", ColumnContent, ColumnContent("Hint", "str", True)])
 
29
  auto_eval_column_dict.append(["model_name", ColumnContent, ColumnContent("Base Model", "markdown", True)])
30
  # Scores
31
  auto_eval_column_dict.append(["score", ColumnContent, ColumnContent("Score", "number", True)])
32
+ auto_eval_column_dict.append(["ratio", ColumnContent, ColumnContent("Repair Rate (Repaired/Attempts %)", "number", False)])
33
  auto_eval_column_dict.append(["full_pass_count", ColumnContent, ColumnContent("Repaired", "number", True)])
34
  auto_eval_column_dict.append(["fast_pass_count", ColumnContent, ColumnContent("Repaired (Fast)", "number", False)])
35
  auto_eval_column_dict.append(["with_hint", ColumnContent, ColumnContent("Hint", "str", True)])
src/leaderboard/read_evals.py CHANGED
@@ -101,6 +101,7 @@ class EvalResult:
101
  AutoEvalColumn.model_name.name: make_hyperlink(self.model_url, self.model_name),
102
  AutoEvalColumn.with_hint.name: "w/ hint" if self.with_hint else "w/o hint",
103
  AutoEvalColumn.score.name: round(self.full_pass_count * 100.0 / total_issues, 1),
 
104
  AutoEvalColumn.attempts.name: self.attempts,
105
  AutoEvalColumn.fast_pass_count.name: self.fast_pass_count,
106
  AutoEvalColumn.full_pass_count.name: self.full_pass_count,
 
101
  AutoEvalColumn.model_name.name: make_hyperlink(self.model_url, self.model_name),
102
  AutoEvalColumn.with_hint.name: "w/ hint" if self.with_hint else "w/o hint",
103
  AutoEvalColumn.score.name: round(self.full_pass_count * 100.0 / total_issues, 1),
104
+ AutoEvalColumn.ratio.name: round(self.full_pass_count * 100.0 / self.attempts, 1),
105
  AutoEvalColumn.attempts.name: self.attempts,
106
  AutoEvalColumn.fast_pass_count.name: self.fast_pass_count,
107
  AutoEvalColumn.full_pass_count.name: self.full_pass_count,