Spaces:

kostis-init
/

CP-Bench-Leaderboard

Running

kostis-init committed on Aug 8

Commit

133e122

1 Parent(s): 15c4da2

Fix counting of submitted models that also exist in the ground truth

Files changed (1) hide show

src/user_eval.py CHANGED Viewed

@@ -258,9 +258,12 @@ def evaluate_submission(submitted_models, summary_file_path, modelling_framw, to
         # Iterate through downloaded submitted models
         for submitted_model in tqdm(submitted_models):
             curr_model = submitted_model[GT_MODEL_CODE_COLUMN]
             total_submitted_models += 1
-            problem_name = submitted_model[GT_PROBLEM_NAME_COLUMN]
             print(f"\n  Processing model: {problem_name}", flush=True)
             summary_f.write(f"\n--- Model: {problem_name} ---\n")
@@ -299,7 +302,6 @@ def evaluate_submission(submitted_models, summary_file_path, modelling_framw, to
             summary_f.write("    3. Performing self-consistency check on ground-truth model...\n")
             modified_gt_script = get_modified_script(ground_truth_script_content, generated_solution)
-            total_submitted_models_that_also_exist_in_gt += 1
             try:
                 with tempfile.NamedTemporaryFile(mode='w', suffix='.py', delete=False, encoding='utf-8',
                                                  dir=top_lvl_temp_dir) as tmp_file:

         # Iterate through downloaded submitted models
         for submitted_model in tqdm(submitted_models):
             curr_model = submitted_model[GT_MODEL_CODE_COLUMN]
+            problem_name = submitted_model[GT_PROBLEM_NAME_COLUMN]
             total_submitted_models += 1
+            if problem_name in ground_truth_models:
+                total_submitted_models_that_also_exist_in_gt += 1
             print(f"\n  Processing model: {problem_name}", flush=True)
             summary_f.write(f"\n--- Model: {problem_name} ---\n")
             summary_f.write("    3. Performing self-consistency check on ground-truth model...\n")
             modified_gt_script = get_modified_script(ground_truth_script_content, generated_solution)
             try:
                 with tempfile.NamedTemporaryFile(mode='w', suffix='.py', delete=False, encoding='utf-8',
                                                  dir=top_lvl_temp_dir) as tmp_file: