Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -143,7 +143,7 @@ with gr.Blocks(css=CSS) as demo:
|
|
143 |
]
|
144 |
)
|
145 |
|
146 |
-
|
147 |
action_components['eval_button'].click(
|
148 |
fn=start_evaluation,
|
149 |
inputs=[evaluation_state],
|
@@ -189,10 +189,11 @@ with gr.Blocks(css=CSS) as demo:
|
|
189 |
model_components['model2_shots'],
|
190 |
model_components['model2_regex'],
|
191 |
model_components['model2_flash_attn']
|
192 |
-
]
|
|
|
193 |
).then(
|
194 |
fn=handle_evaluation_results,
|
195 |
-
inputs=[], #
|
196 |
outputs=[
|
197 |
results_components['output'],
|
198 |
results_components['table'],
|
|
|
143 |
]
|
144 |
)
|
145 |
|
146 |
+
# Connect evaluation button with state tracking
|
147 |
action_components['eval_button'].click(
|
148 |
fn=start_evaluation,
|
149 |
inputs=[evaluation_state],
|
|
|
189 |
model_components['model2_shots'],
|
190 |
model_components['model2_regex'],
|
191 |
model_components['model2_flash_attn']
|
192 |
+
],
|
193 |
+
outputs=results_components['output'] # Change: Only pass 1 output to match the dictionary from run_mmlu_evaluation
|
194 |
).then(
|
195 |
fn=handle_evaluation_results,
|
196 |
+
inputs=[results_components['output']], # Change: Pass the dictionary to handle_evaluation_results
|
197 |
outputs=[
|
198 |
results_components['output'],
|
199 |
results_components['table'],
|