Update app.py
Browse files
app.py
CHANGED
|
@@ -523,71 +523,71 @@ with main_block as demo:
|
|
| 523 |
outputs=[task_id_output, code_completion, nl_instruction, test_cases, count_output, index_slider]
|
| 524 |
)
|
| 525 |
|
| 526 |
-
|
| 527 |
-
|
| 528 |
-
### Hard Set Ground Truth Pass Rate: 100%
|
| 529 |
-
### Full Set Ground Truth Pass Rate: 99.6%
|
| 530 |
-
|
| 531 |
-
### Note: The code execution session is no longer maintained. Please `pip install -U bigcodebench` and refer to [BigCodeBench Repository](https://github.com/bigcode-project/bigcodebench).
|
| 532 |
-
""")
|
| 533 |
-
|
| 534 |
-
|
| 535 |
-
|
| 536 |
-
|
| 537 |
|
| 538 |
-
|
| 539 |
-
|
| 540 |
-
|
| 541 |
-
|
| 542 |
|
| 543 |
-
|
| 544 |
-
|
| 545 |
-
|
| 546 |
-
|
| 547 |
-
|
| 548 |
|
| 549 |
-
|
| 550 |
-
|
| 551 |
-
|
| 552 |
-
|
| 553 |
-
|
| 554 |
|
| 555 |
-
|
| 556 |
-
|
| 557 |
-
|
| 558 |
-
|
| 559 |
-
|
| 560 |
|
| 561 |
-
|
| 562 |
-
|
| 563 |
|
| 564 |
|
| 565 |
-
|
| 566 |
-
|
| 567 |
-
|
| 568 |
-
|
| 569 |
-
|
| 570 |
-
|
| 571 |
-
|
| 572 |
-
|
| 573 |
-
|
| 574 |
-
|
| 575 |
-
|
| 576 |
-
|
| 577 |
-
|
| 578 |
-
|
| 579 |
-
|
| 580 |
-
|
| 581 |
-
|
| 582 |
-
|
| 583 |
-
|
| 584 |
-
|
| 585 |
-
|
| 586 |
-
|
| 587 |
|
| 588 |
-
|
| 589 |
-
|
| 590 |
-
|
| 591 |
|
| 592 |
with gr.TabItem("🚀 Request", id=4):
|
| 593 |
gr.Markdown(SUBMISSION_TEXT_3)
|
|
|
|
| 523 |
outputs=[task_id_output, code_completion, nl_instruction, test_cases, count_output, index_slider]
|
| 524 |
)
|
| 525 |
|
| 526 |
+
# with gr.TabItem("🛠️ Code Execution (Beta)", id=5):
|
| 527 |
+
# gr.Markdown("""\
|
| 528 |
+
# ### Hard Set Ground Truth Pass Rate: 100%
|
| 529 |
+
# ### Full Set Ground Truth Pass Rate: 99.6%
|
| 530 |
+
|
| 531 |
+
# ### Note: The code execution session is no longer maintained. Please `pip install -U bigcodebench` and refer to [BigCodeBench Repository](https://github.com/bigcode-project/bigcodebench).
|
| 532 |
+
# """)
|
| 533 |
+
# with gr.Row():
|
| 534 |
+
# jsonl_file = gr.File(label="Upload JSONL file", file_types=[".jsonl"])
|
| 535 |
+
# split = gr.Dropdown(choices=["complete", "instruct"], label="Split", value="complete")
|
| 536 |
+
# subset = gr.Dropdown(choices=["hard", "full"], label="Subset", value="hard")
|
| 537 |
|
| 538 |
+
# with gr.Row():
|
| 539 |
+
# parallel = gr.Number(label="Parallel (optional)", precision=0)
|
| 540 |
+
# min_time_limit = gr.Number(label="Min Time Limit", value=1, precision=1)
|
| 541 |
+
# max_as_limit = gr.Number(label="Max AS Limit", value=25*1024, precision=0)
|
| 542 |
|
| 543 |
+
# with gr.Row():
|
| 544 |
+
# max_data_limit = gr.Number(label="Max Data Limit", value=25*1024, precision=0)
|
| 545 |
+
# max_stack_limit = gr.Number(label="Max Stack Limit", value=10, precision=0)
|
| 546 |
+
# check_gt_only = gr.Checkbox(label="Check GT Only", value=False, visible=False)
|
| 547 |
+
# no_gt = gr.Checkbox(label="No GT", value=False, visible=False)
|
| 548 |
|
| 549 |
+
# command_output = gr.Textbox(label="Command", value=default_command, interactive=False)
|
| 550 |
+
# with gr.Row():
|
| 551 |
+
# submit_btn = gr.Button("Run Evaluation")
|
| 552 |
+
# download_btn = gr.DownloadButton(label="Download Result", visible=False)
|
| 553 |
+
# log_output = gr.Textbox(label="Execution Logs", lines=20)
|
| 554 |
|
| 555 |
+
# input_components = [
|
| 556 |
+
# jsonl_file, split, subset, parallel,
|
| 557 |
+
# min_time_limit, max_as_limit, max_data_limit, max_stack_limit,
|
| 558 |
+
# check_gt_only, no_gt
|
| 559 |
+
# ]
|
| 560 |
|
| 561 |
+
# for component in input_components:
|
| 562 |
+
# component.change(generate_command, inputs=input_components, outputs=command_output)
|
| 563 |
|
| 564 |
|
| 565 |
+
# def start_evaluation(command, jsonl_file, subset, split):
|
| 566 |
+
# lock.acquire()
|
| 567 |
+
# if jsonl_file is not None:
|
| 568 |
+
# result_path = os.path.basename(jsonl_file.name).replace(".jsonl", "_eval_results.json")
|
| 569 |
+
# else:
|
| 570 |
+
# result_path = None
|
| 571 |
+
|
| 572 |
+
# for log in stream_logs(command, jsonl_file):
|
| 573 |
+
# if jsonl_file is not None and jsonl_file.name.endswith(".jsonl"):
|
| 574 |
+
# yield log, gr.update(value=result_path, label=result_path, visible=True), gr.update(visible=False)
|
| 575 |
+
# else:
|
| 576 |
+
# yield log, gr.update(), gr.update()
|
| 577 |
+
# lock.release()
|
| 578 |
+
# result_file = find_result_file()
|
| 579 |
+
# if result_file:
|
| 580 |
+
# return gr.update(label="Evaluation completed. Result file found."), gr.update(value=result_file)
|
| 581 |
+
# # gr.Button(visible=False)#,
|
| 582 |
+
# # gr.DownloadButton(label="Download Result", value=result_file, visible=True))
|
| 583 |
+
# else:
|
| 584 |
+
# return gr.update(label="Evaluation completed. No result file found."), gr.update(value=result_path)
|
| 585 |
+
# # gr.Button("Run Evaluation", visible=True),
|
| 586 |
+
# # gr.DownloadButton(visible=False))
|
| 587 |
|
| 588 |
+
# submit_btn.click(start_evaluation,
|
| 589 |
+
# inputs=[command_output, jsonl_file, subset, split],
|
| 590 |
+
# outputs=[log_output, download_btn, submit_btn])
|
| 591 |
|
| 592 |
with gr.TabItem("🚀 Request", id=4):
|
| 593 |
gr.Markdown(SUBMISSION_TEXT_3)
|