Spaces:

bigcode
/

bigcodebench-evaluator

Running on CPU Upgrade

App Files Files Community

Terry Zhuo committed on Aug 12

Commit

5729010

•

1 Parent(s): b64230f

update

Browse files

Files changed (1) hide show

app.py +52 -52

app.py CHANGED Viewed

@@ -512,66 +512,66 @@ with main_block as demo:
         with gr.TabItem("🚀 Request", id=4):
             gr.Markdown(SUBMISSION_TEXT_3)
-        # with gr.TabItem("🛠️ Execute", id=5):
-        #     gr.Markdown("# BigCodeBench Evaluator")
-        #     with gr.Row():
-        #         jsonl_file = gr.File(label="Upload JSONL file", file_types=[".jsonl"])
-        #         split = gr.Dropdown(choices=["complete", "instruct"], label="Split", value="complete")
-        #         subset = gr.Dropdown(choices=["hard"], label="Subset", value="hard")
-        #     with gr.Row():
-        #         parallel = gr.Number(label="Parallel (optional)", precision=0)
-        #         min_time_limit = gr.Number(label="Min Time Limit", value=1, precision=1)
-        #         max_as_limit = gr.Number(label="Max AS Limit", value=25*1024, precision=0)
-        #     with gr.Row():
-        #         max_data_limit = gr.Number(label="Max Data Limit", value=25*1024, precision=0)
-        #         max_stack_limit = gr.Number(label="Max Stack Limit", value=10, precision=0)
-        #         check_gt_only = gr.Checkbox(label="Check GT Only")
-        #         no_gt = gr.Checkbox(label="No GT")
-        #     command_output = gr.Textbox(label="Command", value=default_command, interactive=False)
-        #     with gr.Row():
-        #         submit_btn = gr.Button("Run Evaluation")
-        #         download_btn = gr.DownloadButton(label="Download Result")
-        #     log_output = gr.Textbox(label="Execution Logs", lines=20)
-        #     input_components = [
-        #         jsonl_file, split, subset, parallel,
-        #         min_time_limit, max_as_limit, max_data_limit, max_stack_limit,
-        #         check_gt_only, no_gt
-        #     ]
-        #     for component in input_components:
-        #         component.change(generate_command, inputs=input_components, outputs=command_output)
-        #     def start_evaluation(command, jsonl_file, subset, split):
-        #         extra = subset + "_" if subset != "full" else ""
-        #         if jsonl_file is not None:
-        #             result_path = os.path.basename(jsonl_file.name).replace(".jsonl", f"_{extra}eval_results.json")
-        #         else:
-        #             result_path = None
-        #         for log in stream_logs(command, jsonl_file):
-        #             if jsonl_file is not None:
-        #                 yield log, gr.update(value=result_path, label=result_path), gr.update()
-        #             else:
-        #                 yield log, gr.update(), gr.update()
-        #         is_running = False
-        #         result_file = find_result_file()
-        #         if result_file:
-        #             return gr.update(label="Evaluation completed. Result file found."), gr.update(value=result_file)
-        #                     # gr.Button(visible=False)#,
-        #                     # gr.DownloadButton(label="Download Result", value=result_file, visible=True))
-        #         else:
-        #             return gr.update(label="Evaluation completed. No result file found."), gr.update(value=result_path)
-        #                     # gr.Button("Run Evaluation", visible=True),
-        #                     # gr.DownloadButton(visible=False))
-        #     submit_btn.click(start_evaluation,
-        #                 inputs=[command_output, jsonl_file, subset, split],
-        #                 outputs=[log_output, download_btn])
     with gr.Row():
         with gr.Accordion("📙 Citation", open=False):

         with gr.TabItem("🚀 Request", id=4):
             gr.Markdown(SUBMISSION_TEXT_3)
+        with gr.TabItem("🛠️ Execute", id=5):
+            gr.Markdown("# BigCodeBench Evaluator")
+            with gr.Row():
+                jsonl_file = gr.File(label="Upload JSONL file", file_types=[".jsonl"])
+                split = gr.Dropdown(choices=["complete", "instruct"], label="Split", value="complete")
+                subset = gr.Dropdown(choices=["hard"], label="Subset", value="hard")
+            with gr.Row():
+                parallel = gr.Number(label="Parallel (optional)", precision=0)
+                min_time_limit = gr.Number(label="Min Time Limit", value=1, precision=1)
+                max_as_limit = gr.Number(label="Max AS Limit", value=25*1024, precision=0)
+            with gr.Row():
+                max_data_limit = gr.Number(label="Max Data Limit", value=25*1024, precision=0)
+                max_stack_limit = gr.Number(label="Max Stack Limit", value=10, precision=0)
+                check_gt_only = gr.Checkbox(label="Check GT Only")
+                no_gt = gr.Checkbox(label="No GT")
+            command_output = gr.Textbox(label="Command", value=default_command, interactive=False)
+            with gr.Row():
+                submit_btn = gr.Button("Run Evaluation")
+                download_btn = gr.DownloadButton(label="Download Result")
+            log_output = gr.Textbox(label="Execution Logs", lines=20)
+            input_components = [
+                jsonl_file, split, subset, parallel,
+                min_time_limit, max_as_limit, max_data_limit, max_stack_limit,
+                check_gt_only, no_gt
+            ]
+            for component in input_components:
+                component.change(generate_command, inputs=input_components, outputs=command_output)
+            def start_evaluation(command, jsonl_file, subset, split):
+                extra = subset + "_" if subset != "full" else ""
+                if jsonl_file is not None:
+                    result_path = os.path.basename(jsonl_file.name).replace(".jsonl", f"_{extra}eval_results.json")
+                else:
+                    result_path = None
+                for log in stream_logs(command, jsonl_file):
+                    if jsonl_file is not None:
+                        yield log, gr.update(value=result_path, label=result_path), gr.update()
+                    else:
+                        yield log, gr.update(), gr.update()
+                is_running = False
+                result_file = find_result_file()
+                if result_file:
+                    return gr.update(label="Evaluation completed. Result file found."), gr.update(value=result_file)
+                            # gr.Button(visible=False)#,
+                            # gr.DownloadButton(label="Download Result", value=result_file, visible=True))
+                else:
+                    return gr.update(label="Evaluation completed. No result file found."), gr.update(value=result_path)
+                            # gr.Button("Run Evaluation", visible=True),
+                            # gr.DownloadButton(visible=False))
+            submit_btn.click(start_evaluation,
+                        inputs=[command_output, jsonl_file, subset, split],
+                        outputs=[log_output, download_btn])
     with gr.Row():
         with gr.Accordion("📙 Citation", open=False):