core_leaderboard

Running

App Files Community

benediktstroebl committed on Aug 12, 2024

Commit

eb2a754

1 Parent(s): 86a15ac

formatting and download fix

Browse files

Files changed (1) hide show

app.py +7 -7

app.py CHANGED Viewed

@@ -23,6 +23,7 @@ import weave
 from datetime import datetime
 weave.init(f'leaderboard_testing_{datetime.now().strftime("%Y%m%d%H%M%S")}')
 def restart_space():
     API.restart_space(repo_id=REPO_ID, token=HF_TOKEN)
@@ -31,7 +32,7 @@ def restart_space():
 def download_latest_results():
     print("Downloading latest results...")
     snapshot_download(RESULTS_REPO_ID,
-                    local_dir=abs_path / "evals_upload",
                     repo_type='dataset',
                     tqdm_class=None,
                     etag_timeout=30,
@@ -39,7 +40,6 @@ def download_latest_results():
                     )
     print("Download complete.")
-abs_path = Path(__file__).parent
 # Global variable to store preprocessed data
 preprocessed_traces = {}
@@ -305,21 +305,21 @@ with gr.Blocks() as demo:
         with gr.Tab("SWE-Bench"):
             with gr.Row():
-                with gr.Column(scale=1):
-                    scatter_plot = gr.Plot(create_scatter_plot(parse_json_files(os.path.join(abs_path, "evals_live"), 'swebench_lite'), "Total Cost", "Accuracy", "Total Cost (in USD)", "Accuracy", ["Agent Name"]))
-                with gr.Column(scale=1):
                     Leaderboard(
                         value=parse_json_files(os.path.join(abs_path, "evals_live"), 'swebench_lite'),
                         select_columns=SelectColumns(
-                            default_selection=config.SWEBENCH_ON_LOAD_COLUMNS,
                             cant_deselect=["Agent Name"],
                             label="Select Columns to Display:",
                         ),
-                        search_columns=config.SWEBENCH_SEARCH_COLUMNS,
                         column_widths={"Agent Name": 40,
                                        "Accuracy": 20,
                                        "Total Cost": 20},
                     )
         with gr.Tab("About"):
             gr.Markdown((Path(__file__).parent / "about.md").read_text())

 from datetime import datetime
 weave.init(f'leaderboard_testing_{datetime.now().strftime("%Y%m%d%H%M%S")}')
+abs_path = Path(__file__).parent
 def restart_space():
     API.restart_space(repo_id=REPO_ID, token=HF_TOKEN)
 def download_latest_results():
     print("Downloading latest results...")
     snapshot_download(RESULTS_REPO_ID,
+                    local_dir= "evals_upload",
                     repo_type='dataset',
                     tqdm_class=None,
                     etag_timeout=30,
                     )
     print("Download complete.")
 # Global variable to store preprocessed data
 preprocessed_traces = {}
         with gr.Tab("SWE-Bench"):
             with gr.Row():
+                with gr.Column(scale=2):
                     Leaderboard(
                         value=parse_json_files(os.path.join(abs_path, "evals_live"), 'swebench_lite'),
                         select_columns=SelectColumns(
+                            default_selection=config.USACO_ON_LOAD_COLUMNS,
                             cant_deselect=["Agent Name"],
                             label="Select Columns to Display:",
                         ),
+                        search_columns=config.USACO_SEARCH_COLUMNS,
                         column_widths={"Agent Name": 40,
                                        "Accuracy": 20,
                                        "Total Cost": 20},
                     )
+            with gr.Row():
+                scatter_plot = gr.Plot(create_scatter_plot(parse_json_files(os.path.join(abs_path, "evals_live"), 'swebench_lite'), "Total Cost", "Accuracy", "Total Cost (in USD)", "Accuracy", ["Agent Name"]))
         with gr.Tab("About"):
             gr.Markdown((Path(__file__).parent / "about.md").read_text())