alozowski committed
Commit 87e47c2
1 Parent(s): 9b133aa

Updated app.py download_dataset function

Files changed (3)
  1. app.py +15 -11
  2. src/populate.py +0 -1
  3. src/tools/collections.py +1 -1
app.py CHANGED
@@ -1,4 +1,5 @@
 import os
+import time
 import logging
 import gradio as gr
 import pandas as pd
@@ -56,13 +57,12 @@ enable_space_ci()
 def restart_space():
     API.restart_space(repo_id=REPO_ID, token=H4_TOKEN)
 
-
-def download_dataset(repo_id, local_dir, repo_type="dataset", max_attempts=3):
-    """Attempt to download dataset with retries."""
+def download_dataset(repo_id, local_dir, repo_type="dataset", max_attempts=3, backoff_factor=1.5):
+    """Download dataset with exponential backoff retries."""
     attempt = 0
     while attempt < max_attempts:
         try:
-            print(f"Downloading {repo_id} to {local_dir}")
+            logging.info(f"Downloading {repo_id} to {local_dir}")
             snapshot_download(
                 repo_id=repo_id,
                 local_dir=local_dir,
@@ -71,21 +71,25 @@ def download_dataset(repo_id, local_dir, repo_type="dataset", max_attempts=3):
                 etag_timeout=30,
                 max_workers=8,
             )
+            logging.info("Download successful")
             return
         except Exception as e:
-            logging.error(f"Error downloading {repo_id}: {e}")
+            wait_time = backoff_factor ** attempt
+            logging.error(f"Error downloading {repo_id}: {e}, retrying in {wait_time}s")
+            time.sleep(wait_time)
             attempt += 1
-            if attempt == max_attempts:
-                restart_space()
-
+    raise Exception(f"Failed to download {repo_id} after {max_attempts} attempts")
 
 def init_space(full_init: bool = True):
     """Initializes the application space, loading only necessary data."""
     if full_init:
         # These downloads only occur on full initialization
-        download_dataset(QUEUE_REPO, EVAL_REQUESTS_PATH)
-        download_dataset(DYNAMIC_INFO_REPO, DYNAMIC_INFO_PATH)
-        download_dataset(RESULTS_REPO, EVAL_RESULTS_PATH)
+        try:
+            download_dataset(QUEUE_REPO, EVAL_REQUESTS_PATH)
+            download_dataset(DYNAMIC_INFO_REPO, DYNAMIC_INFO_PATH)
+            download_dataset(RESULTS_REPO, EVAL_RESULTS_PATH)
+        except Exception:
+            restart_space()
 
     # Always retrieve the leaderboard DataFrame
     raw_data, original_df = get_leaderboard_df(
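For reference, below is a minimal, self-contained sketch of the retry pattern the updated download_dataset follows. It is not part of the commit: retry_with_backoff and the zero-argument callable fn are hypothetical stand-ins for the function body and the snapshot_download call. With the defaults (max_attempts=3, backoff_factor=1.5), failed attempts wait 1.0s, 1.5s, and 2.25s before the final exception propagates, which is what lets init_space catch it and call restart_space().

import logging
import time


def retry_with_backoff(fn, max_attempts=3, backoff_factor=1.5):
    """Retry fn() with exponential backoff; raise once all attempts fail."""
    attempt = 0
    while attempt < max_attempts:
        try:
            return fn()  # stands in for the snapshot_download(...) call above
        except Exception as e:
            wait_time = backoff_factor ** attempt  # 1.0s, 1.5s, 2.25s with the defaults
            logging.error(f"Attempt {attempt + 1} failed: {e}, retrying in {wait_time}s")
            time.sleep(wait_time)
            attempt += 1
    # Surface the failure so the caller (init_space in app.py) can restart the Space.
    raise Exception(f"Failed after {max_attempts} attempts")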
src/populate.py CHANGED
@@ -52,4 +52,3 @@ def get_leaderboard_df(results_path, requests_path, dynamic_path, cols, benchmark_cols):
     df = df[cols].round(decimals=2)
     df = df[has_no_nan_values(df, benchmark_cols)]
     return raw_data, df
-
src/tools/collections.py CHANGED
@@ -73,4 +73,4 @@ def update_collections(df: DataFrame):
         try:
             delete_collection_item(collection_slug=PATH_TO_COLLECTION, item_object_id=item_id, token=H4_TOKEN)
         except HfHubHTTPError:
-            continue
+            continue