open_pt_llm_leaderboard

Running on CPU Upgrade

eduagarcia committed on Feb 6, 2024

Commit

79aba72

1 Parent(s): 1764c92

minor fixes

Files changed (2) hide show

src/leaderboard/read_evals.py CHANGED Viewed

@@ -75,6 +75,7 @@ class EvalResult:
             tasks = ORIGINAL_TASKS
         for task in tasks:
             benchmark, metric = task
             # We skip old mmlu entries
             wrong_mmlu_version = False
@@ -241,7 +242,7 @@ def get_raw_eval_results(results_path: str, requests_path: str, dynamic_path: st
             if v.status == "FINISHED" and not v.hidden:
                 v.to_dict() # we test if the dict version is complete
                 results.append(v)
-        except KeyError:  # not all eval values present
             continue
     return results

             tasks = ORIGINAL_TASKS
         for task in tasks:
             benchmark, metric = task
+            metric = metric + ',all'
             # We skip old mmlu entries
             wrong_mmlu_version = False
             if v.status == "FINISHED" and not v.hidden:
                 v.to_dict() # we test if the dict version is complete
                 results.append(v)
+        except KeyError as e:  # not all eval values present
             continue
     return results

src/scripts/update_all_request_files.py CHANGED Viewed

@@ -46,7 +46,8 @@ def update_models(file_path, models, original_leaderboard_files=None):
             # Is the model still on the hub?
             model_name = model_id
-            if model_cfg.card_data is not None and model_cfg.card_data.base_model is not None:
                 model_name = model_cfg.card_data.base_model # for adapters, we look at the parent model
             still_on_hub, _, _ = is_model_on_hub(
                 model_name=model_name, revision=data.get("revision"), trust_remote_code=True, test_tokenizer=False, token=H4_TOKEN

             # Is the model still on the hub?
             model_name = model_id
+            if model_cfg.card_data is not None and hasattr(model_cfg.card_data, "base_model") and model_cfg.card_data.base_model is not None:
                 model_name = model_cfg.card_data.base_model # for adapters, we look at the parent model
             still_on_hub, _, _ = is_model_on_hub(
                 model_name=model_name, revision=data.get("revision"), trust_remote_code=True, test_tokenizer=False, token=H4_TOKEN