data_only_hallucination_leaderboard

Runtime error

App Files Files Community

pminervini committed on Dec 3, 2023

Commit

d489aeb

•

1 Parent(s): 83d660d

update

Browse files

Files changed (5) hide show

app.py +0 -0
backend-cli.py +2 -0
src/backend/manage_requests.py +2 -1
src/submission/check_validity.py +7 -3
submit-cli.py +152 -0

app.py CHANGED Viewed

File without changes

backend-cli.py CHANGED Viewed

@@ -1,3 +1,5 @@
 import os
 import json

+#!/usr/bin/env python
 import os
 import json

src/backend/manage_requests.py CHANGED Viewed

@@ -82,7 +82,8 @@ def get_eval_requests(job_status: list, local_dir: str, hf_repo: str) -> list[Ev
             # breakpoint()
             data["json_filepath"] = json_filepath
-            del data['job_id']
             eval_request = EvalRequest(**data)
             eval_requests.append(eval_request)

             # breakpoint()
             data["json_filepath"] = json_filepath
+            if 'job_id' in data:
+                del data['job_id']
             eval_request = EvalRequest(**data)
             eval_requests.append(eval_request)

src/submission/check_validity.py CHANGED Viewed

@@ -41,14 +41,17 @@ def is_model_on_hub(model_name: str, revision: str, token: str = None, trust_rem
     try:
         config = AutoConfig.from_pretrained(model_name, revision=revision, trust_remote_code=trust_remote_code, token=token)
         if test_tokenizer:
-            tokenizer_config = get_tokenizer_config(model_name)
             if tokenizer_config is not None:
                 tokenizer_class_candidate = tokenizer_config.get("tokenizer_class", None)
             else:
-                tokenizer_class_candidate = config.tokenizer_class
-            tokenizer_class = tokenizer_class_from_name(tokenizer_class_candidate)
             if tokenizer_class is None:
                 return (
                     False,
@@ -65,6 +68,7 @@ def is_model_on_hub(model_name: str, revision: str, token: str = None, trust_rem
         )
     except Exception as e:
         return False, "was not found on hub!", None

     try:
         config = AutoConfig.from_pretrained(model_name, revision=revision, trust_remote_code=trust_remote_code, token=token)
         if test_tokenizer:
+            tokenizer_config = get_tokenizer_config(model_name)
             if tokenizer_config is not None:
                 tokenizer_class_candidate = tokenizer_config.get("tokenizer_class", None)
             else:
+                tokenizer_class_candidate = config.tokenizer_class
+            tokenizer_class = None
+            if tokenizer_class_candidate is not None:
+                tokenizer_class = tokenizer_class_from_name(tokenizer_class_candidate)
             if tokenizer_class is None:
                 return (
                     False,
         )
     except Exception as e:
+        print('XXX', e)
         return False, "was not found on hub!", None

submit-cli.py ADDED Viewed

	@@ -0,0 +1,152 @@

+#!/usr/bin/env python
+import json
+import os
+from datetime import datetime, timezone
+from src.envs import API, EVAL_REQUESTS_PATH, H4_TOKEN, QUEUE_REPO
+from src.submission.check_validity import already_submitted_models, check_model_card, get_model_size, is_model_on_hub
+def add_new_eval(model: str, base_model: str, revision: str, precision: str, private: bool, weight_type: str, model_type: str):
+    """Validate a model and upload an evaluation request for it to the queue repo.
+
+    Progress and every rejection reason are reported with ``print``; the
+    function always returns ``None``.
+
+    Args:
+        model: Hub model id, optionally in ``user/name`` form.
+        base_model: Base model id, checked only for "Delta"/"Adapter" weights.
+        revision: Model revision; an empty string is replaced by "main".
+        precision: Precision label; only the text before the first space is kept.
+        private: Stored in the request and used in the request file name.
+        weight_type: "Delta" and "Adapter" trigger the base-model check; every
+            value other than "Adapter" triggers the check of ``model`` itself.
+        model_type: Must be non-empty, otherwise the request is rejected.
+
+    Raises:
+        Whatever ``API.upload_file`` or the local file operations raise; the
+        local request file is removed even when the upload fails.
+    """
+    # Only the set of already-requested models is used here.
+    REQUESTED_MODELS, _ = already_submitted_models(EVAL_REQUESTS_PATH)
+    user_name = ""
+    model_path = model
+    if "/" in model:
+        tokens = model.split("/")
+        user_name = tokens[0]
+        model_path = tokens[1]
+    precision = precision.split(" ")[0]
+    current_time = datetime.now(timezone.utc).strftime("%Y-%m-%dT%H:%M:%SZ")
+    if model_type is None or model_type == "":
+        print("Please select a model type.")
+        return
+    if revision == "":
+        revision = "main"
+    # Is the model on the hub?
+    if weight_type in ["Delta", "Adapter"]:
+        base_model_on_hub, error, _ = is_model_on_hub(model_name=base_model, revision=revision, token=H4_TOKEN, test_tokenizer=True)
+        if not base_model_on_hub:
+            print(f'Base model "{base_model}" {error}')
+            return
+    if weight_type != "Adapter":
+        # NOTE(review): unlike the base-model check, no token is passed here -- confirm this is intentional.
+        model_on_hub, error, _ = is_model_on_hub(model_name=model, revision=revision, test_tokenizer=True)
+        if not model_on_hub:
+            print(f'Model "{model}" {error}')
+            return
+    # Is the model info correctly filled?
+    try:
+        model_info = API.model_info(repo_id=model, revision=revision)
+    except Exception:
+        print("Could not get your model information. Please fill it up properly.")
+        return
+    model_size = get_model_size(model_info=model_info, precision=precision)
+    # A missing license is only reported; the request is still created with 'none'.
+    model_license = 'none'
+    try:
+        model_license = model_info.cardData["license"]
+    except Exception:
+        print("Please select a license for your model")
+    # NOTE: the model card check (check_model_card) is deliberately not run by this script.
+    # Seems good, creating the eval
+    print("Adding new eval")
+    eval_entry = {
+        "model": model,
+        "base_model": base_model,
+        "revision": revision,
+        "private": private,
+        "precision": precision,
+        "weight_type": weight_type,
+        "status": "PENDING",
+        "submitted_time": current_time,
+        "model_type": model_type,
+        "likes": model_info.likes,
+        "params": model_size,
+        "license": model_license,
+    }
+    # Check for duplicate submission
+    if f"{model}_{revision}_{precision}" in REQUESTED_MODELS:
+        print("This model has been already submitted.")
+        return
+    print("Creating eval file")
+    OUT_DIR = f"{EVAL_REQUESTS_PATH}/{user_name}"
+    os.makedirs(OUT_DIR, exist_ok=True)
+    out_path = f"{OUT_DIR}/{model_path}_eval_request_{private}_{precision}_{weight_type}.json"
+    with open(out_path, "w", encoding="utf-8") as f:
+        json.dump(eval_entry, f)
+    print("Uploading eval file")
+    try:
+        # NOTE(review): the split assumes out_path contains "eval-queue/" -- confirm against EVAL_REQUESTS_PATH.
+        API.upload_file(path_or_fileobj=out_path, path_in_repo=out_path.split("eval-queue/")[1],
+                        repo_id=QUEUE_REPO, repo_type="dataset", commit_message=f"Add {model} to eval queue")
+    finally:
+        # Remove the local file even if the upload failed, so no stale request
+        # file stays in EVAL_REQUESTS_PATH (presumably the directory that
+        # already_submitted_models scans -- verify).
+        os.remove(out_path)
+    print("Your request has been submitted to the evaluation queue!\nPlease wait for up to an hour for the model to show in the PENDING list.")
+    return
+def main():
+    """Queue the most-downloaded public English text-generation models for evaluation.
+
+    Lists the models on the hub, keeps the public ones tagged 'en' whose
+    pipeline tag is 'text-generation', and takes the 50 with the most
+    downloads. Each one whose id is not already among the requests in the
+    queue repo (in any status) is submitted through ``add_new_eval``.
+    """
+    # Project and hub imports stay function-local, as in the original script.
+    from huggingface_hub import HfApi, snapshot_download
+    from src.backend.envs import EVAL_REQUESTS_PATH_BACKEND
+    from src.backend.manage_requests import EvalRequest, get_eval_requests
+    max_candidates = 50
+    def custom_filter(m) -> bool:
+        # Defensive: treat a missing tag list as "no tags" instead of raising.
+        return m.pipeline_tag in {'text-generation'} and 'en' in (m.tags or []) and m.private is False
+    api = HfApi()
+    # Filter straight from the listing iterator; a missing download count sorts as 0.
+    candidates = sorted((m for m in api.list_models() if custom_filter(m)), key=lambda m: m.downloads or 0, reverse=True)[:max_candidates]
+    if not candidates:
+        return
+    # The queue snapshot is fetched once: candidate ids are distinct, so the
+    # membership test below does not depend on requests added during this run.
+    snapshot_download(repo_id=QUEUE_REPO, revision="main", local_dir=EVAL_REQUESTS_PATH_BACKEND, repo_type="dataset", max_workers=60)
+    PENDING_STATUS = "PENDING"
+    RUNNING_STATUS = "RUNNING"
+    FINISHED_STATUS = "FINISHED"
+    FAILED_STATUS = "FAILED"
+    status = [PENDING_STATUS, RUNNING_STATUS, FINISHED_STATUS, FAILED_STATUS]
+    # Get the eval requests in every status, so a model is never queued twice.
+    eval_requests: list[EvalRequest] = get_eval_requests(job_status=status, hf_repo=QUEUE_REPO, local_dir=EVAL_REQUESTS_PATH_BACKEND)
+    requested_model_names = {e.model for e in eval_requests}
+    for model in candidates:
+        print(f'Considering {model.id} ..')
+        if model.id in requested_model_names:
+            print(f'Model {model.id} already added, not adding it to the queue again.')
+            continue
+        add_new_eval(model=model.id, base_model='', revision='main', precision='float32', private=False, weight_type='Original', model_type='pretrained')
+if __name__ == "__main__":
+    main()