Updated owner organization
- src/custom_tasks/heq_task.py +2 -1
- src/custom_tasks/sentiment_task.py +2 -1
- src/custom_tasks/translation_task.py +2 -1
- src/custom_tasks/winograd_task.py +2 -1
- src/envs.py +1 -1
- src/logging.py +1 -1
src/custom_tasks/heq_task.py
CHANGED
@@ -9,6 +9,7 @@ from lighteval.tasks.requests import Doc
 from Levenshtein import distance
 import collections
 from lighteval.utils import as_list
+from envs import OWNER
 
 def get_tokens(s):
     if not s:
@@ -105,7 +106,7 @@ heq_task = LightevalTaskConfig(
     name="heq-qa-tlnls",
     prompt_function="heq_prompt_fn",  # must be defined in the file or imported from src/lighteval/tasks/tasks_prompt_formatting.py
     suite=["custom"],
-    hf_repo="
+    hf_repo=f"{OWNER}/tests",
     hf_subset="default",
     hf_avail_splits=["heq"],
     evaluation_splits=["heq"],
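These config fields map directly onto a datasets.load_dataset() call — hf_repo is the path, hf_subset the config name, and the evaluation split the split — so the renamed repo can be sanity-checked outside lighteval. A minimal sketch, assuming the repo is readable with the same HF_TOKEN:

```python
import os
from datasets import load_dataset

OWNER = "hebrew-llm-leaderboard"  # must match src/envs.py

# hf_repo -> path, hf_subset -> config name, evaluation split -> split
ds = load_dataset(f"{OWNER}/tests", "default", split="heq",
                  token=os.environ.get("HF_TOKEN"))
print(ds[0])  # one record, as heq_prompt_fn will receive it
```

The same check applies to the sentiment, translation, and winograd tasks below, which point at the same repo with their own splits.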
src/custom_tasks/sentiment_task.py
CHANGED
@@ -9,6 +9,7 @@ from lighteval.tasks.requests import Doc
 from Levenshtein import distance
 import collections
 from lighteval.utils import as_list
+from envs import OWNER
 
 def sentiment_eval_fn(golds: list[str], predictions: list[str], formatted_doc: Doc = None):
     if len(predictions) > 1:
@@ -49,7 +50,7 @@ sentiment_task = LightevalTaskConfig(
     name="sentiment-acc",
     prompt_function="sentiment_prompt_fn",  # must be defined in the file or imported from src/lighteval/tasks/tasks_prompt_formatting.py
     suite=["custom"],
-    hf_repo="
+    hf_repo=f"{OWNER}/tests",
     hf_subset="default",
     hf_avail_splits=["sentiment"],
     evaluation_splits=["sentiment"],
src/custom_tasks/translation_task.py
CHANGED
@@ -10,6 +10,7 @@ from Levenshtein import distance
 import collections
 from lighteval.utils import as_list
 import sacrebleu
+from envs import OWNER
 
 def trans_prompt_fn(line, task_name: str = None):
     """Defines how to go from a dataset line to a doc object.
@@ -45,7 +46,7 @@ translation_task = LightevalTaskConfig(
     name="he-en-trans-bleu",
     prompt_function="trans_prompt_fn",  # must be defined in the file or imported from src/lighteval/tasks/tasks_prompt_formatting.py
     suite=["custom"],
-    hf_repo="
+    hf_repo=f"{OWNER}/tests",
     hf_subset="default",
     hf_avail_splits=["en2he", "he2en"],
     evaluation_splits=["en2he", "he2en"],
src/custom_tasks/winograd_task.py
CHANGED
@@ -9,6 +9,7 @@ from lighteval.tasks.requests import Doc
 from Levenshtein import distance
 import collections
 from lighteval.utils import as_list
+from envs import OWNER
 
 def winograd_eval_fn(golds: list[str], predictions: list[str], formatted_doc: Doc = None):
     if len(predictions) > 1:
@@ -46,7 +47,7 @@ winograd_task = LightevalTaskConfig(
     name="winograd-acc",
     prompt_function="winograd_prompt_fn",  # must be defined in the file or imported from src/lighteval/tasks/tasks_prompt_formatting.py
     suite=["custom"],
-    hf_repo="
+    hf_repo=f"{OWNER}/tests",
     hf_subset="default",
     hf_avail_splits=["winograd"],
     evaluation_splits=["winograd"],
src/envs.py
CHANGED
@@ -6,7 +6,7 @@ from huggingface_hub import HfApi
 # ----------------------------------
 TOKEN = os.environ.get("HF_TOKEN")  # A read/write token for your org
 
-OWNER = "
+OWNER = "hebrew-llm-leaderboard"  # Change to your org - don't forget to create a results and request file
 
 # For harness evaluations
 DEVICE = "cpu"  # "cuda:0" if you add compute, for harness evaluations
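The new inline comment is a reminder that the owner org must also hold the leaderboard's results and requests datasets. A sketch of creating them idempotently with huggingface_hub; the repo names f"{OWNER}/results" and f"{OWNER}/requests" are illustrative assumptions, not read from this diff:

```python
import os
from huggingface_hub import HfApi

OWNER = "hebrew-llm-leaderboard"  # same value as src/envs.py
api = HfApi(token=os.environ.get("HF_TOKEN"))

# Hypothetical repo names -- use whatever names the leaderboard actually reads.
for repo_id in (f"{OWNER}/results", f"{OWNER}/requests"):
    # exist_ok=True makes the call a no-op if the dataset already exists,
    # so this is safe to re-run on every deploy.
    api.create_repo(repo_id=repo_id, repo_type="dataset",
                    private=True, exist_ok=True)
```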
src/logging.py
CHANGED
@@ -22,7 +22,7 @@ def read_logs():
 # API.upload_file(
 #     path_or_fileobj="output.log",
 #     path_in_repo="backend.log",
-#     repo_id="
+#     repo_id="hebrew-llm-leaderboard/logs",
 #     repo_type="dataset",
 # )
 
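The upload block stays commented out; this commit only repoints its repo_id at the new org. If it is ever re-enabled, the live form would look roughly like the sketch below, assuming API is the HfApi client this codebase builds from HF_TOKEN:

```python
import os
from huggingface_hub import HfApi

API = HfApi(token=os.environ.get("HF_TOKEN"))  # mirrors the client in this repo

# Same arguments as the commented-out block above, with the new repo_id.
API.upload_file(
    path_or_fileobj="output.log",
    path_in_repo="backend.log",
    repo_id="hebrew-llm-leaderboard/logs",
    repo_type="dataset",
)
```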