Spaces:

autoevaluate
/

model-evaluator

Runtime error

App Files Files

xet

Community

lewtun HF Staff committed on Apr 29, 2022

Commit

8dec3b6

1 Parent(s): 160673c

Refactor task names

Browse files

Files changed (2) hide show

app.py +4 -20
utils.py +14 -1

app.py CHANGED Viewed

@@ -29,19 +29,6 @@ TASK_TO_ID = {
     # "single_column_regression": 10,
 }
-AUTOTRAIN_TASK_TO_HUB_TASK = {
-    "binary_classification": "text-classification",
-    "multi_class_classification": "text-classification",
-    # "multi_label_classification": "text-classification", # Not fully supported in AutoTrain
-    "entity_extraction": "token-classification",
-    "extractive_question_answering": "question-answering",
-    "translation": "translation",
-    "summarization": "summarization",
-    # "single_column_regression": 10,
-}
-HUB_TASK_TO_AUTOTRAIN_TASK = {v: k for k, v in AUTOTRAIN_TASK_TO_HUB_TASK.items()}
 ###########
 ### APP ###
 ###########
@@ -74,7 +61,7 @@ if metadata is None:
 with st.expander("Advanced configuration"):
     ## Select task
-    selected_task = st.selectbox("Select a task", list(AUTOTRAIN_TASK_TO_HUB_TASK.values()))
     ### Select config
     configs = get_dataset_config_names(selected_dataset)
     selected_config = st.selectbox("Select a config", configs)
@@ -84,9 +71,7 @@ with st.expander("Advanced configuration"):
     if splits_resp.status_code == 200:
         split_names = []
         all_splits = splits_resp.json()
-        print(all_splits)
         for split in all_splits["splits"]:
-            print(selected_config)
             if split["config"] == selected_config:
                 split_names.append(split["split"])
@@ -120,7 +105,7 @@ with st.expander("Advanced configuration"):
     # TODO: make it task specific
     col_mapping = {}
     with col1:
-        if selected_task == "text-classification":
             st.markdown("`text` column")
             st.text("")
             st.text("")
@@ -153,11 +138,10 @@ with st.form(key="form"):
     if submit_button:
         project_id = str(uuid.uuid4())[:3]
-        autotrain_task_name = HUB_TASK_TO_AUTOTRAIN_TASK[selected_task]
         payload = {
             "username": AUTOTRAIN_USERNAME,
             "proj_name": f"my-eval-project-{project_id}",
-            "task": TASK_TO_ID[autotrain_task_name],
             "config": {
                 "language": "en",
                 "max_models": 5,
@@ -181,7 +165,7 @@ with st.form(key="form"):
         if project_json_resp["created"]:
             payload = {
-                "split": 4,
                 "col_mapping": col_mapping,
                 "load_config": {"max_size_bytes": 0, "shuffle": False},
             }

     # "single_column_regression": 10,
 }
 ###########
 ### APP ###
 ###########
 with st.expander("Advanced configuration"):
     ## Select task
+    selected_task = st.selectbox("Select a task", list(TASK_TO_ID.keys()))
     ### Select config
     configs = get_dataset_config_names(selected_dataset)
     selected_config = st.selectbox("Select a config", configs)
     if splits_resp.status_code == 200:
         split_names = []
         all_splits = splits_resp.json()
         for split in all_splits["splits"]:
             if split["config"] == selected_config:
                 split_names.append(split["split"])
     # TODO: make it task specific
     col_mapping = {}
     with col1:
+        if selected_task in ["binary_classification", "multi_class_classification"]:
             st.markdown("`text` column")
             st.text("")
             st.text("")
     if submit_button:
         project_id = str(uuid.uuid4())[:3]
         payload = {
             "username": AUTOTRAIN_USERNAME,
             "proj_name": f"my-eval-project-{project_id}",
+            "task": TASK_TO_ID[selected_task],
             "config": {
                 "language": "en",
                 "max_models": 5,
         if project_json_resp["created"]:
             payload = {
+                "split": 4,  # use "auto" split choice in AutoTrain
                 "col_mapping": col_mapping,
                 "load_config": {"max_size_bytes": 0, "shuffle": False},
             }

utils.py CHANGED Viewed

@@ -3,6 +3,19 @@ from typing import Dict, Union
 import requests
 from huggingface_hub import DatasetFilter, HfApi, ModelFilter
 api = HfApi()
@@ -44,6 +57,6 @@ def get_metadata(dataset_name: str) -> Union[Dict, None]:
 def get_compatible_models(task, dataset_name):
-    filt = ModelFilter(task=task, trained_dataset=dataset_name, library="transformers")
     compatible_models = api.list_models(filter=filt)
     return [model.modelId for model in compatible_models]

 import requests
 from huggingface_hub import DatasetFilter, HfApi, ModelFilter
+AUTOTRAIN_TASK_TO_HUB_TASK = {
+    "binary_classification": "text-classification",
+    "multi_class_classification": "text-classification",
+    # "multi_label_classification": "text-classification", # Not fully supported in AutoTrain
+    "entity_extraction": "token-classification",
+    "extractive_question_answering": "question-answering",
+    "translation": "translation",
+    "summarization": "summarization",
+    # "single_column_regression": 10,
+}
+HUB_TASK_TO_AUTOTRAIN_TASK = {v: k for k, v in AUTOTRAIN_TASK_TO_HUB_TASK.items()}
 api = HfApi()
 def get_compatible_models(task, dataset_name):
+    filt = ModelFilter(task=AUTOTRAIN_TASK_TO_HUB_TASK[task], trained_dataset=dataset_name, library="transformers")
     compatible_models = api.list_models(filter=filt)
     return [model.modelId for model in compatible_models]