idefics_and_chatty

Runtime error

App Files Files Community

VictorSanh commited on Mar 19, 2024

Commit

a7d545f

•

1 Parent(s): 5e5d5d1

add 286 mix6 table

Browse files

Files changed (1) hide show

app_dialogue.py +11 -4

app_dialogue.py CHANGED Viewed

@@ -25,20 +25,27 @@ subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENT
 DEVICE = torch.device("cuda")
 MODELS = {
-    "HuggingFaceM4/idefics2-neftune": AutoModelForCausalLM.from_pretrained(
         "HuggingFaceM4/idefics2",
         trust_remote_code=True,
         torch_dtype=torch.bfloat16,
         token=os.environ["HF_AUTH_TOKEN"],
         revision="1e05755c1c5cb2077a0f60b83ea1368c22a17282",
     ).to(DEVICE),
-    "HuggingFaceM4/idefics2": AutoModelForCausalLM.from_pretrained(
         "HuggingFaceM4/idefics2",
         trust_remote_code=True,
         torch_dtype=torch.bfloat16,
         token=os.environ["HF_AUTH_TOKEN"],
         revision="5cd3c3a3eb5e0ea664f5ac09e73c9ef42da93a86",
     ).to(DEVICE),
 }
 PROCESSOR = AutoProcessor.from_pretrained(
     "HuggingFaceM4/idefics2",
@@ -331,7 +338,7 @@ with gr.Blocks(title="IDEFICS Playground", theme=gr.themes.Base()) as demo:
     with gr.Row(elem_id="model_selector_row"):
         model_selector = gr.Dropdown(
             choices=MODELS.keys(),
-            value="HuggingFaceM4/idefics2",
             interactive=True,
             show_label=False,
             container=False,
@@ -520,7 +527,7 @@ with gr.Blocks(title="IDEFICS Playground", theme=gr.themes.Base()) as demo:
         Same as `model_inference` but in greedy mode and with the 80b-instruct.
         Specifically for pre-computing the default examples.
         """
-        model_selector = "HuggingFaceM4/idefics2"
         user_prompt_str = message
         chat_history = []
         max_new_tokens = 512

 DEVICE = torch.device("cuda")
 MODELS = {
+    "284 - neftune - opt 18'500": AutoModelForCausalLM.from_pretrained(
         "HuggingFaceM4/idefics2",
         trust_remote_code=True,
         torch_dtype=torch.bfloat16,
         token=os.environ["HF_AUTH_TOKEN"],
         revision="1e05755c1c5cb2077a0f60b83ea1368c22a17282",
     ).to(DEVICE),
+    "279bis - baseline - opt 18'500": AutoModelForCausalLM.from_pretrained(
         "HuggingFaceM4/idefics2",
         trust_remote_code=True,
         torch_dtype=torch.bfloat16,
         token=os.environ["HF_AUTH_TOKEN"],
         revision="5cd3c3a3eb5e0ea664f5ac09e73c9ef42da93a86",
     ).to(DEVICE),
+    "286 - mix6 tables - opt 20'000": AutoModelForCausalLM.from_pretrained(
+        "HuggingFaceM4/idefics2",
+        trust_remote_code=True,
+        torch_dtype=torch.bfloat16,
+        token=os.environ["HF_AUTH_TOKEN"],
+        revision="b473d49caa964991b40b79fe7cb27d51d4d023f6",
+    ).to(DEVICE),
 }
 PROCESSOR = AutoProcessor.from_pretrained(
     "HuggingFaceM4/idefics2",
     with gr.Row(elem_id="model_selector_row"):
         model_selector = gr.Dropdown(
             choices=MODELS.keys(),
+            value="284 - neftune - opt 18'500",
             interactive=True,
             show_label=False,
             container=False,
         Same as `model_inference` but in greedy mode and with the 80b-instruct.
         Specifically for pre-computing the default examples.
         """
+        model_selector = "284 - neftune - opt 18'500"
         user_prompt_str = message
         chat_history = []
         max_new_tokens = 512