deplot_plus_llm

Runtime error

App Files Community

fl399 committed on Apr 11, 2023

Commit

f2216d5

1 Parent(s): 56f3b9b

Update app.py

Browse files

Files changed (1) hide show

app.py +53 -45

app.py CHANGED Viewed

@@ -66,54 +66,54 @@ A: Let's find the row of year 2007, that's Row 3. Let's extract the numbers on R
 ## alpaca-lora
-assert (
-    "LlamaTokenizer" in transformers._import_structure["models.llama"]
-), "LLaMA is now in HuggingFace's main branch.\nPlease reinstall it: pip uninstall transformers && pip install git+https://github.com/huggingface/transformers.git"
-from transformers import LlamaTokenizer, LlamaForCausalLM, GenerationConfig
-tokenizer = LlamaTokenizer.from_pretrained("decapoda-research/llama-7b-hf")
-BASE_MODEL = "decapoda-research/llama-7b-hf"
-LORA_WEIGHTS = "tloen/alpaca-lora-7b"
-if device == "cuda":
-    model = LlamaForCausalLM.from_pretrained(
-        BASE_MODEL,
-        load_in_8bit=False,
-        torch_dtype=torch.float16,
-        device_map="auto",
-    )
-    model = PeftModel.from_pretrained(
-        model, LORA_WEIGHTS, torch_dtype=torch.float16, force_download=True
-    )
-elif device == "mps":
-    model = LlamaForCausalLM.from_pretrained(
-        BASE_MODEL,
-        device_map={"": device},
-        torch_dtype=torch.float16,
-    )
-    model = PeftModel.from_pretrained(
-        model,
-        LORA_WEIGHTS,
-        device_map={"": device},
-        torch_dtype=torch.float16,
-    )
-else:
-    model = LlamaForCausalLM.from_pretrained(
-        BASE_MODEL, device_map={"": device}, low_cpu_mem_usage=True
-    )
-    model = PeftModel.from_pretrained(
-        model,
-        LORA_WEIGHTS,
-        device_map={"": device},
-    )
-if device != "cpu":
-    model.half()
-model.eval()
-if torch.__version__ >= "2":
-    model = torch.compile(model)
 ## FLAN-UL2
@@ -223,10 +223,17 @@ theme = gr.themes.Monochrome(
 with gr.Blocks(theme=theme) as demo:
     with gr.Column():
       gr.Markdown(
             """<h1><center>DePlot+LLM: Multimodal chain-of-thought reasoning on plots</center></h1>
             <p>
-            This is a demo of DePlot+LLM for QA and summarisation. <a href='https://arxiv.org/abs/2212.10505' target='_blank'>DePlot</a> is an image-to-text model that converts plots and charts into a textual sequence. The sequence then is used to prompt LLM for chain-of-thought reasoning. The current underlying LLMs are <a href='https://huggingface.co/spaces/tloen/alpaca-lora' target='_blank'>alpaca-lora</a>, <a href='https://huggingface.co/google/flan-ul2' target='_blank'>flan-ul2</a>, and <a href='https://openai.com/blog/chatgpt' target='_blank'>gpt-3.5-turbo</a>. To use it, simply upload your image and type a question or instruction and click 'submit', or click one of the examples to load them. Read more at the links below.
             </p>
             """
             )
@@ -236,7 +243,8 @@ with gr.Blocks(theme=theme) as demo:
         input_image = gr.Image(label="Input Image", type="pil", interactive=True)
         #input_image.style(height=512, width=512)
         instruction = gr.Textbox(placeholder="Enter your instruction/question...", label="Question/Instruction")
-        llm = gr.Dropdown(["alpaca-lora", "flan-ul2", "gpt-3.5-turbo"], label="LLM")
         openai_api_key_textbox = gr.Textbox(value='',
                                             placeholder="Paste your OpenAI API key (sk-...) and hit Enter (if using OpenAI models, otherwise leave empty)",
                                             show_label=False, lines=1, type='password')

 ## alpaca-lora
+# assert (
+#     "LlamaTokenizer" in transformers._import_structure["models.llama"]
+# ), "LLaMA is now in HuggingFace's main branch.\nPlease reinstall it: pip uninstall transformers && pip install git+https://github.com/huggingface/transformers.git"
+# from transformers import LlamaTokenizer, LlamaForCausalLM, GenerationConfig
+# tokenizer = LlamaTokenizer.from_pretrained("decapoda-research/llama-7b-hf")
+# BASE_MODEL = "decapoda-research/llama-7b-hf"
+# LORA_WEIGHTS = "tloen/alpaca-lora-7b"
+# if device == "cuda":
+#     model = LlamaForCausalLM.from_pretrained(
+#         BASE_MODEL,
+#         load_in_8bit=False,
+#         torch_dtype=torch.float16,
+#         device_map="auto",
+#     )
+#     model = PeftModel.from_pretrained(
+#         model, LORA_WEIGHTS, torch_dtype=torch.float16, force_download=True
+#     )
+# elif device == "mps":
+#     model = LlamaForCausalLM.from_pretrained(
+#         BASE_MODEL,
+#         device_map={"": device},
+#         torch_dtype=torch.float16,
+#     )
+#     model = PeftModel.from_pretrained(
+#         model,
+#         LORA_WEIGHTS,
+#         device_map={"": device},
+#         torch_dtype=torch.float16,
+#     )
+# else:
+#     model = LlamaForCausalLM.from_pretrained(
+#         BASE_MODEL, device_map={"": device}, low_cpu_mem_usage=True
+#     )
+#     model = PeftModel.from_pretrained(
+#         model,
+#         LORA_WEIGHTS,
+#         device_map={"": device},
+#     )
+# if device != "cpu":
+#     model.half()
+# model.eval()
+# if torch.__version__ >= "2":
+#     model = torch.compile(model)
 ## FLAN-UL2
 with gr.Blocks(theme=theme) as demo:
     with gr.Column():
+      # gr.Markdown(
+      #       """<h1><center>DePlot+LLM: Multimodal chain-of-thought reasoning on plots</center></h1>
+      #       <p>
+      #       This is a demo of DePlot+LLM for QA and summarisation. <a href='https://arxiv.org/abs/2212.10505' target='_blank'>DePlot</a> is an image-to-text model that converts plots and charts into a textual sequence. The sequence then is used to prompt LLM for chain-of-thought reasoning. The current underlying LLMs are <a href='https://huggingface.co/spaces/tloen/alpaca-lora' target='_blank'>alpaca-lora</a>, <a href='https://huggingface.co/google/flan-ul2' target='_blank'>flan-ul2</a>, and <a href='https://openai.com/blog/chatgpt' target='_blank'>gpt-3.5-turbo</a>. To use it, simply upload your image and type a question or instruction and click 'submit', or click one of the examples to load them. Read more at the links below.
+      #       </p>
+      #       """
+      #       )
       gr.Markdown(
             """<h1><center>DePlot+LLM: Multimodal chain-of-thought reasoning on plots</center></h1>
             <p>
+            This is a demo of DePlot+LLM for QA and summarisation. <a href='https://arxiv.org/abs/2212.10505' target='_blank'>DePlot</a> is an image-to-text model that converts plots and charts into a textual sequence. The sequence then is used to prompt LLM for chain-of-thought reasoning. The current underlying LLMs are <a href='https://huggingface.co/google/flan-ul2' target='_blank'>flan-ul2</a> and <a href='https://openai.com/blog/chatgpt' target='_blank'>gpt-3.5-turbo</a>. To use it, simply upload your image and type a question or instruction and click 'submit', or click one of the examples to load them. Read more at the links below.
             </p>
             """
             )
         input_image = gr.Image(label="Input Image", type="pil", interactive=True)
         #input_image.style(height=512, width=512)
         instruction = gr.Textbox(placeholder="Enter your instruction/question...", label="Question/Instruction")
+        #llm = gr.Dropdown(["alpaca-lora", "flan-ul2", "gpt-3.5-turbo"], label="LLM")
+          llm = gr.Dropdown(["flan-ul2", "gpt-3.5-turbo"], label="LLM")
         openai_api_key_textbox = gr.Textbox(value='',
                                             placeholder="Paste your OpenAI API key (sk-...) and hit Enter (if using OpenAI models, otherwise leave empty)",
                                             show_label=False, lines=1, type='password')