Build

Paused

ManishThota committed on Feb 13

Commit

c52e238

•

1 Parent(s): 0c52e55

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -6,6 +6,14 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
 #Setting device to cuda
 torch.set_default_device("cuda")
 # Initialize the model and tokenizer
 model = AutoModelForCausalLM.from_pretrained("ManishThota/Sparrow",
                                              torch_dtype=torch.float16,
@@ -39,7 +47,7 @@ iface = gr.Interface(
     fn=gradio_predict,
     inputs=[gr.Image(type="pil", label="Upload or Drag an Image"),
             gr.Textbox(label="Question", placeholder="e.g. What are the colors of the bus in the image?", scale=4),
-            gr.Slider(2, 100, value=25, label="Count", info="Choose between 2 and 100")],
     outputs=gr.TextArea(label="Answer"),
     title="Sparrow - Tiny 3B | Visual Question Answering",
     description="An interactive chat model that can answer questions about images in an Academic context. \n We can input images, and the system will analyze them to provide information about their contents. I've utilized this capability by feeding slides from PowerPoint presentations used in classes and the lecture content passed as text. Consequently, the model now mimics the behavior and responses of my professors. So, if I present any PowerPoint slide, it explains it just like my professor would, further it can be personalized.",

 #Setting device to cuda
 torch.set_default_device("cuda")
+# # Ensure GPU usage if available
+# device = "cuda" if torch.cuda.is_available() else "cpu"
+# torch.set_default_tensor_type('torch.cuda.FloatTensor' if device=='cuda' else 'torch.FloatTensor')
+torch.set_default_tensor_type('torch.cuda.FloatTensor')
 # Initialize the model and tokenizer
 model = AutoModelForCausalLM.from_pretrained("ManishThota/Sparrow",
                                              torch_dtype=torch.float16,
     fn=gradio_predict,
     inputs=[gr.Image(type="pil", label="Upload or Drag an Image"),
             gr.Textbox(label="Question", placeholder="e.g. What are the colors of the bus in the image?", scale=4),
+            gr.Slider(2, 100, value=25, label="Token Count", info="Choose between 2 and 100")],
     outputs=gr.TextArea(label="Answer"),
     title="Sparrow - Tiny 3B | Visual Question Answering",
     description="An interactive chat model that can answer questions about images in an Academic context. \n We can input images, and the system will analyze them to provide information about their contents. I've utilized this capability by feeding slides from PowerPoint presentations used in classes and the lecture content passed as text. Consequently, the model now mimics the behavior and responses of my professors. So, if I present any PowerPoint slide, it explains it just like my professor would, further it can be personalized.",