Spaces:

aavetis
/

ugen-image-captioning

Running on Zero

aavetis committed on Dec 28, 2023

Commit

582a256

•

1 Parent(s): cdcc865

change input

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,13 +1,11 @@
 import gradio as gr
 from uform import gen_model
 from PIL import Image
-import requests
 # Load the model and processor
 model = gen_model.VLMForCausalLM.from_pretrained("unum-cloud/uform-gen")
 processor = gen_model.VLMProcessor.from_pretrained("unum-cloud/uform-gen")
 def generate_caption(image, prompt):
     # Process the image and the prompt
     inputs = processor(text=prompt, images=image, return_tensors="pt", padding=True)
@@ -18,18 +16,14 @@ def generate_caption(image, prompt):
     return caption
 # Load the demo image
 demo_image = Image.open("jungle-glass.png")
 # Define the Gradio interface
 iface = gr.Interface(
     fn=generate_caption,
-    inputs=[
-        gr.inputs.Image(type="pil", label="Upload Image", default=demo_image),
-        gr.inputs.Textbox(label="Prompt"),
-    ],
-    outputs=gr.outputs.Textbox(label="Generated Caption"),
 )
 # Launch the interface

 import gradio as gr
 from uform import gen_model
 from PIL import Image
 # Load the model and processor
 model = gen_model.VLMForCausalLM.from_pretrained("unum-cloud/uform-gen")
 processor = gen_model.VLMProcessor.from_pretrained("unum-cloud/uform-gen")
 def generate_caption(image, prompt):
     # Process the image and the prompt
     inputs = processor(text=prompt, images=image, return_tensors="pt", padding=True)
     return caption
 # Load the demo image
 demo_image = Image.open("jungle-glass.png")
 # Define the Gradio interface
 iface = gr.Interface(
     fn=generate_caption,
+    inputs=[gr.Image(type="pil", label="Upload Image", default=demo_image), gr.Textbox(label="Prompt")],
+    outputs=gr.Textbox(label="Generated Caption"),
 )
 # Launch the interface