Spaces:

ivelin
/

ui-refexp

Runtime error

App Files Community

ivelin committed on Jan 9, 2023

Commit

a432919

1 Parent(s): dedc746

fix: cleanup

Browse files

Signed-off-by: ivelin <ivelin.eth@gmail.com>

Files changed (1) hide show

app.py +8 -11

app.py CHANGED Viewed

@@ -16,16 +16,13 @@ model.to(device)
 def process_refexp(image: Image, prompt: str):
-    # extract PIL image from Gradio Image component
-    pil_image = image.value
-    print(f"(image, prompt): {pil_image}, {prompt}")
     # trim prompt to 80 characters and normalize to lowercase
     prompt = prompt[:80].lower()
     # prepare encoder inputs
-    pixel_values = processor(pil_image, return_tensors="pt").pixel_values
     # prepare decoder inputs
     task_prompt = "<s_refexp><s_prompt>{user_input}</s_prompt><s_refexp>"
@@ -56,9 +53,9 @@ def process_refexp(image: Image, prompt: str):
     bbox = processor.token2json(sequence)
     print(f"predicted bounding box: {bbox}")
-    print(f"image object: {pil_image}")
-    print(f"image size: {pil_image.size}")
-    width, height = pil_image.size
     print(f"image width, height: {width, height}")
     print(f"prompt: {sample['prompt']}")
@@ -73,7 +70,7 @@ def process_refexp(image: Image, prompt: str):
     shape = [(xmin, ymin), (xmax, ymax)]
     # create rectangle image
-    img1 = ImageDraw.Draw(pil_image)
     img1.rectangle(shape, outline="green", width=5)
     return image, bbox
@@ -85,8 +82,8 @@ examples = [["example_1.jpg", "select the setting icon from top right corner"],
             ["example_2.jpg", "enter the text field next to the name"]]
 demo = gr.Interface(fn=process_refexp,
-                    inputs=["image", "text"],
-                    outputs=["image", "json"],
                     title=title,
                     description=description,
                     article=article,

 def process_refexp(image: Image, prompt: str):
+    print(f"(image, prompt): {image}, {prompt}")
     # trim prompt to 80 characters and normalize to lowercase
     prompt = prompt[:80].lower()
     # prepare encoder inputs
+    pixel_values = processor(image, return_tensors="pt").pixel_values
     # prepare decoder inputs
     task_prompt = "<s_refexp><s_prompt>{user_input}</s_prompt><s_refexp>"
     bbox = processor.token2json(sequence)
     print(f"predicted bounding box: {bbox}")
+    print(f"image object: {image}")
+    print(f"image size: {image.size}")
+    width, height = image.size
     print(f"image width, height: {width, height}")
     print(f"prompt: {sample['prompt']}")
     shape = [(xmin, ymin), (xmax, ymax)]
     # create rectangle image
+    img1 = ImageDraw.Draw(image)
     img1.rectangle(shape, outline="green", width=5)
     return image, bbox
             ["example_2.jpg", "enter the text field next to the name"]]
 demo = gr.Interface(fn=process_refexp,
+                    inputs=[gr.Image(type="pil"), "text"],
+                    outputs=[gr.Image(type="pil"), "json"],
                     title=title,
                     description=description,
                     article=article,