Spaces:

Prakh24s
/

blip-api-personal

Sleeping

Prakh24s committed on Sep 29, 2023

Commit

fbfec82

•

1 Parent(s): 1a004cd

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,9 +7,9 @@ model_id = "Salesforce/blip-image-captioning-base"
 model = BlipForConditionalGeneration.from_pretrained(model_id)
 processor = BlipProcessor.from_pretrained(model_id)
-def generate_caption(image_path):
-    # Load the image directly from the path
-    image = Image.open(image_path).convert('RGB')
     # Process the image to generate tensor inputs
     inputs = processor(image, return_tensors="pt")
@@ -20,6 +20,7 @@ def generate_caption(image_path):
     # Decode and return the generated caption
     return processor.decode(out[0], skip_special_tokens=True)
 # Gradio interface setup to accept image input and produce text output
 iface = gr.Interface(generate_caption, inputs="image", outputs="text")

 model = BlipForConditionalGeneration.from_pretrained(model_id)
 processor = BlipProcessor.from_pretrained(model_id)
+def generate_caption(image_array):
+    # Convert numpy array to PIL Image
+    image = Image.fromarray(image_array.astype('uint8')).convert('RGB')
     # Process the image to generate tensor inputs
     inputs = processor(image, return_tensors="pt")
     # Decode and return the generated caption
     return processor.decode(out[0], skip_special_tokens=True)
 # Gradio interface setup to accept image input and produce text output
 iface = gr.Interface(generate_caption, inputs="image", outputs="text")