Spaces:

aavetis
/

ugen-image-captioning

Running on Zero

fix example

26abb52 7 months ago

No virus

862 Bytes

	import gradio as gr
	from uform import gen_model
	from PIL import Image

	# Load the model and processor
	model = gen_model.VLMForCausalLM.from_pretrained("unum-cloud/uform-gen")
	processor = gen_model.VLMProcessor.from_pretrained("unum-cloud/uform-gen")

	def generate_caption(image, prompt):
	# Process the image and the prompt
	inputs = processor(text=prompt, images=image, return_tensors="pt", padding=True)

	# Generate the output
	outputs = model.generate(**inputs)
	caption = processor.decode(outputs[0], skip_special_tokens=True)

	return caption

	# Define the Gradio interface
	iface = gr.Interface(
	fn=generate_caption,
	inputs=[gr.Image(type="pil", label="Upload Image"), gr.Textbox(label="Prompt")],
	outputs=gr.Textbox(label="Generated Caption"),
	examples=[["jungle-glass.png", ""]]
	)

	# Launch the interface
	iface.launch()