Spaces:

jayparmar0109
/

GenerativeAI-Business_Card_Reader

Running

App Files Files Community

GenerativeAI-Business_Card_Reader / app.py

jayparmar0109

Update app.py

34c1556 about 1 year ago

raw

history blame contribute delete

2.34 kB

	import streamlit as st
	import os
	import pathlib
	import textwrap
	from PIL import Image

	import google.generativeai as genai

	# Pull the Gemini API key from the process environment and hand it to the
	# google.generativeai client once, at import time.
	api_key = os.environ.get("GEMINI_API_KEY")
	genai.configure(api_key=api_key)

	def get_gemini_response(input, image, prompt, model_name='gemini-pro-vision'):
	    """Send one multimodal request to a Gemini model and return its text reply.

	    Args:
	        input: Instruction text placed first in the request. The name shadows
	            the ``input`` builtin; it is kept so keyword callers keep working.
	        image: Sequence whose first element is the image part to send.
	        prompt: Optional extra text from the user. ``None``, empty and
	            whitespace-only values are left out of the request.
	        model_name: Identifier passed to ``genai.GenerativeModel``. Defaults
	            to the model this function has always used.

	    Returns:
	        The ``text`` attribute of the ``generate_content`` response.
	    """
	    # NOTE(review): 'gemini-pro-vision' appears to have been retired upstream;
	    # confirm against the current model list and pass a newer model_name.
	    model = genai.GenerativeModel(model_name)

	    parts = [input, image[0]]
	    # The extra prompt is optional in the UI. Only forward it when it carries
	    # text, so the request never contains an empty text part.
	    if prompt and prompt.strip():
	        parts.append(prompt)

	    response = model.generate_content(parts)
	    return response.text

	def input_image_setup(uploaded_file):
	    """Wrap an uploaded file as a one-element list of image parts.

	    Args:
	        uploaded_file: Object exposing ``getvalue()`` (the raw bytes) and a
	            ``type`` attribute (the MIME type), or ``None`` when nothing was
	            uploaded.

	    Returns:
	        A list holding a single dict with the keys ``"mime_type"`` and
	        ``"data"``.

	    Raises:
	        FileNotFoundError: If ``uploaded_file`` is ``None``.
	    """
	    if uploaded_file is None:
	        raise FileNotFoundError("No file uploaded")

	    # Read the whole upload into memory as bytes.
	    bytes_data = uploaded_file.getvalue()
	    return [
	        {
	            "mime_type": uploaded_file.type,
	            "data": bytes_data,
	        }
	    ]

	# --- Page layout: title, description, upload widget, prompt box, button ---
	st.set_page_config(page_title="Gemini Image Demo")

	st.header("Generative AI : Business Card Reader")
	st.caption("""This space is based on Google generative ai API and it uses Gemini pro vision model
	to extract text from business card images. You can use your own images for input
	or find sample images in example folder of files section in this space.
	You can add input prompt below if you want to get specific information from image.
	You can modify this space for other input like invoice.""")

	uploaded_file = st.file_uploader("Choose an image...", type=["jpg", "jpeg", "png"])
	if uploaded_file is not None:
	    # Show a preview of the upload; nothing is rendered until a file exists.
	    image = Image.open(uploaded_file)
	    st.image(image, caption="Uploaded Image.", use_column_width=True)

	# NOTE: this name shadows the ``input`` builtin; it is kept because the
	# submit handler further down reads it.
	input = st.text_input("Input Prompt (Optional) : ", key="input")

	submit = st.button("Submit")

	# Fixed instruction sent with every request. It asks the model for JSON with
	# snake_case keys, so every label below is written as a valid key name.
	input_prompt = """
	You are an expert in understanding business cards.
	Input: Image of a business card.
	Task: Extract and label the following information in JSON format:
	Labels : person_name, company_name, occupation, contact_number, email_address, website, address, other_details (services, features, etc.)
	Constraints: Do not include missing information.
	"""

	# Run the extraction when the user presses Submit.
	if submit:
	    if uploaded_file is None:
	        # input_image_setup() raises FileNotFoundError when nothing was
	        # uploaded; show a readable message instead of a traceback.
	        st.warning("Please upload a business card image before submitting.")
	    else:
	        image_data = input_image_setup(uploaded_file)
	        response = get_gemini_response(input_prompt, image_data, input)
	        st.subheader("Output :")
	        st.write(response)