Spaces:

arad1367
/

GroqLLaVAMA_Econometrics_Agent

App Files Files Community

GroqLLaVAMA_Econometrics_Agent / app.py

arad1367

Update app.py

84154f2 verified about 2 months ago

raw

history blame contribute delete

6.28 kB

	# 1. Imports and API setup
	import gradio as gr
	from groq import Groq
	import base64
	import os

	# Define models used in the process
	llava_model = 'llava-v1.5-7b-4096-preview'
	llama31_model = 'llama-3.1-70b-versatile'

	# Image encoding function
	def encode_image(image_path):
	with open(image_path, "rb") as image_file:
	return base64.b64encode(image_file.read()).decode('utf-8')

	# Image to text function
	def image_to_text(client, model, base64_image, prompt):
	try:
	chat_completion = client.chat.completions.create(
	messages=[
	{
	"role": "user",
	"content": [
	{"type": "text", "text": prompt},
	{
	"type": "image_url",
	"image_url": {
	"url": f"data:image/jpeg;base64,{base64_image}",
	},
	},
	],
	}
	],
	model=model
	)
	return chat_completion.choices[0].message.content
	except Exception as e:
	if 'Invalid API Key' in str(e):
	return "Please enter a correct API key and try again."
	return f"Error generating text from image: {str(e)}"

	# Technical review generation function
	def technical_review_generation(client, image_description):
	keywords = ["econometrics", "finance", "marketing", "stock", "prediction", "chart", "graph", "time series"]
	if not any(keyword in image_description.lower() for keyword in keywords):
	return "The image is not related to the area this app covers. Please input a relevant image."

	try:
	chat_completion = client.chat.completions.create(
	messages=[
	{
	"role": "system",
	"content": "You are a professional econometrics. Write a complete review and report about the scene depicted in this image.",
	},
	{
	"role": "user",
	"content": image_description,
	}
	],
	model=llama31_model
	)
	return chat_completion.choices[0].message.content
	except Exception as e:
	return f"Error generating report: {str(e)}"

	# Main function for Gradio interface
	def process_image(api_key, image, prompt="Describe this image in detail."):
	# Set the API key
	try:
	os.environ["GROQ_API_KEY"] = api_key
	client = Groq() # Initialize the Groq client with the provided key
	except Exception as e:
	return "Please enter a correct API key and try again.", ""

	# Encode the image
	base64_image = encode_image(image)

	# Get image description from the model
	image_description = image_to_text(client, llava_model, base64_image, prompt)

	# If API key was invalid, only return the API key error message
	if "Please enter a correct API key and try again." in image_description:
	return image_description, ""

	# Generate the econometrics report based on the image description
	report = technical_review_generation(client, image_description)

	# Return both image description and the econometrics report
	return f"--- Image Description ---\n{image_description}", f"--- GroqLLaVAMA EconoMind Report ---\n{report}"

	# Define CSS for centering elements and footer styling
	css = """
	#title, #description {
	text-align: center;
	margin: 20px;
	}
	#footer {
	text-align: center;
	margin-top: 30px;
	padding: 10px;
	font-size: 14px;
	}
	.gradio-container {
	display: flex;
	flex-direction: column;
	align-items: center;
	}
	.gradio-row {
	width: 100%;
	display: flex;
	justify-content: center;
	}
	.clear-button {
	margin-top: 10px;
	}
	"""

	# Gradio Interface
	def gradio_interface():
	# Define the footer HTML
	footer = """
	<div id="footer">
	<a href="https://www.linkedin.com/in/pejman-ebrahimi-4a60151a7/" target="_blank">LinkedIn</a> \|
	<a href="https://github.com/arad1367" target="_blank">GitHub</a> \|
	<a href="https://arad1367.pythonanywhere.com/" target="_blank">Live demo of my PhD defense</a> \|
	<a href="https://groq.com/introducing-llava-v1-5-7b-on-groqcloud-unlocking-the-power-of-multimodal-ai/" target="_blank">Introducing LLaVA V1.5 7B on GroqCloud</a>
	<br>
	Made with 💖 by Pejman Ebrahimi
	</div>
	"""

	with gr.Blocks(theme="gradio/soft", css=css) as demo:
	gr.HTML("<h1 id='title'>GroqLLaVAMA Econometrics Agent</h1>")
	gr.HTML("<p id='description'>Upload an economic chart and get a detailed analysis using Groq + LLaVA V1.5 7B multimodal + llama-3.1-70b.</p>")
	gr.DuplicateButton(value="Duplicate Space for private use", elem_classes="duplicate-button")

	with gr.Row():
	api_key_input = gr.Textbox(label="GROQ API Key", placeholder="Enter your GROQ API Key", type="password")
	with gr.Row():
	image_input = gr.Image(type="filepath", label="Upload an Image") # Changed type to 'filepath'
	with gr.Row():
	report_button = gr.Button("Generate Report")
	with gr.Row():
	output_description = gr.Textbox(label="Image Description", lines=10, elem_id="description-box")
	output_report = gr.Textbox(label="Report", lines=10, elem_id="report-box")

	# Define the interaction between inputs and outputs
	report_button.click(
	fn=process_image,
	inputs=[api_key_input, image_input],
	outputs=[output_description, output_report]
	)

	# Add footer HTML
	gr.HTML(footer)

	# Add clear button
	def clear_inputs():
	return "", None, "", ""

	with gr.Row():
	clear_button = gr.Button("Clear", elem_id="clear-button")
	clear_button.click(
	fn=clear_inputs,
	inputs=[],
	outputs=[api_key_input, image_input, output_description, output_report]
	)

	# Launch the interface
	demo.launch()

	# Start the Gradio interface
	gradio_interface()