Spaces:

matejmicek
/

attentionborrow

Sleeping

App Files Files Community

attentionborrow / app.py

matejmicek

Create app.py

bb971e5 11 months ago

raw

history blame

No virus

3.06 kB

	import streamlit as st


	import os
	from openai import OpenAI
	import openai
	import base64

	import time
	import errno
	from elevenlabs import generate, play, voices


	from elevenlabs import voices, set_api_key
	# Credentials are read from the environment so that no secret is committed
	# with the source. Both ELEVENLABS_API_KEY and OPENAI_API_KEY must be set
	# before the app starts; a missing variable fails fast with a KeyError.
	# NOTE: the keys that used to be hard-coded here were published with the
	# file and should be revoked.
	set_api_key(os.environ["ELEVENLABS_API_KEY"])

	# Narration uses the last entry of whatever voices() returns for the account.
	voice = voices()[-1]

	client = OpenAI(api_key=os.environ["OPENAI_API_KEY"])


	def encode_image(image_path, max_retries=50, retry_delay=0.1):
	    """Return the contents of *image_path* as a base64-encoded string.

	    A permission error (``errno.EACCES``) is treated as "the file is still
	    being written": the read is retried after ``retry_delay`` seconds, at
	    most ``max_retries`` times, so a file that never becomes readable no
	    longer blocks the caller forever.

	    Args:
	        image_path: Path of the file to read.
	        max_retries: How many times to retry after an ``EACCES`` failure.
	        retry_delay: Seconds to sleep between attempts.

	    Returns:
	        The file's bytes, base64-encoded and decoded to ``str`` as UTF-8.

	    Raises:
	        OSError: Immediately for any error other than ``EACCES``, or for
	            ``EACCES`` once all retries have been used up.
	    """
	    retries_left = max_retries
	    while True:
	        try:
	            with open(image_path, "rb") as image_file:
	                return base64.b64encode(image_file.read()).decode("utf-8")
	        except OSError as e:
	            # Anything other than "permission denied" is a real failure, and
	            # so is a permission error that outlives the retry budget.
	            if e.errno != errno.EACCES or retries_left <= 0:
	                raise
	            retries_left -= 1
	        # File is presumably still being written; wait a bit and retry.
	        time.sleep(retry_delay)


	def generate_new_line(base64_image):
	    """Build the user turn that asks the model to describe an image.

	    The image is embedded as a ``data:image/jpeg;base64,...`` URL made from
	    *base64_image*. The result is a one-element list holding a single
	    ``user`` message with a text part followed by an image part.

	    NOTE(review): the MIME type is always ``image/jpeg`` regardless of the
	    actual image format - confirm this is acceptable for PNG input.
	    """
	    text_part = {"type": "text", "text": "Describe this image"}
	    image_part = {
	        "type": "image_url",
	        "image_url": f"data:image/jpeg;base64,{base64_image}",
	    }
	    user_message = {"role": "user", "content": [text_part, image_part]}
	    return [user_message]

	def analyze_image(base64_image):
	    """Send the image to the chat-completions API and return the reply text.

	    The request is a system message carrying the narrator persona followed
	    by the user message produced by ``generate_new_line(base64_image)``. It
	    goes to the ``gpt-4-vision-preview`` model with a 500-token cap, and
	    the content of the first returned choice is handed back.
	    """
	    narrator_prompt = """
	You are Sir David Attenborough. Narrate the picture of the human as if it is a nature documentary.
	Make it snarky and funny. Don't repeat yourself. Make it short. If I do anything remotely interesting, make a big deal about it!
	"""
	    system_message = {"role": "system", "content": narrator_prompt}
	    conversation = [system_message] + generate_new_line(base64_image)

	    completion = client.chat.completions.create(
	        model="gpt-4-vision-preview",
	        messages=conversation,
	        max_tokens=500,
	    )
	    return completion.choices[0].message.content


	from io import BytesIO
	import os

	def save_uploaded_file(uploaded_file):
	    """Write an uploaded file to ``uploaded_images/temp`` and return that path.

	    The target directory is created when missing. The file name is fixed,
	    so every call overwrites whatever an earlier call stored.

	    Args:
	        uploaded_file: Object exposing ``getbuffer()`` that yields the bytes
	            to write.

	    Returns:
	        The relative path of the written file.
	    """
	    save_dir = 'uploaded_images'
	    # exist_ok=True replaces the separate exists() check, which could fail if
	    # the directory appeared between the check and the makedirs() call.
	    os.makedirs(save_dir, exist_ok=True)

	    target_path = os.path.join(save_dir, 'temp')
	    with open(target_path, "wb") as f:
	        f.write(uploaded_file.getbuffer())

	    return target_path

	def process():
	    """Placeholder that does nothing and returns ``None``.

	    NOTE(review): the original comment suggests the real implementation is
	    expected to come from 'your_processing_module' - confirm whether this
	    stub is still needed.
	    """
	    return None

	def main():
	    """Render the Streamlit page that turns an uploaded image into narration.

	    Once a file is uploaded it is saved to disk, base64-encoded, described
	    by ``analyze_image`` and passed to ``generate`` for speech synthesis.
	    If audio comes back, an audio player and a download button are shown.
	    Progress messages are printed to stdout along the way.
	    """
	    st.title("Image to Audio Converter")

	    # Image upload
	    upload = st.file_uploader("Choose an image...", type=["jpg", "png", "jpeg"])
	    if not upload:
	        # Nothing has been uploaded yet, so there is nothing to narrate.
	        return

	    saved_path = save_uploaded_file(upload)
	    print(f'file saved to {saved_path}')

	    image_b64 = encode_image(saved_path)
	    print('image encoded')

	    narration = analyze_image(image_b64)
	    print('image analyzed \n' + narration)

	    narration_audio = generate(text=narration, voice=voice, model="eleven_turbo_v2")
	    if narration_audio is None:
	        return

	    st.audio(narration_audio, format='audio/mp3')
	    st.download_button('Download Audio', narration_audio, file_name='narrated.mp3')


	# Run the page only when this file is executed as the main script.
	if __name__ == "__main__":
	    main()