Spaces:

matejmicek
/

attentionborrow

Sleeping

App Files Files Community

matejmicek commited on Nov 17, 2023

Commit

bb971e5

1 Parent(s): b58467b

Create app.py

Browse files

Files changed (1) hide show

app.py +108 -0

app.py ADDED Viewed

	@@ -0,0 +1,108 @@

+import streamlit as st
+import os
+from openai import OpenAI
+import openai
+import base64
+import time
+import errno
+from elevenlabs import generate, play, voices
+from elevenlabs import voices, set_api_key
+set_api_key("8f73d4bd2ab582e4950964e5ecb12aaa")
+voice = voices()[-1]
+client = OpenAI(api_key='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')
+def encode_image(image_path):
+    while True:
+        try:
+            with open(image_path, "rb") as image_file:
+                return base64.b64encode(image_file.read()).decode("utf-8")
+        except IOError as e:
+            if e.errno != errno.EACCES:
+                # Not a "file in use" error, re-raise
+                raise
+            # File is being written to, wait a bit and retry
+            time.sleep(0.1)
+def generate_new_line(base64_image):
+    return [
+        {
+            "role": "user",
+            "content": [
+                {"type": "text", "text": "Describe this image"},
+                {
+                    "type": "image_url",
+                    "image_url": f"data:image/jpeg;base64,{base64_image}",
+                },
+            ],
+        },
+    ]
+def analyze_image(base64_image):
+    response = client.chat.completions.create(
+        model="gpt-4-vision-preview",
+        messages=[
+            {
+                "role": "system",
+                "content": """
+                You are Sir David Attenborough. Narrate the picture of the human as if it is a nature documentary.
+                Make it snarky and funny. Don't repeat yourself. Make it short. If I do anything remotely interesting, make a big deal about it!
+                """,
+            },
+        ]
+        + generate_new_line(base64_image),
+        max_tokens=500,
+    )
+    response_text = response.choices[0].message.content
+    return response_text
+from io import BytesIO
+import os
+def save_uploaded_file(uploaded_file):
+    # Create a directory to save the file
+    save_path = 'uploaded_images'
+    if not os.path.exists(save_path):
+        os.makedirs(save_path)
+    # Save the file
+    with open(os.path.join(save_path, 'temp'), "wb") as f:
+        f.write(uploaded_file.getbuffer())
+    return os.path.join(save_path, 'temp')
+def process():
+    pass # Assuming 'process' is defined in 'your_processing_module'
+def main():
+    st.title("Image to Audio Converter")
+    # Image upload
+    uploaded_file = st.file_uploader("Choose an image...", type=["jpg", "png", "jpeg"])
+    if uploaded_file:
+        path = save_uploaded_file(uploaded_file)
+        print(f'file saved to {path}')
+        encoded_image = encode_image(path)
+        print('image encoded')
+        analyzed_image = analyze_image(encoded_image)
+        print('image analyzed \n' + analyzed_image)
+        audio_file = generate(text=analyzed_image, voice=voice, model="eleven_turbo_v2")
+        if audio_file is not None:
+            st.audio(audio_file, format='audio/mp3')
+            st.download_button('Download Audio', audio_file, file_name='narrated.mp3')
+if __name__ == "__main__":
+    main()