Spaces:

mrbeliever
/

Im-prmpt

Running

App Files Community

mrbeliever committed on Dec 4, 2024

Commit

d5a06f6

•

1 Parent(s): 9a78687

Update app.py

Browse files

Files changed (1) hide show

app.py +53 -38

app.py CHANGED Viewed

@@ -1,27 +1,15 @@
-import os
-import base64
-import requests  # Import the requests module
-from PIL import Image
-from io import BytesIO
 import streamlit as st
-# Function to compress and resize the image before base64 encoding
-def compress_and_resize_image(image, max_size=(1024, 1024), quality=85):
-    img = Image.open(image)
-    img.thumbnail(max_size)  # Resize image while maintaining aspect ratio
-    byte_io = BytesIO()
-    img.save(byte_io, format="JPEG", quality=quality)  # Save with reduced quality
-    byte_io.seek(0)  # Make sure the pointer is at the beginning of the BytesIO buffer
-    return byte_io
-# Function to convert uploaded image to base64
 def convert_image_to_base64(image):
-    compressed_image = compress_and_resize_image(image)
-    image_bytes = compressed_image.read()  # Read from BytesIO before closing
     encoded_image = base64.b64encode(image_bytes).decode("utf-8")
     return encoded_image
-# Function to generate caption using Nebius API
 def generate_caption(encoded_image):
     API_URL = "https://api.studio.nebius.ai/v1/chat/completions"
     API_KEY = os.environ.get("NEBIUS_API_KEY")
@@ -32,7 +20,7 @@ def generate_caption(encoded_image):
     }
     payload = {
-        "model": "Qwen/Qwen2-VL-72B-Instruct",
         "messages": [
             {
                 "role": "system",
@@ -40,19 +28,20 @@ def generate_caption(encoded_image):
             },
             {
                 "role": "user",
-                "content": "Write a caption for this image"
-            },
-            {
-                "role": "user",
-                "content": f"data:image/png;base64,{encoded_image}"  # This is where the image is passed as base64 directly
             }
         ],
-        "temperature": 0
     }
-    # Send request to Nebius API
     response = requests.post(API_URL, headers=headers, json=payload)
     if response.status_code == 200:
         result = response.json()
         caption = result.get("choices", [{}])[0].get("message", {}).get("content", "No caption generated.")
@@ -61,32 +50,58 @@ def generate_caption(encoded_image):
         st.error(f"API Error {response.status_code}: {response.text}")
         return None
-# Streamlit app layout
 def main():
-    st.set_page_config(page_title="Image Caption Generator", layout="centered", initial_sidebar_state="collapsed")
-    st.title("🖼️ Image to Caption Generator")
-    uploaded_file = st.file_uploader("Upload an image", type=["jpg", "jpeg", "png"])
     if uploaded_file:
         # Display the uploaded image
         st.image(uploaded_file, caption="Uploaded Image", use_container_width=True)
         if st.button("Generate Caption"):
-            # Convert the uploaded image to base64
             with st.spinner("Generating caption..."):
                 encoded_image = convert_image_to_base64(uploaded_file)
-                # Debugging: Ensure the encoded image is valid and not too large
-                st.write(f"Encoded image length: {len(encoded_image)} characters")
-                # Get the generated caption from the API
                 caption = generate_caption(encoded_image)
                 if caption:
                     st.subheader("Generated Caption:")
                     st.text_area("", caption, height=100, key="caption_area")
-                    st.success("Caption generated successfully!")
 if __name__ == "__main__":
     main()

 import streamlit as st
+import requests
+import base64
+import os
+# Function to convert image to base64
 def convert_image_to_base64(image):
+    image_bytes = image.read()
     encoded_image = base64.b64encode(image_bytes).decode("utf-8")
     return encoded_image
+# Function to generate a caption using Nebius API
 def generate_caption(encoded_image):
     API_URL = "https://api.studio.nebius.ai/v1/chat/completions"
     API_KEY = os.environ.get("NEBIUS_API_KEY")
     }
     payload = {
+        "model": "llava-hf/llava-1.5-7b-hf",
         "messages": [
             {
                 "role": "system",
             },
             {
                 "role": "user",
+                "content": "write a detailed caption for this image"
             }
         ],
+        "image": {
+            "type": "image_url",
+            "image_url": {
+                "url": f"data:image/png;base64,{encoded_image}"
+            }
+        },
+        "temperature": 0.7
     }
     response = requests.post(API_URL, headers=headers, json=payload)
     if response.status_code == 200:
         result = response.json()
         caption = result.get("choices", [{}])[0].get("message", {}).get("content", "No caption generated.")
         st.error(f"API Error {response.status_code}: {response.text}")
         return None
+# Streamlit app
 def main():
+    st.set_page_config(page_title="Image to Caption Converter", layout="centered", initial_sidebar_state="collapsed")
+    # Gradient background style
+    st.markdown("""
+        <style>
+            body {
+                background: linear-gradient(135deg, #1e3c72, #2a5298);
+                color: white;
+                font-family: 'Arial', sans-serif;
+            }
+            .uploaded-image {
+                max-width: 100%;
+                border: 2px solid #ffffff;
+                border-radius: 10px;
+            }
+            .copy-button {
+                background-color: #ff8800;
+                color: white;
+                border: none;
+                border-radius: 5px;
+                padding: 10px 15px;
+                cursor: pointer;
+            }
+            .copy-button:hover {
+                background-color: #cc6b00;
+            }
+        </style>
+    """, unsafe_allow_html=True)
+    st.title("🖼️ Image to Caption Converter")
+    uploaded_file = st.file_uploader("Upload an image", type=["jpg", "jpeg", "png"])
     if uploaded_file:
         # Display the uploaded image
         st.image(uploaded_file, caption="Uploaded Image", use_container_width=True)
+        # Convert image to base64 and get caption
         if st.button("Generate Caption"):
             with st.spinner("Generating caption..."):
                 encoded_image = convert_image_to_base64(uploaded_file)
                 caption = generate_caption(encoded_image)
                 if caption:
                     st.subheader("Generated Caption:")
                     st.text_area("", caption, height=100, key="caption_area")
+                    # Copy button
+                    if st.button("Copy to Clipboard"):
+                        st.code(caption, language="text")
+                        st.success("Caption copied to clipboard!")
 if __name__ == "__main__":
     main()