pixtral / app.py
bjoernix's picture
Update app.py
6bb6794 verified
raw
history blame
2.49 kB
import base64
import requests
from io import BytesIO
from PIL import Image
import gradio as gr
def encode_image(img):
buffered = BytesIO()
img.save(buffered, format="PNG")
encoded_string = base64.b64encode(buffered.getvalue()).decode("utf-8")
return encoded_string
def chat_with_pixtral(uploaded_file, user_question):
if uploaded_file is not None:
# uploaded_file ist bereits ein PIL-Bildobjekt.
base64_img = encode_image(uploaded_file)
api = "https://api.hyperbolic.xyz/v1/chat/completions"
api_key = "eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJzdWIiOiJyZzMyNzAyNEBnbWFpbC5jb20ifQ._frFve-BYZdb0Qo6FIj6xcDcxpY-6QlC2O-ToQxBjkc" # 여기에 API 키를 입력하세요
headers = {
"Content-Type": "application/json",
"Authorization": f"Bearer {api_key}",
}
payload = {
"messages": [
{
"role": "user",
"content": [
{"type": "text", "text": user_question}, # Vom Benutzer eingegebene Fragen
{
"type": "image_url",
"image_url": {"url": f"data:image/jpeg;base64,{base64_img}"},
},
],
}
],
"model": "mistralai/Pixtral-12B-2409",
"max_tokens": 2048,
"temperature": 0.7,
"top_p": 0.9,
}
response = requests.post(api, headers=headers, json=payload)
# Prüfen der API-Antwort
if response.status_code == 200:
response_data = response.json()
if 'choices' in response_data:
assistant_response = response_data['choices'][0]['message']['content']
else:
assistant_response = "Antwortformat ist falsch."
else:
assistant_response = f"Fehlerhafte API-Anforderung: {response.status_code} - {response.text}"
return assistant_response
return "Laden Sie ein Bild hoch und geben Sie Ihre Frage ein."
# Gradio Einstellungen der Schnittstelle
iface = gr.Interface(
fn=chat_with_pixtral,
inputs=[
gr.Image(type="pil", label="Ein Bild hochladen"),
gr.Textbox(label="Ihre Frage eingeben")
],
outputs="text",
title="Pixtral Image Chat",
description="Lade ein Bild hoch und gib deine Frage ein, um mit Pixtral zu sprechen."
)
iface.launch(share=True)