malek-messaoudii
Refactor audio models and services for improved error handling and response streaming
9aa985d
raw
history blame
499 Bytes
from services.gemini_client import get_gemini_client
from google.genai import types
async def speech_to_text(
    audio_bytes: bytes, *, mime_type: str = "audio/wav"
) -> str:
    """Transcribe speech audio to text using the Gemini API.

    Args:
        audio_bytes: Raw encoded audio to transcribe.
        mime_type: MIME type describing ``audio_bytes``. Defaults to
            ``"audio/wav"``, the value this function always used before.

    Returns:
        The text produced by the model, or an empty string when the
        response carries no text.

    Raises:
        ValueError: If ``audio_bytes`` is empty.
    """
    # Fail fast instead of spending a network round trip on empty audio.
    if not audio_bytes:
        raise ValueError("audio_bytes must not be empty")

    # NOTE(review): assumes get_gemini_client() returns a google.genai.Client
    # (it is used as one below) -- confirm against services.gemini_client.
    client = get_gemini_client()

    # Inline bytes must be sent as a Part; types.File only describes files
    # that were uploaded through the Files API and has no `data` field.
    audio_part = types.Part.from_bytes(data=audio_bytes, mime_type=mime_type)

    # Without an explicit instruction the model is free to answer or describe
    # the audio rather than transcribe it.
    prompt = (
        "Transcribe the speech in this audio. "
        "Return only the transcript text."
    )

    # Use the async client surface so this coroutine does not block the
    # event loop while waiting on the API.
    response = await client.aio.models.generate_content(
        model="gemini-2.5-flash",
        contents=[prompt, audio_part],
    )

    # response.text can be None (e.g. no text parts); honor the `-> str`
    # contract instead of leaking None to callers.
    return response.text or ""