import asyncio

from services.gemini_client import get_gemini_client

# Model and payload settings used for every transcription request.
_MODEL_NAME = "gemini-2.5-flash"
_AUDIO_MIME_TYPE = "audio/wav"


async def speech_to_text(audio_bytes: bytes) -> str:
    """Send audio to the Gemini model and return the text of its response.

    The audio is submitted as a single content item labelled ``audio/wav``.
    The underlying ``generate_content`` call is synchronous, so it is run in
    a worker thread to keep the event loop free while the request is in
    flight.

    Args:
        audio_bytes: Raw audio payload; sent as-is with the ``audio/wav``
            MIME type.

    Returns:
        The ``text`` attribute of the model response, or an empty string
        when the response carries no text.

    Raises:
        Whatever ``get_gemini_client`` or ``generate_content`` raise is
        propagated unchanged.
    """
    client = get_gemini_client()

    # NOTE(review): no text instruction accompanies the audio, so the model
    # is not explicitly asked to transcribe -- confirm this is intended.
    # NOTE(review): the flat {"mime_type", "data"} item shape is kept exactly
    # as before; verify it matches what the installed SDK version expects
    # for inline audio.
    contents = [
        {
            "mime_type": _AUDIO_MIME_TYPE,
            "data": audio_bytes,
        }
    ]

    # generate_content blocks on network I/O; calling it directly inside a
    # coroutine would stall every other task on the loop.
    response = await asyncio.to_thread(
        client.models.generate_content,
        model=_MODEL_NAME,
        contents=contents,
    )

    # response.text may be None when no text part is returned; honour the
    # declared ``str`` return type.
    return response.text or ""