import asyncio

from services.gemini_client import get_gemini_client
async def speech_to_text(audio_bytes: bytes) -> str:
    """Send audio to the Gemini model and return the text of its response.

    Args:
        audio_bytes: Raw audio payload; it is sent labelled with the MIME
            type ``audio/wav``.

    Returns:
        The response text, or an empty string when ``audio_bytes`` is empty
        or the response carries no text.
    """
    # Nothing to send: skip the client call entirely.
    if not audio_bytes:
        return ""

    client = get_gemini_client()

    # NOTE(review): no text instruction accompanies the audio, so this relies
    # on the model transcribing by default -- confirm that is intended.
    # NOTE(review): the payload shape below is kept exactly as it was; verify
    # it against the SDK that get_gemini_client() actually returns.
    #
    # generate_content returns its result synchronously (it is not awaited),
    # so run it in a worker thread to keep the event loop free while the
    # request (presumably a network round trip) is in flight.
    response = await asyncio.to_thread(
        client.models.generate_content,
        model="gemini-2.5-flash",
        contents=[{"mime_type": "audio/wav", "data": audio_bytes}],
    )

    # Honour the declared ``-> str`` return type even if the response has no
    # text attached.
    return response.text or ""