| import requests |
| from config import GROQ_API_KEY, GROQ_STT_MODEL |
|
|
| def speech_to_text(audio_file: str) -> str: |
| """ |
| Convert audio file to text using Groq's Whisper API (English only) |
| """ |
| if not GROQ_API_KEY: |
| raise RuntimeError("GROQ_API_KEY is not set in config") |
|
|
| url = "https://api.groq.com/openai/v1/audio/transcriptions" |
| |
| headers = { |
| "Authorization": f"Bearer {GROQ_API_KEY}" |
| } |
| |
| with open(audio_file, "rb") as audio_data: |
| files = { |
| "file": (audio_file, audio_data, "audio/wav") |
| } |
| data = { |
| "model": GROQ_STT_MODEL, |
| "language": "en", |
| "temperature": 0, |
| "response_format": "json" |
| } |
| |
| try: |
| response = requests.post(url, headers=headers, files=files, data=data, timeout=30) |
| response.raise_for_status() |
| |
| result = response.json() |
| return result.get("text", "") |
| |
| except requests.exceptions.RequestException as e: |
| raise Exception(f"Groq STT API error: {str(e)}") |
| except Exception as e: |
| raise Exception(f"Unexpected error in speech_to_text: {str(e)}") |