Spaces:

Sapna36
/

AI_Translator

Sleeping

App Files Files Community

Sapna36 committed on Feb 19, 2025

Commit

3597254

verified ·

1 Parent(s): ba61a38

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -15

app.py CHANGED Viewed

@@ -3,29 +3,28 @@ import requests
 from gtts import gTTS
 import os
 import uuid
-# Set your Groq API key
-GROQ_API_KEY = "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"  # 🔹 Replace with your actual key
 GROQ_API_URL = "https://api.groq.com/v1/chat/completions"
 # Function to process audio and return translated speech
-def voice_to_voice(audio):
-    if not audio:
         return "No audio received", None
-    # Save audio file
-    audio_path = f"input_{uuid.uuid4()}.wav"
-    with open(audio_path, "wb") as f:
-        f.write(audio)
     # Transcribe using Groq API
     headers = {"Authorization": f"Bearer {GROQ_API_KEY}"}
     data = {
-        "model": "llama3-8b",  # Adjust based on your Groq model availability
-        "messages": [{"role": "user", "content": "Transcribe this audio: " + audio_path}],
         "max_tokens": 100
     }
     response = requests.post(GROQ_API_URL, json=data, headers=headers)
     transcription = response.json().get("choices", [{}])[0].get("message", {}).get("content", "")
@@ -39,10 +38,10 @@ def voice_to_voice(audio):
     # Translate text using Groq API
     translate_data = {
         "model": "llama3-8b",
-        "messages": [{"role": "user", "content": f"Translate this from {source_lang} to {target_lang}: {transcription}"}],
         "max_tokens": 100
     }
     translate_response = requests.post(GROQ_API_URL, json=translate_data, headers=headers)
     translated_text = translate_response.json().get("choices", [{}])[0].get("message", {}).get("content", "")
@@ -59,8 +58,8 @@ def voice_to_voice(audio):
 # Gradio Interface
 with gr.Blocks() as demo:
     gr.Markdown("### 🎙️ **Urdu ↔ Pashto Real-Time Voice Translator**")
-    audio_input = gr.Audio(source="microphone", type="filepath", label="🎤 Speak Now")
     translated_text = gr.Textbox(label="📝 Translated Text")
     audio_output = gr.Audio(label="🔊 Translated Voice")
@@ -69,3 +68,4 @@ with gr.Blocks() as demo:
 demo.launch()

 from gtts import gTTS
 import os
 import uuid
+import soundfile as sf
+# Groq API key
+GROQ_API_KEY = "your-groq-api-key"  # 🔹 Replace this with your API key
 GROQ_API_URL = "https://api.groq.com/v1/chat/completions"
 # Function to process audio and return translated speech
+def voice_to_voice(audio_path):
+    if not audio_path:
         return "No audio received", None
+    # Read audio file
+    audio_data, samplerate = sf.read(audio_path)
     # Transcribe using Groq API
     headers = {"Authorization": f"Bearer {GROQ_API_KEY}"}
     data = {
+        "model": "llama3-8b",
+        "messages": [{"role": "user", "content": f"Transcribe this audio file: {audio_path}"}],
         "max_tokens": 100
     }
     response = requests.post(GROQ_API_URL, json=data, headers=headers)
     transcription = response.json().get("choices", [{}])[0].get("message", {}).get("content", "")
     # Translate text using Groq API
     translate_data = {
         "model": "llama3-8b",
+        "messages": [{"role": "user", "content": f"Translate from {source_lang} to {target_lang}: {transcription}"}],
         "max_tokens": 100
     }
     translate_response = requests.post(GROQ_API_URL, json=translate_data, headers=headers)
     translated_text = translate_response.json().get("choices", [{}])[0].get("message", {}).get("content", "")
 # Gradio Interface
 with gr.Blocks() as demo:
     gr.Markdown("### 🎙️ **Urdu ↔ Pashto Real-Time Voice Translator**")
+    audio_input = gr.Audio(type="filepath", label="🎤 Speak Now")
     translated_text = gr.Textbox(label="📝 Translated Text")
     audio_output = gr.Audio(label="🔊 Translated Voice")
 demo.launch()