Spaces:

BeastGokul
/

Communication-coach

Runtime error

BeastGokul committed on Aug 28, 2025

Commit

b5712d1

verified ·

1 Parent(s): f6b0982

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -39,12 +39,6 @@ model_name = "BeastGokul/Nika-1.5B"
 llm_tokenizer = AutoTokenizer.from_pretrained(model_name)
 llm_model = AutoModelForCausalLM.from_pretrained(model_name)
-# Option 2: OpenAI Whisper for speech recognition
-whisper_processor = AutoProcessor.from_pretrained("openai/whisper-large-v3")
-whisper_model = AutoModelForSpeechSeq2Seq.from_pretrained("openai/whisper-large-v3")
-# Option 3: Wav2Vec2 for phoneme-level analysis
 # Automatically use GPU if available
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
@@ -120,8 +114,9 @@ def save_audio(audio, user_id="default"):
 # Audio processing and phonetic analysis
 def transcribe_with_whisper(audio_path):
-    """Transcribe audio using OpenAI's Whisper model"""
-    result = whisper_model.transcribe(audio_path)
     return result["text"]
 def extract_phonemes(text):

 llm_tokenizer = AutoTokenizer.from_pretrained(model_name)
 llm_model = AutoModelForCausalLM.from_pretrained(model_name)
 # Automatically use GPU if available
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # Audio processing and phonetic analysis
 def transcribe_with_whisper(audio_path):
+    """Transcribe audio using Hugging Face's pipeline for Whisper"""
+    asr_pipeline = pipeline("automatic-speech-recognition", model="openai/whisper-large-v3")
+    result = asr_pipeline(audio_path)
     return result["text"]
 def extract_phonemes(text):