Spaces:

OvozifyLabs
/

STT-whisper-small

Running

Firdavs222 committed 17 days ago

Commit

a22c154

verified ·

1 Parent(s): 44ebbba

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -143,12 +143,17 @@ def transcribe_audio(audio_file_path):
         # Move inputs to the appropriate device
         input_features = inputs.input_features.to(device)
         with torch.no_grad():
-            # Use generation arguments to specify language and task for the Uz-Small model
             predicted_ids = model.generate(
-                input_features,
-                forced_decoder_ids=processor.get_decoder_prompt_ids(language="uz", task="transcribe"),
-                max_length=448 # Use a reasonable max length for speed/resource management
             )
         # Decode the generated token IDs to get the text transcript

         # Move inputs to the appropriate device
         input_features = inputs.input_features.to(device)
+        forced_ids = processor.get_decoder_prompt_ids(language="uz", task="transcribe")
+        gen_config = GenerationConfig(
+            forced_decoder_ids=forced_ids,
+            max_length=448
+        )
         with torch.no_grad():
             predicted_ids = model.generate(
+                input_features,
+                generation_config=gen_config
             )
         # Decode the generated token IDs to get the text transcript