Spaces:

WajeehAzeemX
/

TashkeelAPI

Sleeping

WajeehAzeemX committed on Oct 16, 2024

Commit

7ea0248

verified ·

1 Parent(s): 76b2bae

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -33,14 +33,14 @@ async def transcribe_audio(request: Request):
         # Convert binary data to a file-like object
         audio_file = io.BytesIO(audio_data)
         # # Load the audio file using pydub
-        # audio_array, sampling_rate = librosa.load(audio_file, sr=16000)
         # # Process the audio array
         # input_features = processor(audio_array, sampling_rate=sampling_rate, return_tensors="pt").input_features
         # # Generate token ids
         # predicted_ids = model.generate(input_features)
         # # Decode token ids to text
         # transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
-        transcription = pipe(audio_file,generate_kwargs = {"task":"transcribe", "language":"<|ar|>"})
         # Print the transcription
         print(transcription)
         print(transcription[0])  # Display the transcription

         # Convert binary data to a file-like object
         audio_file = io.BytesIO(audio_data)
         # # Load the audio file using librosa
+        audio_array, sampling_rate = librosa.load(audio_file, sr=16000)
         # # Process the audio array
         # input_features = processor(audio_array, sampling_rate=sampling_rate, return_tensors="pt").input_features
         # # Generate token ids
         # predicted_ids = model.generate(input_features)
         # # Decode token ids to text
         # transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
+        transcription = pipe(audio_array,generate_kwargs = {"task":"transcribe", "language":"<|ar|>"})
         # Print the transcription
         print(transcription)
         print(transcription[0])  # Display the transcription