Spaces:

MicroHealth
/

AV-to-transcripts

Paused

App Files Community

bluenevus committed on Apr 26, 2025

Commit

dce154d

verified ·

1 Parent(s): 4e7ec06

Update app.py

Browse files

Files changed (1) hide show

app.py +19 -12

app.py CHANGED Viewed

@@ -71,13 +71,17 @@ app.layout = dbc.Container([
 def transcribe_and_diarize_audio(contents, filename):
     global generated_file, transcription_text
     try:
         content_type, content_string = contents.split(',')
         decoded = base64.b64decode(content_string)
-        with tempfile.NamedTemporaryFile(delete=False, suffix=os.path.splitext(filename)[1]) as temp_audio_file:
-            temp_audio_file.write(decoded)
-            temp_audio_file_path = temp_audio_file.name
         logger.info(f"File uploaded: {temp_audio_file_path}")
@@ -90,12 +94,14 @@ def transcribe_and_diarize_audio(contents, filename):
             audio.export(wav_path, format="wav")
             with open(wav_path, "rb") as audio_file:
                 transcript = openai.Audio.transcribe("whisper-1", audio_file)
-            transcription_text = transcript["text"]
-            # Perform diarization (speaker separation)
-            diarized_transcript = openai.Audio.transcribe("whisper-1", audio_file, speaker_detection=2)
             # Format the diarized transcript
             formatted_transcript = ""
@@ -114,10 +120,11 @@ def transcribe_and_diarize_audio(contents, filename):
         logger.error(f"Error during transcription and diarization: {str(e)}")
         return f"An error occurred during transcription and diarization: {str(e)}", False
     finally:
-        if os.path.exists(temp_audio_file_path):
-            os.unlink(temp_audio_file_path)
-        if os.path.exists(wav_path):
-            os.unlink(wav_path)
 @app.callback(
     [Output('output-audio-upload', 'children'),

 def transcribe_and_diarize_audio(contents, filename):
     global generated_file, transcription_text
+    temp_audio_file = None
+    wav_file = None
     try:
         content_type, content_string = contents.split(',')
         decoded = base64.b64decode(content_string)
+        # Create a temporary file that won't be immediately deleted
+        temp_audio_file = tempfile.NamedTemporaryFile(delete=False, suffix=os.path.splitext(filename)[1])
+        temp_audio_file.write(decoded)
+        temp_audio_file.close()  # Close the file but don't delete it yet
+        temp_audio_file_path = temp_audio_file.name
         logger.info(f"File uploaded: {temp_audio_file_path}")
             audio.export(wav_path, format="wav")
             with open(wav_path, "rb") as audio_file:
+                # Transcribe
                 transcript = openai.Audio.transcribe("whisper-1", audio_file)
+                # Rewind the file for diarization
+                audio_file.seek(0)
+                # Perform diarization (speaker separation)
+                diarized_transcript = openai.Audio.transcribe("whisper-1", audio_file, speaker_detection=2)
             # Format the diarized transcript
             formatted_transcript = ""
         logger.error(f"Error during transcription and diarization: {str(e)}")
         return f"An error occurred during transcription and diarization: {str(e)}", False
     finally:
+        # Clean up temporary files
+        if temp_audio_file:
+            os.unlink(temp_audio_file.name)
+        if wav_file:
+            os.unlink(wav_file)
 @app.callback(
     [Output('output-audio-upload', 'children'),