Spaces:

Kquan
/

SD

Sleeping

Kquan committed on Nov 13

Commit

6af24e4

verified ·

1 Parent(s): 2692919

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -8,17 +8,14 @@ pipeline = Pipeline.from_pretrained(
     "pyannote/speaker-diarization-community-1", token=os.getenv('HF_TOKEN')
 )
-def diarize(audio_file):
     """
     Perform speaker diarization on uploaded audio file.
     """
-    # Save uploaded audio to temp file
-    with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp:
-        tmp.write(audio_file.read())
-        tmp_path = tmp.name
     # Run diarization
-    diarization = pipeline(tmp_path)
     # Collect readable results
     results = []
@@ -27,8 +24,6 @@ def diarize(audio_file):
             f"{speaker}: {turn.start:.1f}s → {turn.end:.1f}s"
         )
-    # Clean up
-    os.remove(tmp_path)
     return "\n".join(results)
@@ -36,7 +31,7 @@ def diarize(audio_file):
 # 🎛️ Gradio interface
 demo = gr.Interface(
     fn=diarize,
-    inputs=gr.Audio(type="file", label="Upload Audio (.wav)"),
     outputs=gr.Textbox(label="Speaker Segments"),
     title="🎙️ Speaker Diarization Demo",
     description="Upload an audio file and detect who speaks when using Pyannote Audio."

     "pyannote/speaker-diarization-community-1", token=os.getenv('HF_TOKEN')
 )
+def diarize(audio_file_path):
     """
     Perform speaker diarization on uploaded audio file.
     """
     # Run diarization
+    diarization = pipeline(audio_file_path)
     # Collect readable results
     results = []
             f"{speaker}: {turn.start:.1f}s → {turn.end:.1f}s"
         )
     return "\n".join(results)
 # 🎛️ Gradio interface
 demo = gr.Interface(
     fn=diarize,
+    inputs=gr.Audio(type="filepath", label="Upload Audio (.wav)"),
     outputs=gr.Textbox(label="Speaker Segments"),
     title="🎙️ Speaker Diarization Demo",
     description="Upload an audio file and detect who speaks when using Pyannote Audio."