Spaces:

Ratnesh-dev
/

diarize

Running on Zero

App Files Files Community

Ratnesh-dev committed on Apr 8

Commit

1103803

1 Parent(s): 71acebe

Simplify API-only diarization inputs

Browse files

Files changed (1) hide show

app.py +2 -12

app.py CHANGED Viewed

@@ -102,7 +102,6 @@ def _normalize_audio(audio_path: str) -> str:
 def _run_diarization(
     audio_path: str,
     hf_token: str,
-    prefer_exclusive: bool,
 ) -> tuple[list[dict[str, Any]], str, str, float]:
     pipeline = get_pipeline(hf_token)
     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
@@ -124,7 +123,7 @@ def _run_diarization(
     annotation_label = "speaker_diarization"
     exclusive_annotation = getattr(output, "exclusive_speaker_diarization", None)
-    if prefer_exclusive and exclusive_annotation is not None:
         annotation = exclusive_annotation
         annotation_label = "exclusive_speaker_diarization"
@@ -173,7 +172,6 @@ def _write_artifacts(segments: list[dict[str, Any]], rttm_text: str) -> list[str
 def diarize(
     audio_path: str | None,
     hf_token: str | None,
-    prefer_exclusive: bool,
 ):
     if not audio_path:
         raise gr.Error("Upload or record an audio file first.")
@@ -190,7 +188,6 @@ def diarize(
     segments, rttm_text, annotation_label, zerogpu_seconds = _run_diarization(
         audio_path=normalized_audio_path,
         hf_token=resolved_token,
-        prefer_exclusive=prefer_exclusive,
     )
     if not segments:
@@ -251,7 +248,7 @@ def build_demo() -> gr.Blocks:
         with gr.Row():
             with gr.Column(scale=1):
                 audio_input = gr.Audio(
-                    sources=["upload", "microphone"],
                     type="filepath",
                     label="Audio",
                 )
@@ -260,12 +257,6 @@ def build_demo() -> gr.Blocks:
                     type="password",
                     placeholder="hf_xxx",
                 )
-                prefer_exclusive = gr.Checkbox(
-                    value=True,
-                    label="Prefer exclusive speaker diarization when available",
-                )
                 run_button = gr.Button("Run diarization", variant="primary")
             with gr.Column(scale=1):
@@ -284,7 +275,6 @@ def build_demo() -> gr.Blocks:
             inputs=[
                 audio_input,
                 token_input,
-                prefer_exclusive,
             ],
             outputs=[summary_output, zerogpu_seconds_output, segments_output, turns_output, files_output],
         )

 def _run_diarization(
     audio_path: str,
     hf_token: str,
 ) -> tuple[list[dict[str, Any]], str, str, float]:
     pipeline = get_pipeline(hf_token)
     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
     annotation_label = "speaker_diarization"
     exclusive_annotation = getattr(output, "exclusive_speaker_diarization", None)
+    if exclusive_annotation is not None:
         annotation = exclusive_annotation
         annotation_label = "exclusive_speaker_diarization"
 def diarize(
     audio_path: str | None,
     hf_token: str | None,
 ):
     if not audio_path:
         raise gr.Error("Upload or record an audio file first.")
     segments, rttm_text, annotation_label, zerogpu_seconds = _run_diarization(
         audio_path=normalized_audio_path,
         hf_token=resolved_token,
     )
     if not segments:
         with gr.Row():
             with gr.Column(scale=1):
                 audio_input = gr.Audio(
+                    sources=["upload"],
                     type="filepath",
                     label="Audio",
                 )
                     type="password",
                     placeholder="hf_xxx",
                 )
                 run_button = gr.Button("Run diarization", variant="primary")
             with gr.Column(scale=1):
             inputs=[
                 audio_input,
                 token_input,
             ],
             outputs=[summary_output, zerogpu_seconds_output, segments_output, turns_output, files_output],
         )