Capstone04
/

Bootstrapping

Automatic Speech Recognition

speaker-diarization

Model card · Files and versions

Capstone04 committed on Oct 9, 2025

Commit

639e330

·

verified ·

1 Parent(s): 37111fb

Upload folder using huggingface_hub

Files changed (1) hide show

asr_diarization/pipeline.py +4 -4

asr_diarization/pipeline.py CHANGED Viewed

@@ -66,16 +66,16 @@ class ASR_Diarization:
                 for word_info in result["chunks"]:
                     start_ts, end_ts = word_info.get("timestamp", (None, None)) or (None, None)
                     tokens.append({
                         "start": start_ts,
                         "end": end_ts,
-                        "text": word_info["text"],
-                        "tag": "w"
                     })
             seg_dict = {
                 "speaker": spk,
-                "start": start,
-                "end": end,
                 "tokens": tokens
             }
             merged_segments.append(seg_dict)

                 for word_info in result["chunks"]:
                     start_ts, end_ts = word_info.get("timestamp", (None, None)) or (None, None)
                     tokens.append({
+                        "tag": "w",
                         "start": start_ts,
                         "end": end_ts,
+                        "text": word_info["text"]
                     })
             seg_dict = {
                 "speaker": spk,
+                "segment_start": start,
+                "segment_end": end,
                 "tokens": tokens
             }
             merged_segments.append(seg_dict)