File size: 687 Bytes
0b3a48c
 
 
c710b8a
0b3a48c
 
 
 
 
 
 
 
 
 
 
 
c710b8a
0b3a48c
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
import os
from .pipeline import ASR_Diarization


import json
import numpy as np

def load_known_embeddings(path="known_speakers.json"):
    """Load named embedding vectors from a JSON file.

    The file must contain a single JSON object whose values are lists of
    numbers; each list is converted to a ``float32`` NumPy array and stored
    under its original key.

    Args:
        path: Location of the JSON file. The default is a relative path, so
            it is resolved against the current working directory.

    Returns:
        A dict mapping each key of the JSON object to an ``np.float32``
        array, or an empty dict when ``path`` does not exist.

    Raises:
        json.JSONDecodeError: If the file exists but is not valid JSON.
    """
    if not os.path.exists(path):
        return {}
    # JSON text is UTF-8 by specification. Pin the encoding so keys with
    # non-ASCII characters decode identically on every platform instead of
    # depending on the locale's default codec.
    with open(path, "r", encoding="utf-8") as f:
        raw = json.load(f)
    return {name: np.array(emb, dtype=np.float32) for name, emb in raw.items()}

# Module-level setup: everything below runs once, at import time.

# Read the token from the environment; ``.get`` yields None when it is unset.
HF_TOKEN = os.environ.get("HF_TOKEN")

# Loaded from the default path; an empty dict when that file is absent.
known_embeddings = load_known_embeddings()

# Single shared pipeline instance used by the inference helpers below.
pipe = ASR_Diarization(HF_TOKEN)

def inference(inputs):
    """Run the module-level pipeline on ``inputs`` and return its output.

    Args:
        inputs: Passed through unchanged to ``pipe``.

    Returns:
        Whatever ``pipe(inputs)`` returns.
    """
    output = pipe(inputs)
    return output

def inference_with_eval(inputs, output_dir, base_name, ref_rttm=None, ref_json=None):
    """Run the pipeline on ``inputs``, then invoke its evaluation step.

    Args:
        inputs: Passed through unchanged to ``pipe``.
        output_dir: Forwarded to ``pipe.evaluate`` as its first argument.
        base_name: Forwarded to ``pipe.evaluate`` as its second argument.
        ref_rttm: Optional; forwarded to ``pipe.evaluate`` (default None).
        ref_json: Optional; forwarded to ``pipe.evaluate`` (default None).

    Returns:
        The value returned by ``pipe(inputs)``. The return value of
        ``pipe.evaluate`` is discarded.
    """
    prediction = pipe(inputs)
    # Evaluation is called only after inference has completed.
    # NOTE(review): presumably evaluate() relies on state left by the call
    # above — confirm against the pipeline implementation.
    pipe.evaluate(output_dir, base_name, ref_rttm, ref_json)
    return prediction