How to use G-Root/speaker-diarization-optimized with pyannote.audio:
# Usage example: run the pretrained pipeline on a whole audio file and on
# an excerpt of it. "file.wav" is a placeholder path; substitute your own.
from pyannote.audio import Audio
from pyannote.audio import Pipeline
from pyannote.core import Segment

# Load the pretrained pipeline by its model identifier.
pipeline = Pipeline.from_pretrained("G-Root/speaker-diarization-optimized")

# inference on the whole file
pipeline("file.wav")

# inference on an excerpt
excerpt = Segment(start=2.0, end=5.0)

# Crop the excerpt out of the file, then hand the in-memory audio to the
# pipeline as a {"waveform", "sample_rate"} mapping instead of a file path.
waveform, sample_rate = Audio().crop("file.wav", excerpt)
pipeline({"waveform": waveform, "sample_rate": sample_rate})