"""Transcribe a sample WAV file with pywhispercpp and print timed segments.

The script reads the audio with ``soundfile``, loads the Whisper model named
in ``config`` and prints one line per returned segment:
``<start timestamp> <end timestamp> <text>``.
"""

import soundfile
from pywhispercpp.model import Model
from pywhispercpp.utils import to_timestamp

import config

AUDIO_PATH = "test/6_before_cut_56640.wav"

# whisper.cpp works on PCM sampled at a fixed 16 kHz (WHISPER_SAMPLE_RATE).
EXPECTED_SAMPLE_RATE = 16000

# Read the raw waveform (not a mel spectrogram) as float32, the sample type
# whisper.cpp operates on, and keep the file's sample rate so it can be
# checked instead of silently discarded.
audio, sample_rate = soundfile.read(AUDIO_PATH, dtype="float32")

# Fail fast: audio at another rate or with several channels would be
# transcribed without any error but with wrong text and timestamps.
if sample_rate != EXPECTED_SAMPLE_RATE:
    raise ValueError(
        f"{AUDIO_PATH}: expected {EXPECTED_SAMPLE_RATE} Hz audio, "
        f"got {sample_rate} Hz"
    )
if audio.ndim != 1:
    raise ValueError(
        f"{AUDIO_PATH}: expected mono audio, got array of shape {audio.shape}"
    )

models_dir = config.MODEL_DIR.as_posix()
model = Model(
    model=config.WHISPER_MODEL,
    models_dir=models_dir,
    n_threads=4,
    # Keep the library quiet; segments are printed explicitly below.
    print_realtime=False,
    print_progress=False,
    print_timestamps=False,
    translate=False,
    temperature=0.0,
    no_context=True,
)

# Debug aid: show how many samples were loaded and their dtype.
print(audio.shape, audio.dtype)

# NOTE(review): token_timestamps=True with max_len=1 presumably forces very
# short (roughly per-token) segments - confirm this is the intended output.
segments = model.transcribe(
    audio,
    language="en",
    token_timestamps=True,
    max_len=1,
)

for segment in segments:
    print(to_timestamp(segment.t0), to_timestamp(segment.t1), segment.text)