Xin Zhang
committed on
Commit
·
70b1d55
1
Parent(s):
38a440e
[fix]: opt parameter.
Browse files
transcribe/helpers/funasr.py
CHANGED
|
@@ -24,7 +24,7 @@ class FunASR:
|
|
| 24 |
def warmup(self, warmup_steps=1):
|
| 25 |
warmup_soundfile = f"{config.ASSERT_DIR}/jfk.flac"
|
| 26 |
for _ in range(warmup_steps):
|
| 27 |
-
self.model.generate(input=warmup_soundfile)
|
| 28 |
|
| 29 |
def transcribe(self, audio_buffer: bytes, language):
|
| 30 |
audio_frames = np.frombuffer(audio_buffer, dtype=np.float32)
|
|
|
|
| 24 |
def warmup(self, warmup_steps=1):
|
| 25 |
warmup_soundfile = f"{config.ASSERT_DIR}/jfk.flac"
|
| 26 |
for _ in range(warmup_steps):
|
| 27 |
+
self.model.generate(input=warmup_soundfile, disable_pbar=True)
|
| 28 |
|
| 29 |
def transcribe(self, audio_buffer: bytes, language):
|
| 30 |
audio_frames = np.frombuffer(audio_buffer, dtype=np.float32)
|
transcribe/pipelines/pipe_vad.py
CHANGED
|
@@ -33,12 +33,12 @@ class VadPipe(BasePipe):
|
|
| 33 |
def init(cls):
|
| 34 |
if cls.vac is None:
|
| 35 |
cls.vac = FixedVADIterator(
|
| 36 |
-
threshold=0.
|
| 37 |
sampling_rate=cls.sample_rate,
|
| 38 |
# speech_pad_ms=10
|
| 39 |
-
min_silence_duration_ms =
|
| 40 |
# speech_pad_ms = 30,
|
| 41 |
-
max_speech_duration_s=
|
| 42 |
)
|
| 43 |
cls.vac.reset_states()
|
| 44 |
|
|
|
|
| 33 |
def init(cls):
|
| 34 |
if cls.vac is None:
|
| 35 |
cls.vac = FixedVADIterator(
|
| 36 |
+
threshold=0.6,
|
| 37 |
sampling_rate=cls.sample_rate,
|
| 38 |
# speech_pad_ms=10
|
| 39 |
+
min_silence_duration_ms = 80,
|
| 40 |
# speech_pad_ms = 30,
|
| 41 |
+
max_speech_duration_s=25.0,
|
| 42 |
)
|
| 43 |
cls.vac.reset_states()
|
| 44 |
|