# Source page header (not part of the configuration):
#   TestPublicRepo / config.yaml
#   Andrewy's picture
#   Upload config.yaml with huggingface_hub
#   99d3566 verified
# Acoustic stage settings. Durations are in seconds, per the inline comments.
# NOTE(review): nesting was rebuilt from a copy whose indentation had been
# stripped. `${acoustic.labels}` (used by `splitter`) requires `labels` to be
# a child of `acoustic`; the other keys are assumed to be children as well.
acoustic:
  left_pad: 0.3  # in sec
  right_pad: 0.3  # in sec
  chunk_size: 0.3  # in sec
  state_size: 219729  # NOTE(review): unit/meaning not evident from this file
  frame_size: 0.03  # in sec
  bias: 0.39  # in sec
  sample_rate: 8000  # presumably Hz; confirm against the consumer
  # 34 symbols: the 33 lowercase Russian letters followed by a space.
  labels: ["а", "б", "в", "г", "д", "е", "ё", "ж", "з", "и", "й", "к", "л", "м", "н", "о", "п",
           "р", "с", "т", "у", "ф", "х", "ц", "ч", "ш", "щ", "ъ", "ы", "ь", "э", "ю", "я", " "]
# Phrase splitter settings. Durations are in seconds unless noted otherwise.
# NOTE(review): nesting was rebuilt from a copy whose indentation had been
# stripped; all keys below are assumed to be children of `splitter`.
splitter:
  # Interpolation reference to the acoustic label list; resolved by the config
  # loader (looks like OmegaConf-style `${...}` syntax; confirm).
  labels: ${acoustic.labels}
  speech_offset: 0.1  # in sec
  silence_duration_threshold: 0.6  # in sec
  # Unitless probability (not seconds), presumably in [0, 1].
  acoustic_silence_prob_threshold: 0.9
  min_acoustic_silence_frames: 3  # count of frames
  phrase_duration_threshold: 60.0  # in sec; split very long phrase by force
# Decoder settings.
# NOTE(review): nesting was rebuilt from a copy whose indentation had been
# stripped. Placing beam_width/alpha/beta/unigrams under `beam_search_params`
# is the most plausible reading; confirm against the consuming code.
decoder:
  decoding_strategy: "beam_search"  # greedy_search | beam_search
  # Presumably only consulted when decoding_strategy is "beam_search".
  beam_search_params:
    beam_width: 200
    alpha: 0.4
    beta: 0.9
    unigrams: null  # explicitly unset