# Acoustic model settings.
# NOTE(review): units are not stated in this file; the pad/chunk/frame values
# are presumably seconds and sample_rate presumably Hz — confirm against the
# code that consumes this section.
acoustic:
  left_pad: 0.3
  right_pad: 0.3
  chunk_size: 0.3
  state_size: 219729
  frame_size: 0.03
  bias: 0.39
  sample_rate: 8000
  # Output vocabulary: the 33 lowercase Cyrillic letters (а–я, including ё)
  # followed by the space character. Order is preserved exactly as authored.
  labels: ["а", "б", "в", "г", "д", "е", "ё", "ж", "з", "и", "й", "к", "л",
           "м", "н", "о", "п", "р", "с", "т", "у", "ф", "х", "ц", "ч", "ш",
           "щ", "ъ", "ы", "ь", "э", "ю", "я", " "]

# Phrase splitter settings.
# NOTE(review): threshold units (presumably seconds / probabilities / frame
# counts, going by the key names) are not stated here — confirm with the
# consumer.
splitter:
  # Reuses the acoustic label list via `${...}` interpolation, so the two
  # sections cannot drift apart. Presumably resolved by the config loader
  # (OmegaConf-style syntax) — the value is a plain string to a bare YAML parser.
  labels: ${acoustic.labels}
  speech_offset: 0.1
  silence_duration_threshold: 0.6
  acoustic_silence_prob_threshold: 0.9
  min_acoustic_silence_frames: 3
  # Written as `60.0` rather than `60.` — same float value, canonical form.
  phrase_duration_threshold: 60.0

# Decoder settings.
decoder:
  decoding_strategy: "beam_search"
  # Parameters that apply when decoding_strategy is "beam_search".
  beam_search_params:
    beam_width: 200
    alpha: 0.4
    beta: 0.9
    # NOTE(review): the original indentation was lost, so it is not certain
    # whether `unigrams` belongs here or directly under `decoder`. It is kept
    # with the preceding keys, matching the original order — verify against
    # the code that reads this section.
    unigrams: null