| cfg: | |
| sample_rate: 16000 | |
| train_ds: | |
| manifest_filepath: /content/datasets/ta/yaygomii/Tamil-Speech-Dialect-Corpus-Shuffled-Split/train/train_yaygomii_Tamil-Speech-Dialect-Corpus-Shuffled-Split_manifest_processed.json,/content/datasets/ta/yaygomii/Tamil-Speech-Dialect-Corpus-Shuffled-Split/valid/valid_yaygomii_Tamil-Speech-Dialect-Corpus-Shuffled-Split_manifest_processed.json | |
| sample_rate: 16000 | |
| batch_size: 16 | |
| trim_silence: true | |
| max_duration: 16.7 | |
| shuffle: true | |
| is_tarred: false | |
| tarred_audio_filepaths: null | |
| num_workers: 8 | |
| pin_memory: true | |
| use_start_end_token: true | |
| validation_ds: | |
| manifest_filepath: /content/datasets/ta/yaygomii/Tamil-Speech-Dialect-Corpus-Shuffled-Split/test/test_yaygomii_Tamil-Speech-Dialect-Corpus-Shuffled-Split_manifest_processed.json | |
| sample_rate: 16000 | |
| batch_size: 8 | |
| shuffle: false | |
| num_workers: 8 | |
| pin_memory: true | |
| use_start_end_token: true | |
| trim_silence: true | |
| test_ds: | |
| manifest_filepath: /content/datasets/ta/yaygomii/Tamil-Speech-Dialect-Corpus-Shuffled-Split/test/test_yaygomii_Tamil-Speech-Dialect-Corpus-Shuffled-Split_manifest_processed.json | |
| sample_rate: 16000 | |
| batch_size: 8 | |
| shuffle: false | |
| num_workers: 8 | |
| pin_memory: true | |
| use_start_end_token: true | |
| trim_silence: true | |
| model_defaults: | |
| repeat: 5 | |
| dropout: 0.0 | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| tokenizer: | |
| dir: tokenizers/ta/tokenizer_spe_bpe_v174/ | |
| type: bpe | |
| model_path: nemo:288fd8b4d3c64e75ac7a6b32b0f3586d_tokenizer.model | |
| vocab_path: nemo:6698e9428f25429e8ab2c5238438d52f_vocab.txt | |
| spe_tokenizer_vocab: nemo:344d9da9a52049caad7742ae1d994d19_tokenizer.vocab | |
| preprocessor: | |
| _target_: nemo.collections.asr.modules.AudioToMelSpectrogramPreprocessor | |
| sample_rate: 16000 | |
| normalize: per_feature | |
| window_size: 0.025 | |
| window_stride: 0.01 | |
| window: hann | |
| features: 80 | |
| n_fft: 512 | |
| frame_splicing: 1 | |
| dither: 1.0e-05 | |
| pad_to: 16 | |
| stft_conv: false | |
| spec_augment: | |
| _target_: nemo.collections.asr.modules.SpectrogramAugmentation | |
| freq_masks: 2 | |
| time_masks: 10 | |
| freq_width: 25 | |
| time_width: 0.05 | |
| encoder: | |
| _target_: nemo.collections.asr.modules.ConvASREncoder | |
| feat_in: 80 | |
| activation: relu | |
| conv_mask: true | |
| jasper: | |
| - filters: 512 | |
| repeat: 1 | |
| kernel: | |
| - 5 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: false | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 11 | |
| stride: | |
| - 2 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| stride_last: true | |
| residual_mode: stride_add | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 13 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 15 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 17 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 19 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 21 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 13 | |
| stride: | |
| - 2 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| stride_last: true | |
| residual_mode: stride_add | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 15 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 17 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 19 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 21 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 23 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 25 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 25 | |
| stride: | |
| - 2 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| stride_last: true | |
| residual_mode: stride_add | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 27 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 29 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 31 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 33 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 35 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 37 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 512 | |
| repeat: 5 | |
| kernel: | |
| - 39 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: true | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| - filters: 640 | |
| repeat: 1 | |
| kernel: | |
| - 41 | |
| stride: | |
| - 1 | |
| dilation: | |
| - 1 | |
| dropout: 0.0 | |
| residual: false | |
| separable: true | |
| se: true | |
| se_context_size: -1 | |
| decoder: | |
| _target_: nemo.collections.asr.modules.ConvASRDecoder | |
| feat_in: 640 | |
| num_classes: 174 | |
| vocabulary: | |
| - <unk> | |
| - ்க | |
| - ம் | |
| - ▁ப | |
| - க்க | |
| - ்த | |
| - ன் | |
| - ்ட | |
| - ▁வ | |
| - ங்க | |
| - ரு | |
| - ▁இ | |
| - ▁க | |
| - ▁அ | |
| - ▁எ | |
| - க்கு | |
| - ▁ச | |
| - ல் | |
| - ந்த | |
| - ட்ட | |
| - ப் | |
| - ▁ந | |
| - த்த | |
| - து | |
| - ப்ப | |
| - ▁ம | |
| - ல்ல | |
| - ▁த | |
| - ்ச | |
| - ன்ன | |
| - ▁இரு | |
| - டி | |
| - டு | |
| - ▁போ | |
| - ும் | |
| - ந்து | |
| - ட்டு | |
| - ான் | |
| - ாங்க | |
| - ச்ச | |
| - ிய | |
| - ண் | |
| - மா | |
| - த்து | |
| - ▁வந்து | |
| - ர் | |
| - ▁பா | |
| - ண்ண | |
| - ▁ஒ | |
| - ல்லா | |
| - ண்ட | |
| - ▁ஆ | |
| - ம்ப | |
| - ேன் | |
| - னு | |
| - க்கா | |
| - னா | |
| - ைய | |
| - ▁மா | |
| - ▁இருக்கு | |
| - ▁கொ | |
| - ஸ் | |
| - ரி | |
| - ▁என்ன | |
| - ▁சொ | |
| - ▁சா | |
| - ச்சு | |
| - ள் | |
| - ▁ர | |
| - ▁பண்ண | |
| - ோம் | |
| - லா | |
| - ▁அப்ப | |
| - ட் | |
| - ஞ்ச | |
| - ▁கா | |
| - யி | |
| - ய் | |
| - ▁எங்க | |
| - ▁ஏ | |
| - ▁நா | |
| - ▁ஒரு | |
| - ▁அவ | |
| - ீங்க | |
| - ியா | |
| - ▁அது | |
| - ▁எல்லா | |
| - ▁கு | |
| - தி | |
| - ▁இல்ல | |
| - ▁வெ | |
| - ▁வே | |
| - ▁தான் | |
| - யா | |
| - ▁பே | |
| - றது | |
| - ▁செ | |
| - ுக்கு | |
| - ▁இருக்க | |
| - ண்டு | |
| - ில | |
| - ▁பி | |
| - ▁ட | |
| - ிரு | |
| - ளா | |
| - ் | |
| - ▁ | |
| - ு | |
| - க | |
| - ா | |
| - த | |
| - ட | |
| - ப | |
| - ம | |
| - ி | |
| - ன | |
| - ர | |
| - ல | |
| - வ | |
| - ச | |
| - ந | |
| - ங | |
| - ய | |
| - ே | |
| - ோ | |
| - ண | |
| - இ | |
| - . | |
| - அ | |
| - எ | |
| - ள | |
| - ை | |
| - ெ | |
| - ற | |
| - ொ | |
| - ீ | |
| - ஸ | |
| - ூ | |
| - ஒ | |
| - ஆ | |
| - ழ | |
| - ஞ | |
| - ஏ | |
| - ஷ | |
| - ஜ | |
| - ',' | |
| - உ | |
| - ஊ | |
| - ஓ | |
| - ஃ | |
| - ஹ | |
| - ஐ | |
| - ௌ | |
| - ஈ | |
| - '!' | |
| - '5' | |
| - '2' | |
| - '0' | |
| - '1' | |
| - _ | |
| - '3' | |
| - '6' | |
| - ஂ | |
| - g | |
| - k | |
| - m | |
| - p | |
| - s | |
| - '௫' | |
| - '7' | |
| - '8' | |
| - '9' | |
| - t | |
| - '௯' | |
| optim: | |
| name: novograd | |
| lr: 0.025 | |
| betas: | |
| - 0.8 | |
| - 0.25 | |
| weight_decay: 0.001 | |
| sched: | |
| name: CosineAnnealing | |
| warmup_steps: null | |
| warmup_ratio: 0.1 | |
| min_lr: 1.0e-09 | |
| last_epoch: -1 | |
| target: nemo.collections.asr.models.ctc_bpe_models.EncDecCTCModelBPE | |
| nemo_version: 1.22.0 | |
| decoding: | |
| strategy: greedy | |
| preserve_alignments: null | |
| compute_timestamps: null | |
| word_seperator: ' ' | |
| ctc_timestamp_type: all | |
| batch_dim_index: 0 | |
| greedy: | |
| preserve_alignments: false | |
| compute_timestamps: false | |
| preserve_frame_confidence: false | |
| confidence_method_cfg: | |
| name: entropy | |
| entropy_type: tsallis | |
| alpha: 0.33 | |
| entropy_norm: exp | |
| temperature: DEPRECATED | |
| beam: | |
| beam_size: 4 | |
| search_type: default | |
| preserve_alignments: false | |
| compute_timestamps: false | |
| return_best_hypothesis: true | |
| beam_alpha: 1.0 | |
| beam_beta: 0.0 | |
| kenlm_path: null | |
| flashlight_cfg: | |
| lexicon_path: null | |
| boost_path: null | |
| beam_size_token: 16 | |
| beam_threshold: 20.0 | |
| unk_weight: -.inf | |
| sil_weight: 0.0 | |
| pyctcdecode_cfg: | |
| beam_prune_logp: -10.0 | |
| token_min_logp: -5.0 | |
| prune_history: false | |
| hotwords: null | |
| hotword_weight: 10.0 | |
| confidence_cfg: | |
| preserve_frame_confidence: false | |
| preserve_token_confidence: false | |
| preserve_word_confidence: false | |
| exclude_blank: true | |
| aggregation: min | |
| method_cfg: | |
| name: entropy | |
| entropy_type: tsallis | |
| alpha: 0.33 | |
| entropy_norm: exp | |
| temperature: DEPRECATED | |
| temperature: 1.0 | |