diff --git "a/exp/run.log" "b/exp/run.log" new file mode 100644--- /dev/null +++ "b/exp/run.log" @@ -0,0 +1,3376 @@ +2026-01-08 18:33:28 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:152 | === ESPnet3 run started: 2026-01-08T18:33:28.816246 === +2026-01-08 18:33:28 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:153 | Command: /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin/python run.py --train_config conf/train_asr_rnn_data_aug_debug.yaml --infer_config conf/infer.yaml --measure_config conf/measure.yaml +2026-01-08 18:33:28 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:156 | Working directory: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr +2026-01-08 18:33:28 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | train config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/train_asr_rnn_data_aug_debug.yaml +2026-01-08 18:33:28 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | infer config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/infer.yaml +2026-01-08 18:33:28 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | measure config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/measure.yaml +2026-01-08 18:34:35 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:167 | Git: commit=e649581628c3a7d875d2e1ee9c795b7595d4fcb7, short_commit=e649581628, branch=espnet3/integration_test, worktree=dirty +2026-01-08 18:34:35 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:250 | Cluster env: +(none) +2026-01-08 18:34:35 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:251 | Runtime env: +LD_LIBRARY_PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/usr/local/cuda-10.1/lib64 +PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/ffmpeg-release:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/festival/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/MBROLA/Bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/BeamformIt:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kenlm/build/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/PESQ/P862_annex_A_2005_CD/source:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/nkf/nkf-2.1.4:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/tokenizer:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/generic:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/tools/moses/scripts/recaser:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/training:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/mwerSegmenter:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sctk/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sph2pipe:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sentencepiece_commands:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/chainbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/featbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fstbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/gmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/ivectorbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/kwsbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/latbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/lmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet3bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnetbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/online2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/onlinebin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/rnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmm2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/tfrnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudadecoderbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudafeatbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin:/home/masao/.local/bin:/home/masao/utils:/home/masao/git/SCTK/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/usr/lib/wsl/lib:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/debugCommand:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/copilotCli:/mnt/c/Windows/system32:/mnt/c/Windows:/mnt/c/Windows/System32/Wbem:/mnt/c/Windows/System32/WindowsPowerShell/v1.0/:/mnt/c/Windows/System32/OpenSSH/:/mnt/c/Program Files (x86)/NVIDIA Corporation/PhysX/Common:/mnt/c/Program Files/NVIDIA Corporation/NVIDIA NvDLISR:/mnt/c/Program Files/dotnet/:/mnt/c/Program Files/Git/cmd:/mnt/c/Program Files/Tailscale/:/mnt/c/Users/might/AppData/Local/Microsoft/WindowsApps:/mnt/c/Users/might/AppData/Local/Programs/Microsoft VS Code/bin:/mnt/c/Users/might/AppData/Local/Muse Hub/lib:/mnt/c/Software/cmake-3.30.2-windows-x86_64/bin:/mnt/c/Software/flutter/bin:/mnt/c/Users/might/.vscode/extensions/ms-python.debugpy-2025.18.0-win32-x64/bundled/scripts/noConfigScripts:/snap/bin:/mnt/c/Software/flutter/bin +PYTHONPATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models:../../../:../../TEMPLATE/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models: +2026-01-08 18:34:35 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:140 | Train config content: +num_device: 1 +num_nodes: 1 +task: espnet3.systems.asr.task.ASRTask +recipe_dir: . +data_dir: ./data +exp_tag: train_asr_rnn_data_aug_debug +exp_dir: ./exp/train_asr_rnn_data_aug_debug +stats_dir: ./exp/stats +decode_dir: ./exp/train_asr_rnn_data_aug_debug/decode +dataset_dir: ./data/mini_an4 +create_dataset: + func: src.create_dataset.create_dataset + dataset_dir: ./data/mini_an4 + archive_path: ./../../egs2/mini_an4/asr1/downloads.tar.gz +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + train: + - name: train_nodev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv + valid: + - name: train_dev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_dev.tsv + preprocessor: + _target_: espnet2.train.preprocessor.CommonPreprocessor + fs: 16000 + data_aug_effects: + - - 0.1 + - contrast + - enhancement_amount: 75.0 + - - 0.1 + - highpass + - cutoff_freq: 5000 + Q: 0.707 + - - 0.1 + - equalization + - center_freq: 1000 + gain: 0 + Q: 0.707 + - - 0.1 + - - - 0.3 + - speed_perturb + - factor: 0.9 + - - 0.3 + - speed_perturb + - factor: 1.1 + - - 0.3 + - speed_perturb + - factor: 1.3 + data_aug_num: + - 1 + - 4 + data_aug_prob: 1.0 +parallel: + env: local + n_workers: 1 +dataloader: + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + train: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: true + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + num_workers: 0 + batches: + type: folded + shape_files: + - ./exp/stats/train/feats_shape + batch_size: 2 + batch_bins: 200000 + valid: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: false + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + batches: + type: folded + shape_files: + - ./exp/stats/valid/feats_shape + batch_size: 2 + batch_bins: 200000 +optim: + _target_: torch.optim.Adam + lr: 0.001 + weight_decay: 0.0 +scheduler: + _target_: torch.optim.lr_scheduler.ReduceLROnPlateau + mode: min + factor: 0.5 + patience: 1 +val_scheduler_criterion: +- valid +- loss +best_model_criterion: +- - valid/acc + - 1 + - max +trainer: + accelerator: auto + devices: 1 + num_nodes: 1 + accumulate_grad_batches: 1 + check_val_every_n_epoch: 1 + gradient_clip_val: 1.0 + log_every_n_steps: 1 + max_epochs: 1 + limit_train_batches: 1 + limit_val_batches: 1 + precision: 32 + logger: + - _target_: lightning.pytorch.loggers.TensorBoardLogger + save_dir: ./exp/train_asr_rnn_data_aug_debug/tensorboard + name: tb_logger + strategy: auto +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + text_builder: + func: src.tokenizer.gather_training_text + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv +model: + vocab_size: 30 + token_list: ./data/bpe_30/tokens.txt + encoder: vgg_rnn + encoder_conf: + num_layers: 1 + hidden_size: 2 + output_size: 2 + decoder: rnn + decoder_conf: + hidden_size: 2 + normalize: utterance_mvn + normalize_conf: {} + model_conf: + ctc_weight: 0.3 + lsm_weight: 0.1 + length_normalized_loss: false + frontend: default + frontend_conf: + n_fft: 512 + win_length: 400 + hop_length: 160 + +2026-01-08 18:34:35 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:144 | Infer config content: +num_device: 1 +num_nodes: 1 +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +parallel: + env: local + n_workers: 1 +model: + _target_: espnet2.bin.asr_inference.Speech2Text + asr_train_config: ./exp/mini_an4_asr_debug/config.yaml + asr_model_file: ./exp/mini_an4_asr_debug/last.ckpt + beam_size: 1 + ctc_weight: 0.3 +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + +2026-01-08 18:34:35 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:148 | Measure config content: +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +metrics: +- metric: + _target_: espnet3.systems.asr.metrics.wer.WER + clean_types: null +- metric: + _target_: espnet3.systems.asr.metrics.cer.CER + clean_types: null + +2026-01-08 18:34:35 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:49 | Initialized ASRSystem with train_config=True infer_config=True measure_config=True exp_dir=exp/train_asr_rnn_data_aug_debug +2026-01-08 18:34:35 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:165 | System: ASRSystem +2026-01-08 18:34:35 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:166 | Requested stages: ['all'] +2026-01-08 18:34:35 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:167 | Resolved stages: ['create_dataset', 'train_tokenizer', 'collect_stats', 'train', 'infer', 'measure', 'publish'] +2026-01-08 18:34:35 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: create_dataset === +2026-01-08 18:34:35 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:54 | ASRSystem.create_dataset(): starting dataset creation process +2026-01-08 18:34:35 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:63 | Creating dataset with function src.create_dataset.create_dataset +2026-01-08 18:34:36 | ERROR | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:70 | Stage 'create_dataset' failed after 0.63s +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py", line 61, in run_stages + fn() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py", line 64, in create_dataset + result = fn(**extra) + ^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/src/create_dataset.py", line 135, in create_dataset + raise RuntimeError("sph2pipe not found in PATH. Please install it.") +RuntimeError: sph2pipe not found in PATH. Please install it. +2026-01-08 18:36:19 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:152 | === ESPnet3 run started: 2026-01-08T18:36:19.909692 === +2026-01-08 18:36:19 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:153 | Command: /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin/python run.py --train_config conf/train_asr_rnn_data_aug_debug.yaml --infer_config conf/infer.yaml --measure_config conf/measure.yaml +2026-01-08 18:36:19 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:156 | Working directory: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr +2026-01-08 18:36:19 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | train config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/train_asr_rnn_data_aug_debug.yaml +2026-01-08 18:36:19 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | infer config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/infer.yaml +2026-01-08 18:36:19 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | measure config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/measure.yaml +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:167 | Git: commit=e649581628c3a7d875d2e1ee9c795b7595d4fcb7, short_commit=e649581628, branch=espnet3/integration_test, worktree=dirty +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:250 | Cluster env: +(none) +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:251 | Runtime env: +LD_LIBRARY_PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/usr/local/cuda-10.1/lib64 +PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/ffmpeg-release:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/festival/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/MBROLA/Bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/BeamformIt:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kenlm/build/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/PESQ/P862_annex_A_2005_CD/source:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/nkf/nkf-2.1.4:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/tokenizer:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/generic:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/tools/moses/scripts/recaser:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/training:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/mwerSegmenter:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sctk/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sph2pipe:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sentencepiece_commands:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/chainbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/featbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fstbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/gmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/ivectorbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/kwsbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/latbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/lmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet3bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnetbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/online2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/onlinebin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/rnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmm2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/tfrnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudadecoderbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudafeatbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin:/home/masao/.local/bin:/home/masao/utils:/home/masao/git/SCTK/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/usr/lib/wsl/lib:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/debugCommand:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/copilotCli:/mnt/c/Windows/system32:/mnt/c/Windows:/mnt/c/Windows/System32/Wbem:/mnt/c/Windows/System32/WindowsPowerShell/v1.0/:/mnt/c/Windows/System32/OpenSSH/:/mnt/c/Program Files (x86)/NVIDIA Corporation/PhysX/Common:/mnt/c/Program Files/NVIDIA Corporation/NVIDIA NvDLISR:/mnt/c/Program Files/dotnet/:/mnt/c/Program Files/Git/cmd:/mnt/c/Program Files/Tailscale/:/mnt/c/Users/might/AppData/Local/Microsoft/WindowsApps:/mnt/c/Users/might/AppData/Local/Programs/Microsoft VS Code/bin:/mnt/c/Users/might/AppData/Local/Muse Hub/lib:/mnt/c/Software/cmake-3.30.2-windows-x86_64/bin:/mnt/c/Software/flutter/bin:/mnt/c/Users/might/.vscode/extensions/ms-python.debugpy-2025.18.0-win32-x64/bundled/scripts/noConfigScripts:/snap/bin:/mnt/c/Software/flutter/bin +PYTHONPATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models:../../../:../../TEMPLATE/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models: +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:140 | Train config content: +num_device: 1 +num_nodes: 1 +task: espnet3.systems.asr.task.ASRTask +recipe_dir: . +data_dir: ./data +exp_tag: train_asr_rnn_data_aug_debug +exp_dir: ./exp/train_asr_rnn_data_aug_debug +stats_dir: ./exp/stats +decode_dir: ./exp/train_asr_rnn_data_aug_debug/decode +dataset_dir: ./data/mini_an4 +create_dataset: + func: src.create_dataset.create_dataset + dataset_dir: ./data/mini_an4 + archive_path: ./../../egs2/mini_an4/asr1/downloads.tar.gz +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + train: + - name: train_nodev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv + valid: + - name: train_dev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_dev.tsv + preprocessor: + _target_: espnet2.train.preprocessor.CommonPreprocessor + fs: 16000 + data_aug_effects: + - - 0.1 + - contrast + - enhancement_amount: 75.0 + - - 0.1 + - highpass + - cutoff_freq: 5000 + Q: 0.707 + - - 0.1 + - equalization + - center_freq: 1000 + gain: 0 + Q: 0.707 + - - 0.1 + - - - 0.3 + - speed_perturb + - factor: 0.9 + - - 0.3 + - speed_perturb + - factor: 1.1 + - - 0.3 + - speed_perturb + - factor: 1.3 + data_aug_num: + - 1 + - 4 + data_aug_prob: 1.0 +parallel: + env: local + n_workers: 1 +dataloader: + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + train: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: true + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + num_workers: 0 + batches: + type: folded + shape_files: + - ./exp/stats/train/feats_shape + batch_size: 2 + batch_bins: 200000 + valid: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: false + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + batches: + type: folded + shape_files: + - ./exp/stats/valid/feats_shape + batch_size: 2 + batch_bins: 200000 +optim: + _target_: torch.optim.Adam + lr: 0.001 + weight_decay: 0.0 +scheduler: + _target_: torch.optim.lr_scheduler.ReduceLROnPlateau + mode: min + factor: 0.5 + patience: 1 +val_scheduler_criterion: +- valid +- loss +best_model_criterion: +- - valid/acc + - 1 + - max +trainer: + accelerator: auto + devices: 1 + num_nodes: 1 + accumulate_grad_batches: 1 + check_val_every_n_epoch: 1 + gradient_clip_val: 1.0 + log_every_n_steps: 1 + max_epochs: 1 + limit_train_batches: 1 + limit_val_batches: 1 + precision: 32 + logger: + - _target_: lightning.pytorch.loggers.TensorBoardLogger + save_dir: ./exp/train_asr_rnn_data_aug_debug/tensorboard + name: tb_logger + strategy: auto +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + text_builder: + func: src.tokenizer.gather_training_text + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv +model: + vocab_size: 30 + token_list: ./data/bpe_30/tokens.txt + encoder: vgg_rnn + encoder_conf: + num_layers: 1 + hidden_size: 2 + output_size: 2 + decoder: rnn + decoder_conf: + hidden_size: 2 + normalize: utterance_mvn + normalize_conf: {} + model_conf: + ctc_weight: 0.3 + lsm_weight: 0.1 + length_normalized_loss: false + frontend: default + frontend_conf: + n_fft: 512 + win_length: 400 + hop_length: 160 + +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:144 | Infer config content: +num_device: 1 +num_nodes: 1 +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +parallel: + env: local + n_workers: 1 +model: + _target_: espnet2.bin.asr_inference.Speech2Text + asr_train_config: ./exp/mini_an4_asr_debug/config.yaml + asr_model_file: ./exp/mini_an4_asr_debug/last.ckpt + beam_size: 1 + ctc_weight: 0.3 +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:148 | Measure config content: +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +metrics: +- metric: + _target_: espnet3.systems.asr.metrics.wer.WER + clean_types: null +- metric: + _target_: espnet3.systems.asr.metrics.cer.CER + clean_types: null + +2026-01-08 18:36:32 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:49 | Initialized ASRSystem with train_config=True infer_config=True measure_config=True exp_dir=exp/train_asr_rnn_data_aug_debug +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:165 | System: ASRSystem +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:166 | Requested stages: ['all'] +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:167 | Resolved stages: ['create_dataset', 'train_tokenizer', 'collect_stats', 'train', 'infer', 'measure', 'publish'] +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: create_dataset === +2026-01-08 18:36:32 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:54 | ASRSystem.create_dataset(): starting dataset creation process +2026-01-08 18:36:32 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:63 | Creating dataset with function src.create_dataset.create_dataset +2026-01-08 18:36:32 | INFO | src.create_dataset | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/src/create_dataset.py:148 | Prepared Mini AN4 manifests under data/mini_an4/manifest +2026-01-08 18:36:32 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:65 | Dataset creation completed in 0.43s using src.create_dataset.create_dataset +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: create_dataset (0.43s) === +2026-01-08 18:36:32 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: train_tokenizer === +2026-01-08 18:36:32 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:131 | Building tokenizer training text via src.tokenizer.gather_training_text +2026-01-08 18:36:32 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:151 | Collected 4 transcript lines for tokenizer training +2026-01-08 18:36:32 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:155 | Training tokenizer: bpe +2026-01-08 18:36:32 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:156 | Tokenizer output: ./data/bpe_30 +2026-01-08 18:36:33 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:165 | Tokenizer training completed in 0.09s +2026-01-08 18:36:33 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: train_tokenizer (0.09s) === +2026-01-08 18:36:33 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: collect_stats === +2026-01-08 18:36:33 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:79 | Collecting stats | exp_dir=./exp/train_asr_rnn_data_aug_debug stats_dir=./exp/stats +2026-01-08 18:36:41 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 18:36:41 | INFO | espnet3.systems.base.train | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py:33 | Model: +ESPnetASRModel( + (frontend): DefaultFrontend( + (stft): Stft(n_fft=512, win_length=400, hop_length=160, center=True, normalized=False, onesided=True) + (frontend): Frontend() + (logmel): LogMel(sr=16000, n_fft=512, n_mels=80, fmin=0, fmax=8000.0, htk=False) + ) + (normalize): UtteranceMVN(norm_means=True, norm_vars=False) + (encoder): VGGRNNEncoder( + (enc): ModuleList( + (0): VGG2L( + (conv1_1): Conv2d(1, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv1_2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_1): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (1): RNNP( + (birnn0): LSTM(2560, 2, batch_first=True, bidirectional=True) + (bt0): Linear(in_features=4, out_features=2, bias=True) + ) + ) + ) + (decoder): RNNDecoder( + (embed): Embedding(30, 2) + (dropout_emb): Dropout(p=0.0, inplace=False) + (decoder): ModuleList( + (0): LSTMCell(4, 2) + ) + (dropout_dec): ModuleList( + (0): Dropout(p=0.0, inplace=False) + ) + (output): Linear(in_features=2, out_features=30, bias=True) + (att_list): ModuleList( + (0): AttLoc( + (mlp_enc): Linear(in_features=2, out_features=320, bias=True) + (mlp_dec): Linear(in_features=2, out_features=320, bias=False) + (mlp_att): Linear(in_features=10, out_features=320, bias=False) + (loc_conv): Conv2d(1, 10, kernel_size=(1, 201), stride=(1, 1), padding=(0, 100), bias=False) + (gvec): Linear(in_features=320, out_features=1, bias=True) + ) + ) + ) + (criterion_att): LabelSmoothingLoss( + (criterion): KLDivLoss() + ) + (ctc): CTC( + (ctc_lo): Linear(in_features=2, out_features=30, bias=True) + (ctc_loss): CTCLoss() + ) +) +2026-01-08 18:36:41 | ERROR | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:70 | Stage 'collect_stats' failed after 8.38s +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 92, in _call_target + return _target_(*args, **kwargs) + ^^^^^^^^^^^^^^^^^^^^^^^^^ +TypeError: CommonPreprocessor.__init__() missing 1 required positional argument: 'train' + +The above exception was the direct cause of the following exception: + +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py", line 61, in run_stages + fn() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py", line 84, in collect_stats + return collect_stats(self.train_config) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 68, in collect_stats + trainer = _build_trainer(cfg) + ^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 34, in _build_trainer + lit_model = LitESPnetModel(model, cfg) + ^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/modeling/model.py", line 47, in __init__ + data_organizer = instantiate(config.dataset) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 226, in instantiate + return instantiate_node( + ^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 342, in instantiate_node + value = instantiate_node( + ^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 347, in instantiate_node + return _call_target(_target_, partial, args, kwargs, full_key) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 97, in _call_target + raise InstantiationException(msg) from e +hydra.errors.InstantiationException: Error in call to target 'espnet2.train.preprocessor.CommonPreprocessor': +TypeError("CommonPreprocessor.__init__() missing 1 required positional argument: 'train'") +full_key: dataset.preprocessor +2026-01-08 18:38:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:152 | === ESPnet3 run started: 2026-01-08T18:38:37.023878 === +2026-01-08 18:38:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:153 | Command: /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin/python run.py --train_config conf/train_asr_rnn_data_aug_debug.yaml --infer_config conf/infer.yaml --measure_config conf/measure.yaml +2026-01-08 18:38:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:156 | Working directory: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr +2026-01-08 18:38:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | train config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/train_asr_rnn_data_aug_debug.yaml +2026-01-08 18:38:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | infer config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/infer.yaml +2026-01-08 18:38:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | measure config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/measure.yaml +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:167 | Git: commit=e649581628c3a7d875d2e1ee9c795b7595d4fcb7, short_commit=e649581628, branch=espnet3/integration_test, worktree=dirty +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:250 | Cluster env: +(none) +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:251 | Runtime env: +LD_LIBRARY_PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/usr/local/cuda-10.1/lib64 +PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/ffmpeg-release:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/festival/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/MBROLA/Bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/BeamformIt:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kenlm/build/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/PESQ/P862_annex_A_2005_CD/source:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/nkf/nkf-2.1.4:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/tokenizer:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/generic:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/tools/moses/scripts/recaser:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/training:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/mwerSegmenter:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sctk/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sph2pipe:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sentencepiece_commands:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/chainbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/featbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fstbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/gmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/ivectorbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/kwsbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/latbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/lmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet3bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnetbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/online2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/onlinebin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/rnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmm2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/tfrnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudadecoderbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudafeatbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin:/home/masao/.local/bin:/home/masao/utils:/home/masao/git/SCTK/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/usr/lib/wsl/lib:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/debugCommand:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/copilotCli:/mnt/c/Windows/system32:/mnt/c/Windows:/mnt/c/Windows/System32/Wbem:/mnt/c/Windows/System32/WindowsPowerShell/v1.0/:/mnt/c/Windows/System32/OpenSSH/:/mnt/c/Program Files (x86)/NVIDIA Corporation/PhysX/Common:/mnt/c/Program Files/NVIDIA Corporation/NVIDIA NvDLISR:/mnt/c/Program Files/dotnet/:/mnt/c/Program Files/Git/cmd:/mnt/c/Program Files/Tailscale/:/mnt/c/Users/might/AppData/Local/Microsoft/WindowsApps:/mnt/c/Users/might/AppData/Local/Programs/Microsoft VS Code/bin:/mnt/c/Users/might/AppData/Local/Muse Hub/lib:/mnt/c/Software/cmake-3.30.2-windows-x86_64/bin:/mnt/c/Software/flutter/bin:/mnt/c/Users/might/.vscode/extensions/ms-python.debugpy-2025.18.0-win32-x64/bundled/scripts/noConfigScripts:/snap/bin:/mnt/c/Software/flutter/bin +PYTHONPATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models:../../../:../../TEMPLATE/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr: +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:140 | Train config content: +num_device: 1 +num_nodes: 1 +task: espnet3.systems.asr.task.ASRTask +recipe_dir: . +data_dir: ./data +exp_tag: train_asr_rnn_data_aug_debug +exp_dir: ./exp/train_asr_rnn_data_aug_debug +stats_dir: ./exp/stats +decode_dir: ./exp/train_asr_rnn_data_aug_debug/decode +dataset_dir: ./data/mini_an4 +create_dataset: + func: src.create_dataset.create_dataset + dataset_dir: ./data/mini_an4 + archive_path: ./../../egs2/mini_an4/asr1/downloads.tar.gz +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + train: + - name: train_nodev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv + valid: + - name: train_dev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_dev.tsv + preprocessor: + _target_: espnet2.train.preprocessor.CommonPreprocessor + fs: 16000 + train: true + data_aug_effects: + - - 0.1 + - contrast + - enhancement_amount: 75.0 + - - 0.1 + - highpass + - cutoff_freq: 5000 + Q: 0.707 + - - 0.1 + - equalization + - center_freq: 1000 + gain: 0 + Q: 0.707 + - - 0.1 + - - - 0.3 + - speed_perturb + - factor: 0.9 + - - 0.3 + - speed_perturb + - factor: 1.1 + - - 0.3 + - speed_perturb + - factor: 1.3 + data_aug_num: + - 1 + - 4 + data_aug_prob: 1.0 +parallel: + env: local + n_workers: 1 +dataloader: + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + train: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: true + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + num_workers: 0 + batches: + type: folded + shape_files: + - ./exp/stats/train/feats_shape + batch_size: 2 + batch_bins: 200000 + valid: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: false + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + batches: + type: folded + shape_files: + - ./exp/stats/valid/feats_shape + batch_size: 2 + batch_bins: 200000 +optim: + _target_: torch.optim.Adam + lr: 0.001 + weight_decay: 0.0 +scheduler: + _target_: torch.optim.lr_scheduler.ReduceLROnPlateau + mode: min + factor: 0.5 + patience: 1 +val_scheduler_criterion: +- valid +- loss +best_model_criterion: +- - valid/acc + - 1 + - max +trainer: + accelerator: auto + devices: 1 + num_nodes: 1 + accumulate_grad_batches: 1 + check_val_every_n_epoch: 1 + gradient_clip_val: 1.0 + log_every_n_steps: 1 + max_epochs: 1 + limit_train_batches: 1 + limit_val_batches: 1 + precision: 32 + logger: + - _target_: lightning.pytorch.loggers.TensorBoardLogger + save_dir: ./exp/train_asr_rnn_data_aug_debug/tensorboard + name: tb_logger + strategy: auto +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + text_builder: + func: src.tokenizer.gather_training_text + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv +model: + vocab_size: 30 + token_list: ./data/bpe_30/tokens.txt + encoder: vgg_rnn + encoder_conf: + num_layers: 1 + hidden_size: 2 + output_size: 2 + decoder: rnn + decoder_conf: + hidden_size: 2 + normalize: utterance_mvn + normalize_conf: {} + model_conf: + ctc_weight: 0.3 + lsm_weight: 0.1 + length_normalized_loss: false + frontend: default + frontend_conf: + n_fft: 512 + win_length: 400 + hop_length: 160 + +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:144 | Infer config content: +num_device: 1 +num_nodes: 1 +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +parallel: + env: local + n_workers: 1 +model: + _target_: espnet2.bin.asr_inference.Speech2Text + asr_train_config: ./exp/mini_an4_asr_debug/config.yaml + asr_model_file: ./exp/mini_an4_asr_debug/last.ckpt + beam_size: 1 + ctc_weight: 0.3 +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:148 | Measure config content: +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +metrics: +- metric: + _target_: espnet3.systems.asr.metrics.wer.WER + clean_types: null +- metric: + _target_: espnet3.systems.asr.metrics.cer.CER + clean_types: null + +2026-01-08 18:38:49 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:49 | Initialized ASRSystem with train_config=True infer_config=True measure_config=True exp_dir=exp/train_asr_rnn_data_aug_debug +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:165 | System: ASRSystem +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:166 | Requested stages: ['all'] +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:167 | Resolved stages: ['create_dataset', 'train_tokenizer', 'collect_stats', 'train', 'infer', 'measure', 'publish'] +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: create_dataset === +2026-01-08 18:38:49 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:54 | ASRSystem.create_dataset(): starting dataset creation process +2026-01-08 18:38:49 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:63 | Creating dataset with function src.create_dataset.create_dataset +2026-01-08 18:38:49 | INFO | src.create_dataset | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/src/create_dataset.py:148 | Prepared Mini AN4 manifests under data/mini_an4/manifest +2026-01-08 18:38:49 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:65 | Dataset creation completed in 0.21s using src.create_dataset.create_dataset +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: create_dataset (0.22s) === +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: train_tokenizer === +2026-01-08 18:38:49 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:115 | Tokenizer already exists. Skipping train_tokenizer(). +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: train_tokenizer (0.01s) === +2026-01-08 18:38:49 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: collect_stats === +2026-01-08 18:38:49 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:79 | Collecting stats | exp_dir=./exp/train_asr_rnn_data_aug_debug stats_dir=./exp/stats +2026-01-08 18:38:57 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 18:38:58 | INFO | espnet3.systems.base.train | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py:33 | Model: +ESPnetASRModel( + (frontend): DefaultFrontend( + (stft): Stft(n_fft=512, win_length=400, hop_length=160, center=True, normalized=False, onesided=True) + (frontend): Frontend() + (logmel): LogMel(sr=16000, n_fft=512, n_mels=80, fmin=0, fmax=8000.0, htk=False) + ) + (normalize): UtteranceMVN(norm_means=True, norm_vars=False) + (encoder): VGGRNNEncoder( + (enc): ModuleList( + (0): VGG2L( + (conv1_1): Conv2d(1, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv1_2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_1): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (1): RNNP( + (birnn0): LSTM(2560, 2, batch_first=True, bidirectional=True) + (bt0): Linear(in_features=4, out_features=2, bias=True) + ) + ) + ) + (decoder): RNNDecoder( + (embed): Embedding(30, 2) + (dropout_emb): Dropout(p=0.0, inplace=False) + (decoder): ModuleList( + (0): LSTMCell(4, 2) + ) + (dropout_dec): ModuleList( + (0): Dropout(p=0.0, inplace=False) + ) + (output): Linear(in_features=2, out_features=30, bias=True) + (att_list): ModuleList( + (0): AttLoc( + (mlp_enc): Linear(in_features=2, out_features=320, bias=True) + (mlp_dec): Linear(in_features=2, out_features=320, bias=False) + (mlp_att): Linear(in_features=10, out_features=320, bias=False) + (loc_conv): Conv2d(1, 10, kernel_size=(1, 201), stride=(1, 1), padding=(0, 100), bias=False) + (gvec): Linear(in_features=320, out_features=1, bias=True) + ) + ) + ) + (criterion_att): LabelSmoothingLoss( + (criterion): KLDivLoss() + ) + (ctc): CTC( + (ctc_lo): Linear(in_features=2, out_features=30, bias=True) + (ctc_loss): CTCLoss() + ) +) +2026-01-08 18:38:58 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:155 | GPU available: True (cuda), used: True +2026-01-08 18:38:58 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:158 | TPU available: False, using: 0 TPU cores +2026-01-08 18:38:58 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_train_batches=1)` was configured so 1 batch per epoch will be used. +2026-01-08 18:38:58 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_val_batches=1)` was configured so 1 batch will be used. +2026-01-08 18:38:58 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 18:38:59 | ERROR | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:70 | Stage 'collect_stats' failed after 9.63s +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py", line 61, in run_stages + fn() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py", line 84, in collect_stats + return collect_stats(self.train_config) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 69, in collect_stats + trainer.collect_stats() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/training/trainer.py", line 205, in collect_stats + return self.model.collect_stats(*args, **kwargs) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/modeling/model.py", line 438, in collect_stats + collect_stats( + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 512, in collect_stats + sum_dict, sq_dict, count_dict = _collect_stats_common( + ^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 375, in _collect_stats_common + results = runner(index_batches) + ^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 340, in __call__ + return self._run_local(indices) + ^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 209, in _run_local + return [f(i, **env) for i in tqdm(indices, total=len(indices))] + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 209, in + return [f(i, **env) for i in tqdm(indices, total=len(indices))] + ^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 328, in forward + return batch_collect_stats( + ^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 44, in batch_collect_stats + item = dataset[i] + ~~~~~~~^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/dataset.py", line 151, in __getitem__ + transformed = self.transforms[i][1](str(idx), transformed) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/train/preprocessor.py", line 547, in __call__ + data = self._speech_process(data) + ^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/train/preprocessor.py", line 451, in _speech_process + data[self.speech_name] = self.data_aug( + ^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/layers/augmentation.py", line 99, in __call__ + print(effect) + +IndexError: list index out of range +2026-01-08 18:40:16 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:152 | === ESPnet3 run started: 2026-01-08T18:40:16.707156 === +2026-01-08 18:40:16 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:153 | Command: /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin/python run.py --train_config conf/train_asr_rnn_data_aug_debug.yaml --infer_config conf/infer.yaml --measure_config conf/measure.yaml +2026-01-08 18:40:16 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:156 | Working directory: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr +2026-01-08 18:40:16 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | train config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/train_asr_rnn_data_aug_debug.yaml +2026-01-08 18:40:16 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | infer config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/infer.yaml +2026-01-08 18:40:16 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | measure config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/measure.yaml +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:167 | Git: commit=e649581628c3a7d875d2e1ee9c795b7595d4fcb7, short_commit=e649581628, branch=espnet3/integration_test, worktree=dirty +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:250 | Cluster env: +(none) +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:251 | Runtime env: +LD_LIBRARY_PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/usr/local/cuda-10.1/lib64 +PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/ffmpeg-release:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/festival/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/MBROLA/Bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/BeamformIt:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kenlm/build/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/PESQ/P862_annex_A_2005_CD/source:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/nkf/nkf-2.1.4:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/tokenizer:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/generic:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/tools/moses/scripts/recaser:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/training:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/mwerSegmenter:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sctk/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sph2pipe:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sentencepiece_commands:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/chainbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/featbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fstbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/gmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/ivectorbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/kwsbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/latbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/lmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet3bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnetbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/online2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/onlinebin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/rnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmm2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/tfrnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudadecoderbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudafeatbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin:/home/masao/.local/bin:/home/masao/utils:/home/masao/git/SCTK/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/usr/lib/wsl/lib:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/debugCommand:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/copilotCli:/mnt/c/Windows/system32:/mnt/c/Windows:/mnt/c/Windows/System32/Wbem:/mnt/c/Windows/System32/WindowsPowerShell/v1.0/:/mnt/c/Windows/System32/OpenSSH/:/mnt/c/Program Files (x86)/NVIDIA Corporation/PhysX/Common:/mnt/c/Program Files/NVIDIA Corporation/NVIDIA NvDLISR:/mnt/c/Program Files/dotnet/:/mnt/c/Program Files/Git/cmd:/mnt/c/Program Files/Tailscale/:/mnt/c/Users/might/AppData/Local/Microsoft/WindowsApps:/mnt/c/Users/might/AppData/Local/Programs/Microsoft VS Code/bin:/mnt/c/Users/might/AppData/Local/Muse Hub/lib:/mnt/c/Software/cmake-3.30.2-windows-x86_64/bin:/mnt/c/Software/flutter/bin:/mnt/c/Users/might/.vscode/extensions/ms-python.debugpy-2025.18.0-win32-x64/bundled/scripts/noConfigScripts:/snap/bin:/mnt/c/Software/flutter/bin +PYTHONPATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models:../../../:../../TEMPLATE/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr: +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:140 | Train config content: +num_device: 1 +num_nodes: 1 +task: espnet3.systems.asr.task.ASRTask +recipe_dir: . +data_dir: ./data +exp_tag: train_asr_rnn_data_aug_debug +exp_dir: ./exp/train_asr_rnn_data_aug_debug +stats_dir: ./exp/stats +decode_dir: ./exp/train_asr_rnn_data_aug_debug/decode +dataset_dir: ./data/mini_an4 +create_dataset: + func: src.create_dataset.create_dataset + dataset_dir: ./data/mini_an4 + archive_path: ./../../egs2/mini_an4/asr1/downloads.tar.gz +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + train: + - name: train_nodev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv + valid: + - name: train_dev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_dev.tsv + preprocessor: + _target_: espnet2.train.preprocessor.CommonPreprocessor + fs: 16000 + train: true + data_aug_effects: + - - 0.1 + - contrast + - enhancement_amount: 75.0 + - - 0.1 + - highpass + - cutoff_freq: 5000 + Q: 0.707 + - - 0.1 + - equalization + - center_freq: 1000 + gain: 0 + Q: 0.707 + - - 0.1 + - - - 0.3 + - speed_perturb + - factor: 0.9 + - - 0.3 + - speed_perturb + - factor: 1.1 + - - 0.3 + - speed_perturb + - factor: 1.3 + data_aug_num: + - 1 + - 4 + data_aug_prob: 1.0 +parallel: + env: local + n_workers: 1 +dataloader: + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + train: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: true + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + num_workers: 0 + batches: + type: folded + shape_files: + - ./exp/stats/train/feats_shape + batch_size: 2 + batch_bins: 200000 + valid: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: false + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + batches: + type: folded + shape_files: + - ./exp/stats/valid/feats_shape + batch_size: 2 + batch_bins: 200000 +optim: + _target_: torch.optim.Adam + lr: 0.001 + weight_decay: 0.0 +scheduler: + _target_: torch.optim.lr_scheduler.ReduceLROnPlateau + mode: min + factor: 0.5 + patience: 1 +val_scheduler_criterion: +- valid +- loss +best_model_criterion: +- - valid/acc + - 1 + - max +trainer: + accelerator: auto + devices: 1 + num_nodes: 1 + accumulate_grad_batches: 1 + check_val_every_n_epoch: 1 + gradient_clip_val: 1.0 + log_every_n_steps: 1 + max_epochs: 1 + limit_train_batches: 1 + limit_val_batches: 1 + precision: 32 + logger: + - _target_: lightning.pytorch.loggers.TensorBoardLogger + save_dir: ./exp/train_asr_rnn_data_aug_debug/tensorboard + name: tb_logger + strategy: auto +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + text_builder: + func: src.tokenizer.gather_training_text + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv +model: + vocab_size: 30 + token_list: ./data/bpe_30/tokens.txt + encoder: vgg_rnn + encoder_conf: + num_layers: 1 + hidden_size: 2 + output_size: 2 + decoder: rnn + decoder_conf: + hidden_size: 2 + normalize: utterance_mvn + normalize_conf: {} + model_conf: + ctc_weight: 0.3 + lsm_weight: 0.1 + length_normalized_loss: false + frontend: default + frontend_conf: + n_fft: 512 + win_length: 400 + hop_length: 160 + +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:144 | Infer config content: +num_device: 1 +num_nodes: 1 +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +parallel: + env: local + n_workers: 1 +model: + _target_: espnet2.bin.asr_inference.Speech2Text + asr_train_config: ./exp/mini_an4_asr_debug/config.yaml + asr_model_file: ./exp/mini_an4_asr_debug/last.ckpt + beam_size: 1 + ctc_weight: 0.3 +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:148 | Measure config content: +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +metrics: +- metric: + _target_: espnet3.systems.asr.metrics.wer.WER + clean_types: null +- metric: + _target_: espnet3.systems.asr.metrics.cer.CER + clean_types: null + +2026-01-08 18:40:29 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:49 | Initialized ASRSystem with train_config=True infer_config=True measure_config=True exp_dir=exp/train_asr_rnn_data_aug_debug +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:165 | System: ASRSystem +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:166 | Requested stages: ['all'] +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:167 | Resolved stages: ['create_dataset', 'train_tokenizer', 'collect_stats', 'train', 'infer', 'measure', 'publish'] +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: create_dataset === +2026-01-08 18:40:29 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:54 | ASRSystem.create_dataset(): starting dataset creation process +2026-01-08 18:40:29 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:63 | Creating dataset with function src.create_dataset.create_dataset +2026-01-08 18:40:29 | INFO | src.create_dataset | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/src/create_dataset.py:148 | Prepared Mini AN4 manifests under data/mini_an4/manifest +2026-01-08 18:40:29 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:65 | Dataset creation completed in 0.20s using src.create_dataset.create_dataset +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: create_dataset (0.20s) === +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: train_tokenizer === +2026-01-08 18:40:29 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:115 | Tokenizer already exists. Skipping train_tokenizer(). +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: train_tokenizer (0.00s) === +2026-01-08 18:40:29 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: collect_stats === +2026-01-08 18:40:29 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:79 | Collecting stats | exp_dir=./exp/train_asr_rnn_data_aug_debug stats_dir=./exp/stats +2026-01-08 18:40:37 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 18:40:37 | INFO | espnet3.systems.base.train | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py:33 | Model: +ESPnetASRModel( + (frontend): DefaultFrontend( + (stft): Stft(n_fft=512, win_length=400, hop_length=160, center=True, normalized=False, onesided=True) + (frontend): Frontend() + (logmel): LogMel(sr=16000, n_fft=512, n_mels=80, fmin=0, fmax=8000.0, htk=False) + ) + (normalize): UtteranceMVN(norm_means=True, norm_vars=False) + (encoder): VGGRNNEncoder( + (enc): ModuleList( + (0): VGG2L( + (conv1_1): Conv2d(1, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv1_2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_1): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (1): RNNP( + (birnn0): LSTM(2560, 2, batch_first=True, bidirectional=True) + (bt0): Linear(in_features=4, out_features=2, bias=True) + ) + ) + ) + (decoder): RNNDecoder( + (embed): Embedding(30, 2) + (dropout_emb): Dropout(p=0.0, inplace=False) + (decoder): ModuleList( + (0): LSTMCell(4, 2) + ) + (dropout_dec): ModuleList( + (0): Dropout(p=0.0, inplace=False) + ) + (output): Linear(in_features=2, out_features=30, bias=True) + (att_list): ModuleList( + (0): AttLoc( + (mlp_enc): Linear(in_features=2, out_features=320, bias=True) + (mlp_dec): Linear(in_features=2, out_features=320, bias=False) + (mlp_att): Linear(in_features=10, out_features=320, bias=False) + (loc_conv): Conv2d(1, 10, kernel_size=(1, 201), stride=(1, 1), padding=(0, 100), bias=False) + (gvec): Linear(in_features=320, out_features=1, bias=True) + ) + ) + ) + (criterion_att): LabelSmoothingLoss( + (criterion): KLDivLoss() + ) + (ctc): CTC( + (ctc_lo): Linear(in_features=2, out_features=30, bias=True) + (ctc_loss): CTCLoss() + ) +) +2026-01-08 18:40:37 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:155 | GPU available: True (cuda), used: True +2026-01-08 18:40:37 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:158 | TPU available: False, using: 0 TPU cores +2026-01-08 18:40:37 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_train_batches=1)` was configured so 1 batch per epoch will be used. +2026-01-08 18:40:37 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_val_batches=1)` was configured so 1 batch will be used. +2026-01-08 18:40:38 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 18:40:38 | ERROR | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:70 | Stage 'collect_stats' failed after 9.00s +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py", line 61, in run_stages + fn() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py", line 84, in collect_stats + return collect_stats(self.train_config) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 69, in collect_stats + trainer.collect_stats() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/training/trainer.py", line 205, in collect_stats + return self.model.collect_stats(*args, **kwargs) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/modeling/model.py", line 438, in collect_stats + collect_stats( + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 512, in collect_stats + sum_dict, sq_dict, count_dict = _collect_stats_common( + ^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 375, in _collect_stats_common + results = runner(index_batches) + ^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 340, in __call__ + return self._run_local(indices) + ^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 209, in _run_local + return [f(i, **env) for i in tqdm(indices, total=len(indices))] + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 209, in + return [f(i, **env) for i in tqdm(indices, total=len(indices))] + ^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 328, in forward + return batch_collect_stats( + ^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 44, in batch_collect_stats + item = dataset[i] + ~~~~~~~^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/dataset.py", line 151, in __getitem__ + transformed = self.transforms[i][1](str(idx), transformed) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/train/preprocessor.py", line 547, in __call__ + data = self._speech_process(data) + ^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/train/preprocessor.py", line 451, in _speech_process + data[self.speech_name] = self.data_aug( + ^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/layers/augmentation.py", line 100, in __call__ + if isinstance(effect[1], list): + ~~~~~~^^^ +IndexError: list index out of range +2026-01-08 19:02:51 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:152 | === ESPnet3 run started: 2026-01-08T19:02:51.458046 === +2026-01-08 19:02:51 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:153 | Command: /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin/python run.py --train_config conf/train_asr_rnn_data_aug_debug.yaml --infer_config conf/infer.yaml --measure_config conf/measure.yaml +2026-01-08 19:02:51 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:156 | Working directory: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr +2026-01-08 19:02:51 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | train config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/train_asr_rnn_data_aug_debug.yaml +2026-01-08 19:02:51 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | infer config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/infer.yaml +2026-01-08 19:02:51 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | measure config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/measure.yaml +2026-01-08 19:03:03 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:167 | Git: commit=7fae474de17d0a228f7ebb269ada1103e8014e6c, short_commit=7fae474de1, branch=espnet3/integration_test, worktree=dirty +2026-01-08 19:03:03 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:250 | Cluster env: +(none) +2026-01-08 19:03:03 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:251 | Runtime env: +LD_LIBRARY_PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/usr/local/cuda-10.1/lib64 +PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/ffmpeg-release:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/festival/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/MBROLA/Bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/BeamformIt:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kenlm/build/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/PESQ/P862_annex_A_2005_CD/source:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/nkf/nkf-2.1.4:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/tokenizer:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/generic:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/tools/moses/scripts/recaser:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/training:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/mwerSegmenter:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sctk/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sph2pipe:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sentencepiece_commands:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/chainbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/featbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fstbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/gmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/ivectorbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/kwsbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/latbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/lmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet3bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnetbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/online2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/onlinebin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/rnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmm2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/tfrnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudadecoderbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudafeatbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin:/home/masao/.local/bin:/home/masao/utils:/home/masao/git/SCTK/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/usr/lib/wsl/lib:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/debugCommand:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/copilotCli:/mnt/c/Windows/system32:/mnt/c/Windows:/mnt/c/Windows/System32/Wbem:/mnt/c/Windows/System32/WindowsPowerShell/v1.0/:/mnt/c/Windows/System32/OpenSSH/:/mnt/c/Program Files (x86)/NVIDIA Corporation/PhysX/Common:/mnt/c/Program Files/NVIDIA Corporation/NVIDIA NvDLISR:/mnt/c/Program Files/dotnet/:/mnt/c/Program Files/Git/cmd:/mnt/c/Program Files/Tailscale/:/mnt/c/Users/might/AppData/Local/Microsoft/WindowsApps:/mnt/c/Users/might/AppData/Local/Programs/Microsoft VS Code/bin:/mnt/c/Users/might/AppData/Local/Muse Hub/lib:/mnt/c/Software/cmake-3.30.2-windows-x86_64/bin:/mnt/c/Software/flutter/bin:/mnt/c/Users/might/.vscode/extensions/ms-python.debugpy-2025.18.0-win32-x64/bundled/scripts/noConfigScripts:/snap/bin:/mnt/c/Software/flutter/bin +PYTHONPATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models:../../../:../../TEMPLATE/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr: +2026-01-08 19:03:03 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:140 | Train config content: +num_device: 1 +num_nodes: 1 +task: espnet3.systems.asr.task.ASRTask +recipe_dir: . +data_dir: ./data +exp_tag: train_asr_rnn_data_aug_debug +exp_dir: ./exp/train_asr_rnn_data_aug_debug +stats_dir: ./exp/stats +decode_dir: ./exp/train_asr_rnn_data_aug_debug/decode +dataset_dir: ./data/mini_an4 +create_dataset: + func: src.create_dataset.create_dataset + dataset_dir: ./data/mini_an4 + archive_path: ./../../egs2/mini_an4/asr1/downloads.tar.gz +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + train: + - name: train_nodev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv + valid: + - name: train_dev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_dev.tsv + preprocessor: + _target_: espnet2.train.preprocessor.CommonPreprocessor + fs: 16000 + data_aug_effects: + - - 0.1 + - contrast + - enhancement_amount: 75.0 + - - 0.1 + - highpass + - cutoff_freq: 5000 + Q: 0.707 + - - 0.1 + - equalization + - center_freq: 1000 + gain: 0 + Q: 0.707 + - - 0.1 + - - - 0.3 + - speed_perturb + - factor: 0.9 + - - 0.3 + - speed_perturb + - factor: 1.1 + - - 0.3 + - speed_perturb + - factor: 1.3 + data_aug_num: + - 1 + - 4 + data_aug_prob: 1.0 +parallel: + env: local + n_workers: 1 +dataloader: + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + train: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: true + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + num_workers: 0 + batches: + type: folded + shape_files: + - ./exp/stats/train/feats_shape + batch_size: 2 + batch_bins: 200000 + valid: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: false + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + batches: + type: folded + shape_files: + - ./exp/stats/valid/feats_shape + batch_size: 2 + batch_bins: 200000 +optim: + _target_: torch.optim.Adam + lr: 0.001 + weight_decay: 0.0 +scheduler: + _target_: torch.optim.lr_scheduler.ReduceLROnPlateau + mode: min + factor: 0.5 + patience: 1 +val_scheduler_criterion: +- valid +- loss +best_model_criterion: +- - valid/acc + - 1 + - max +trainer: + accelerator: auto + devices: 1 + num_nodes: 1 + accumulate_grad_batches: 1 + check_val_every_n_epoch: 1 + gradient_clip_val: 1.0 + log_every_n_steps: 1 + max_epochs: 1 + limit_train_batches: 1 + limit_val_batches: 1 + precision: 32 + logger: + - _target_: lightning.pytorch.loggers.TensorBoardLogger + save_dir: ./exp/train_asr_rnn_data_aug_debug/tensorboard + name: tb_logger + strategy: auto +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + text_builder: + func: src.tokenizer.gather_training_text + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv +model: + vocab_size: 30 + token_list: ./data/bpe_30/tokens.txt + encoder: vgg_rnn + encoder_conf: + num_layers: 1 + hidden_size: 2 + output_size: 2 + decoder: rnn + decoder_conf: + hidden_size: 2 + normalize: utterance_mvn + normalize_conf: {} + model_conf: + ctc_weight: 0.3 + lsm_weight: 0.1 + length_normalized_loss: false + frontend: default + frontend_conf: + n_fft: 512 + win_length: 400 + hop_length: 160 + +2026-01-08 19:03:03 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:144 | Infer config content: +num_device: 1 +num_nodes: 1 +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +parallel: + env: local + n_workers: 1 +model: + _target_: espnet2.bin.asr_inference.Speech2Text + asr_train_config: ./exp/mini_an4_asr_debug/config.yaml + asr_model_file: ./exp/mini_an4_asr_debug/last.ckpt + beam_size: 1 + ctc_weight: 0.3 +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + +2026-01-08 19:03:03 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:148 | Measure config content: +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +metrics: +- metric: + _target_: espnet3.systems.asr.metrics.wer.WER + clean_types: null +- metric: + _target_: espnet3.systems.asr.metrics.cer.CER + clean_types: null + +2026-01-08 19:03:03 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:49 | Initialized ASRSystem with train_config=True infer_config=True measure_config=True exp_dir=exp/train_asr_rnn_data_aug_debug +2026-01-08 19:03:03 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:165 | System: ASRSystem +2026-01-08 19:03:03 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:166 | Requested stages: ['all'] +2026-01-08 19:03:03 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:167 | Resolved stages: ['create_dataset', 'train_tokenizer', 'collect_stats', 'train', 'infer', 'measure', 'publish'] +2026-01-08 19:03:03 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: create_dataset === +2026-01-08 19:03:03 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:54 | ASRSystem.create_dataset(): starting dataset creation process +2026-01-08 19:03:03 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:63 | Creating dataset with function src.create_dataset.create_dataset +2026-01-08 19:03:04 | INFO | src.create_dataset | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/src/create_dataset.py:148 | Prepared Mini AN4 manifests under data/mini_an4/manifest +2026-01-08 19:03:04 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:65 | Dataset creation completed in 0.18s using src.create_dataset.create_dataset +2026-01-08 19:03:04 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: create_dataset (0.18s) === +2026-01-08 19:03:04 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: train_tokenizer === +2026-01-08 19:03:04 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:115 | Tokenizer already exists. Skipping train_tokenizer(). +2026-01-08 19:03:04 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: train_tokenizer (0.00s) === +2026-01-08 19:03:04 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: collect_stats === +2026-01-08 19:03:04 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:79 | Collecting stats | exp_dir=./exp/train_asr_rnn_data_aug_debug stats_dir=./exp/stats +2026-01-08 19:03:11 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:03:11 | INFO | espnet3.systems.base.train | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py:33 | Model: +ESPnetASRModel( + (frontend): DefaultFrontend( + (stft): Stft(n_fft=512, win_length=400, hop_length=160, center=True, normalized=False, onesided=True) + (frontend): Frontend() + (logmel): LogMel(sr=16000, n_fft=512, n_mels=80, fmin=0, fmax=8000.0, htk=False) + ) + (normalize): UtteranceMVN(norm_means=True, norm_vars=False) + (encoder): VGGRNNEncoder( + (enc): ModuleList( + (0): VGG2L( + (conv1_1): Conv2d(1, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv1_2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_1): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (1): RNNP( + (birnn0): LSTM(2560, 2, batch_first=True, bidirectional=True) + (bt0): Linear(in_features=4, out_features=2, bias=True) + ) + ) + ) + (decoder): RNNDecoder( + (embed): Embedding(30, 2) + (dropout_emb): Dropout(p=0.0, inplace=False) + (decoder): ModuleList( + (0): LSTMCell(4, 2) + ) + (dropout_dec): ModuleList( + (0): Dropout(p=0.0, inplace=False) + ) + (output): Linear(in_features=2, out_features=30, bias=True) + (att_list): ModuleList( + (0): AttLoc( + (mlp_enc): Linear(in_features=2, out_features=320, bias=True) + (mlp_dec): Linear(in_features=2, out_features=320, bias=False) + (mlp_att): Linear(in_features=10, out_features=320, bias=False) + (loc_conv): Conv2d(1, 10, kernel_size=(1, 201), stride=(1, 1), padding=(0, 100), bias=False) + (gvec): Linear(in_features=320, out_features=1, bias=True) + ) + ) + ) + (criterion_att): LabelSmoothingLoss( + (criterion): KLDivLoss() + ) + (ctc): CTC( + (ctc_lo): Linear(in_features=2, out_features=30, bias=True) + (ctc_loss): CTCLoss() + ) +) +2026-01-08 19:03:11 | ERROR | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:70 | Stage 'collect_stats' failed after 7.66s +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 92, in _call_target + return _target_(*args, **kwargs) + ^^^^^^^^^^^^^^^^^^^^^^^^^ +TypeError: CommonPreprocessor.__init__() missing 1 required positional argument: 'train' + +The above exception was the direct cause of the following exception: + +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py", line 61, in run_stages + fn() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py", line 84, in collect_stats + return collect_stats(self.train_config) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 68, in collect_stats + trainer = _build_trainer(cfg) + ^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 34, in _build_trainer + lit_model = LitESPnetModel(model, cfg) + ^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/modeling/model.py", line 47, in __init__ + data_organizer = instantiate(config.dataset) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 226, in instantiate + return instantiate_node( + ^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 342, in instantiate_node + value = instantiate_node( + ^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 347, in instantiate_node + return _call_target(_target_, partial, args, kwargs, full_key) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 97, in _call_target + raise InstantiationException(msg) from e +hydra.errors.InstantiationException: Error in call to target 'espnet2.train.preprocessor.CommonPreprocessor': +TypeError("CommonPreprocessor.__init__() missing 1 required positional argument: 'train'") +full_key: dataset.preprocessor +2026-01-08 19:05:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:152 | === ESPnet3 run started: 2026-01-08T19:05:24.823181 === +2026-01-08 19:05:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:153 | Command: /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin/python run.py --train_config conf/train_asr_rnn_data_aug_debug.yaml --infer_config conf/infer.yaml --measure_config conf/measure.yaml +2026-01-08 19:05:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:156 | Working directory: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr +2026-01-08 19:05:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | train config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/train_asr_rnn_data_aug_debug.yaml +2026-01-08 19:05:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | infer config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/infer.yaml +2026-01-08 19:05:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | measure config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/measure.yaml +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:167 | Git: commit=7fae474de17d0a228f7ebb269ada1103e8014e6c, short_commit=7fae474de1, branch=espnet3/integration_test, worktree=dirty +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:250 | Cluster env: +(none) +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:251 | Runtime env: +LD_LIBRARY_PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/usr/local/cuda-10.1/lib64 +PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/ffmpeg-release:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/festival/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/MBROLA/Bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/BeamformIt:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kenlm/build/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/PESQ/P862_annex_A_2005_CD/source:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/nkf/nkf-2.1.4:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/tokenizer:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/generic:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/tools/moses/scripts/recaser:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/training:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/mwerSegmenter:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sctk/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sph2pipe:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sentencepiece_commands:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/chainbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/featbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fstbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/gmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/ivectorbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/kwsbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/latbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/lmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet3bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnetbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/online2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/onlinebin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/rnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmm2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/tfrnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudadecoderbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudafeatbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin:/home/masao/.local/bin:/home/masao/utils:/home/masao/git/SCTK/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/usr/lib/wsl/lib:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/debugCommand:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/copilotCli:/mnt/c/Windows/system32:/mnt/c/Windows:/mnt/c/Windows/System32/Wbem:/mnt/c/Windows/System32/WindowsPowerShell/v1.0/:/mnt/c/Windows/System32/OpenSSH/:/mnt/c/Program Files (x86)/NVIDIA Corporation/PhysX/Common:/mnt/c/Program Files/NVIDIA Corporation/NVIDIA NvDLISR:/mnt/c/Program Files/dotnet/:/mnt/c/Program Files/Git/cmd:/mnt/c/Program Files/Tailscale/:/mnt/c/Users/might/AppData/Local/Microsoft/WindowsApps:/mnt/c/Users/might/AppData/Local/Programs/Microsoft VS Code/bin:/mnt/c/Users/might/AppData/Local/Muse Hub/lib:/mnt/c/Software/cmake-3.30.2-windows-x86_64/bin:/mnt/c/Software/flutter/bin:/mnt/c/Users/might/.vscode/extensions/ms-python.debugpy-2025.18.0-win32-x64/bundled/scripts/noConfigScripts:/snap/bin:/mnt/c/Software/flutter/bin +PYTHONPATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models:../../../:../../TEMPLATE/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr: +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:140 | Train config content: +num_device: 1 +num_nodes: 1 +task: espnet3.systems.asr.task.ASRTask +recipe_dir: . +data_dir: ./data +exp_tag: train_asr_rnn_data_aug_debug +exp_dir: ./exp/train_asr_rnn_data_aug_debug +stats_dir: ./exp/stats +decode_dir: ./exp/train_asr_rnn_data_aug_debug/decode +dataset_dir: ./data/mini_an4 +create_dataset: + func: src.create_dataset.create_dataset + dataset_dir: ./data/mini_an4 + archive_path: ./../../egs2/mini_an4/asr1/downloads.tar.gz +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + train: + - name: train_nodev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv + valid: + - name: train_dev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_dev.tsv + preprocessor: + _target_: espnet2.train.preprocessor.CommonPreprocessor + fs: 16000 + data_aug_effects: + - - 0.1 + - contrast + - enhancement_amount: 75.0 + - - 0.1 + - highpass + - cutoff_freq: 5000 + Q: 0.707 + - - 0.1 + - equalization + - center_freq: 1000 + gain: 0 + Q: 0.707 + - - 0.1 + - - - 0.3 + - speed_perturb + - factor: 0.9 + - - 0.3 + - speed_perturb + - factor: 1.1 + - - 0.3 + - speed_perturb + - factor: 1.3 + data_aug_num: + - 1 + - 4 + data_aug_prob: 1.0 +parallel: + env: local + n_workers: 1 +dataloader: + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + train: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: true + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + num_workers: 0 + batches: + type: folded + shape_files: + - ./exp/stats/train/feats_shape + batch_size: 2 + batch_bins: 200000 + valid: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: false + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + batches: + type: folded + shape_files: + - ./exp/stats/valid/feats_shape + batch_size: 2 + batch_bins: 200000 +optim: + _target_: torch.optim.Adam + lr: 0.001 + weight_decay: 0.0 +scheduler: + _target_: torch.optim.lr_scheduler.ReduceLROnPlateau + mode: min + factor: 0.5 + patience: 1 +val_scheduler_criterion: +- valid +- loss +best_model_criterion: +- - valid/acc + - 1 + - max +trainer: + accelerator: auto + devices: 1 + num_nodes: 1 + accumulate_grad_batches: 1 + check_val_every_n_epoch: 1 + gradient_clip_val: 1.0 + log_every_n_steps: 1 + max_epochs: 1 + limit_train_batches: 1 + limit_val_batches: 1 + precision: 32 + logger: + - _target_: lightning.pytorch.loggers.TensorBoardLogger + save_dir: ./exp/train_asr_rnn_data_aug_debug/tensorboard + name: tb_logger + strategy: auto +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + text_builder: + func: src.tokenizer.gather_training_text + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv +model: + vocab_size: 30 + token_list: ./data/bpe_30/tokens.txt + encoder: vgg_rnn + encoder_conf: + num_layers: 1 + hidden_size: 2 + output_size: 2 + decoder: rnn + decoder_conf: + hidden_size: 2 + normalize: utterance_mvn + normalize_conf: {} + model_conf: + ctc_weight: 0.3 + lsm_weight: 0.1 + length_normalized_loss: false + frontend: default + frontend_conf: + n_fft: 512 + win_length: 400 + hop_length: 160 + +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:144 | Infer config content: +num_device: 1 +num_nodes: 1 +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +parallel: + env: local + n_workers: 1 +model: + _target_: espnet2.bin.asr_inference.Speech2Text + asr_train_config: ./exp/mini_an4_asr_debug/config.yaml + asr_model_file: ./exp/mini_an4_asr_debug/last.ckpt + beam_size: 1 + ctc_weight: 0.3 +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:148 | Measure config content: +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +metrics: +- metric: + _target_: espnet3.systems.asr.metrics.wer.WER + clean_types: null +- metric: + _target_: espnet3.systems.asr.metrics.cer.CER + clean_types: null + +2026-01-08 19:05:37 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:49 | Initialized ASRSystem with train_config=True infer_config=True measure_config=True exp_dir=exp/train_asr_rnn_data_aug_debug +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:165 | System: ASRSystem +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:166 | Requested stages: ['all'] +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:167 | Resolved stages: ['create_dataset', 'train_tokenizer', 'collect_stats', 'train', 'infer', 'measure', 'publish'] +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: create_dataset === +2026-01-08 19:05:37 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:54 | ASRSystem.create_dataset(): starting dataset creation process +2026-01-08 19:05:37 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:63 | Creating dataset with function src.create_dataset.create_dataset +2026-01-08 19:05:37 | INFO | src.create_dataset | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/src/create_dataset.py:148 | Prepared Mini AN4 manifests under data/mini_an4/manifest +2026-01-08 19:05:37 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:65 | Dataset creation completed in 0.18s using src.create_dataset.create_dataset +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: create_dataset (0.18s) === +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: train_tokenizer === +2026-01-08 19:05:37 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:115 | Tokenizer already exists. Skipping train_tokenizer(). +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: train_tokenizer (0.00s) === +2026-01-08 19:05:37 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: collect_stats === +2026-01-08 19:05:37 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:79 | Collecting stats | exp_dir=./exp/train_asr_rnn_data_aug_debug stats_dir=./exp/stats +2026-01-08 19:05:45 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:05:45 | INFO | espnet3.systems.base.train | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py:33 | Model: +ESPnetASRModel( + (frontend): DefaultFrontend( + (stft): Stft(n_fft=512, win_length=400, hop_length=160, center=True, normalized=False, onesided=True) + (frontend): Frontend() + (logmel): LogMel(sr=16000, n_fft=512, n_mels=80, fmin=0, fmax=8000.0, htk=False) + ) + (normalize): UtteranceMVN(norm_means=True, norm_vars=False) + (encoder): VGGRNNEncoder( + (enc): ModuleList( + (0): VGG2L( + (conv1_1): Conv2d(1, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv1_2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_1): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (1): RNNP( + (birnn0): LSTM(2560, 2, batch_first=True, bidirectional=True) + (bt0): Linear(in_features=4, out_features=2, bias=True) + ) + ) + ) + (decoder): RNNDecoder( + (embed): Embedding(30, 2) + (dropout_emb): Dropout(p=0.0, inplace=False) + (decoder): ModuleList( + (0): LSTMCell(4, 2) + ) + (dropout_dec): ModuleList( + (0): Dropout(p=0.0, inplace=False) + ) + (output): Linear(in_features=2, out_features=30, bias=True) + (att_list): ModuleList( + (0): AttLoc( + (mlp_enc): Linear(in_features=2, out_features=320, bias=True) + (mlp_dec): Linear(in_features=2, out_features=320, bias=False) + (mlp_att): Linear(in_features=10, out_features=320, bias=False) + (loc_conv): Conv2d(1, 10, kernel_size=(1, 201), stride=(1, 1), padding=(0, 100), bias=False) + (gvec): Linear(in_features=320, out_features=1, bias=True) + ) + ) + ) + (criterion_att): LabelSmoothingLoss( + (criterion): KLDivLoss() + ) + (ctc): CTC( + (ctc_lo): Linear(in_features=2, out_features=30, bias=True) + (ctc_loss): CTCLoss() + ) +) +2026-01-08 19:05:45 | ERROR | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:70 | Stage 'collect_stats' failed after 7.81s +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 92, in _call_target + return _target_(*args, **kwargs) + ^^^^^^^^^^^^^^^^^^^^^^^^^ +TypeError: CommonPreprocessor.__init__() missing 1 required positional argument: 'train' + +The above exception was the direct cause of the following exception: + +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py", line 61, in run_stages + fn() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py", line 84, in collect_stats + return collect_stats(self.train_config) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 68, in collect_stats + trainer = _build_trainer(cfg) + ^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 34, in _build_trainer + lit_model = LitESPnetModel(model, cfg) + ^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/modeling/model.py", line 47, in __init__ + data_organizer = instantiate(config.dataset) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 226, in instantiate + return instantiate_node( + ^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 342, in instantiate_node + value = instantiate_node( + ^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 347, in instantiate_node + return _call_target(_target_, partial, args, kwargs, full_key) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/hydra/_internal/instantiate/_instantiate2.py", line 97, in _call_target + raise InstantiationException(msg) from e +hydra.errors.InstantiationException: Error in call to target 'espnet2.train.preprocessor.CommonPreprocessor': +TypeError("CommonPreprocessor.__init__() missing 1 required positional argument: 'train'") +full_key: dataset.preprocessor +2026-01-08 19:08:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:152 | === ESPnet3 run started: 2026-01-08T19:08:11.791472 === +2026-01-08 19:08:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:153 | Command: /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin/python run.py --train_config conf/train_asr_rnn_data_aug_debug.yaml --infer_config conf/infer.yaml --measure_config conf/measure.yaml +2026-01-08 19:08:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:156 | Working directory: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr +2026-01-08 19:08:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | train config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/train_asr_rnn_data_aug_debug.yaml +2026-01-08 19:08:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | infer config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/infer.yaml +2026-01-08 19:08:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | measure config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/measure.yaml +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:167 | Git: commit=7fae474de17d0a228f7ebb269ada1103e8014e6c, short_commit=7fae474de1, branch=espnet3/integration_test, worktree=dirty +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:250 | Cluster env: +(none) +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:251 | Runtime env: +LD_LIBRARY_PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/usr/local/cuda-10.1/lib64 +PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/ffmpeg-release:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/festival/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/MBROLA/Bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/BeamformIt:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kenlm/build/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/PESQ/P862_annex_A_2005_CD/source:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/nkf/nkf-2.1.4:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/tokenizer:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/generic:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/tools/moses/scripts/recaser:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/training:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/mwerSegmenter:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sctk/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sph2pipe:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sentencepiece_commands:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/chainbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/featbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fstbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/gmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/ivectorbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/kwsbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/latbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/lmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet3bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnetbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/online2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/onlinebin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/rnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmm2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/tfrnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudadecoderbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudafeatbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin:/home/masao/.local/bin:/home/masao/utils:/home/masao/git/SCTK/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/usr/lib/wsl/lib:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/debugCommand:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/copilotCli:/mnt/c/Windows/system32:/mnt/c/Windows:/mnt/c/Windows/System32/Wbem:/mnt/c/Windows/System32/WindowsPowerShell/v1.0/:/mnt/c/Windows/System32/OpenSSH/:/mnt/c/Program Files (x86)/NVIDIA Corporation/PhysX/Common:/mnt/c/Program Files/NVIDIA Corporation/NVIDIA NvDLISR:/mnt/c/Program Files/dotnet/:/mnt/c/Program Files/Git/cmd:/mnt/c/Program Files/Tailscale/:/mnt/c/Users/might/AppData/Local/Microsoft/WindowsApps:/mnt/c/Users/might/AppData/Local/Programs/Microsoft VS Code/bin:/mnt/c/Users/might/AppData/Local/Muse Hub/lib:/mnt/c/Software/cmake-3.30.2-windows-x86_64/bin:/mnt/c/Software/flutter/bin:/mnt/c/Users/might/.vscode/extensions/ms-python.debugpy-2025.18.0-win32-x64/bundled/scripts/noConfigScripts:/snap/bin:/mnt/c/Software/flutter/bin +PYTHONPATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models:../../../:../../TEMPLATE/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr: +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:140 | Train config content: +num_device: 1 +num_nodes: 1 +task: espnet3.systems.asr.task.ASRTask +recipe_dir: . +data_dir: ./data +exp_tag: train_asr_rnn_data_aug_debug +exp_dir: ./exp/train_asr_rnn_data_aug_debug +stats_dir: ./exp/stats +decode_dir: ./exp/train_asr_rnn_data_aug_debug/decode +dataset_dir: ./data/mini_an4 +create_dataset: + func: src.create_dataset.create_dataset + dataset_dir: ./data/mini_an4 + archive_path: ./../../egs2/mini_an4/asr1/downloads.tar.gz +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + train: + - name: train_nodev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv + valid: + - name: train_dev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_dev.tsv + preprocessor: + _target_: espnet2.train.preprocessor.CommonPreprocessor + fs: 16000 + train: true + data_aug_effects: + - - 0.1 + - contrast + - enhancement_amount: 75.0 + - - 0.1 + - highpass + - cutoff_freq: 5000 + Q: 0.707 + - - 0.1 + - equalization + - center_freq: 1000 + gain: 0 + Q: 0.707 + - - 0.1 + - - - 0.3 + - speed_perturb + - factor: 0.9 + - - 0.3 + - speed_perturb + - factor: 1.1 + - - 0.3 + - speed_perturb + - factor: 1.3 + data_aug_num: + - 1 + - 4 + data_aug_prob: 1.0 +parallel: + env: local + n_workers: 1 +dataloader: + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + train: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: true + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + num_workers: 0 + batches: + type: folded + shape_files: + - ./exp/stats/train/feats_shape + batch_size: 2 + batch_bins: 200000 + valid: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: false + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + batches: + type: folded + shape_files: + - ./exp/stats/valid/feats_shape + batch_size: 2 + batch_bins: 200000 +optim: + _target_: torch.optim.Adam + lr: 0.001 + weight_decay: 0.0 +scheduler: + _target_: torch.optim.lr_scheduler.ReduceLROnPlateau + mode: min + factor: 0.5 + patience: 1 +val_scheduler_criterion: +- valid +- loss +best_model_criterion: +- - valid/acc + - 1 + - max +trainer: + accelerator: auto + devices: 1 + num_nodes: 1 + accumulate_grad_batches: 1 + check_val_every_n_epoch: 1 + gradient_clip_val: 1.0 + log_every_n_steps: 1 + max_epochs: 1 + limit_train_batches: 1 + limit_val_batches: 1 + precision: 32 + logger: + - _target_: lightning.pytorch.loggers.TensorBoardLogger + save_dir: ./exp/train_asr_rnn_data_aug_debug/tensorboard + name: tb_logger + strategy: auto +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + text_builder: + func: src.tokenizer.gather_training_text + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv +model: + vocab_size: 30 + token_list: ./data/bpe_30/tokens.txt + encoder: vgg_rnn + encoder_conf: + num_layers: 1 + hidden_size: 2 + output_size: 2 + decoder: rnn + decoder_conf: + hidden_size: 2 + normalize: utterance_mvn + normalize_conf: {} + model_conf: + ctc_weight: 0.3 + lsm_weight: 0.1 + length_normalized_loss: false + frontend: default + frontend_conf: + n_fft: 512 + win_length: 400 + hop_length: 160 + +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:144 | Infer config content: +num_device: 1 +num_nodes: 1 +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +parallel: + env: local + n_workers: 1 +model: + _target_: espnet2.bin.asr_inference.Speech2Text + asr_train_config: ./exp/mini_an4_asr_debug/config.yaml + asr_model_file: ./exp/mini_an4_asr_debug/last.ckpt + beam_size: 1 + ctc_weight: 0.3 +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:148 | Measure config content: +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +metrics: +- metric: + _target_: espnet3.systems.asr.metrics.wer.WER + clean_types: null +- metric: + _target_: espnet3.systems.asr.metrics.cer.CER + clean_types: null + +2026-01-08 19:08:25 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:49 | Initialized ASRSystem with train_config=True infer_config=True measure_config=True exp_dir=exp/train_asr_rnn_data_aug_debug +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:165 | System: ASRSystem +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:166 | Requested stages: ['all'] +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:167 | Resolved stages: ['create_dataset', 'train_tokenizer', 'collect_stats', 'train', 'infer', 'measure', 'publish'] +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: create_dataset === +2026-01-08 19:08:25 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:54 | ASRSystem.create_dataset(): starting dataset creation process +2026-01-08 19:08:25 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:63 | Creating dataset with function src.create_dataset.create_dataset +2026-01-08 19:08:25 | INFO | src.create_dataset | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/src/create_dataset.py:148 | Prepared Mini AN4 manifests under data/mini_an4/manifest +2026-01-08 19:08:25 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:65 | Dataset creation completed in 0.27s using src.create_dataset.create_dataset +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: create_dataset (0.28s) === +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: train_tokenizer === +2026-01-08 19:08:25 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:115 | Tokenizer already exists. Skipping train_tokenizer(). +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: train_tokenizer (0.00s) === +2026-01-08 19:08:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: collect_stats === +2026-01-08 19:08:25 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:79 | Collecting stats | exp_dir=./exp/train_asr_rnn_data_aug_debug stats_dir=./exp/stats +2026-01-08 19:08:32 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:08:33 | INFO | espnet3.systems.base.train | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py:33 | Model: +ESPnetASRModel( + (frontend): DefaultFrontend( + (stft): Stft(n_fft=512, win_length=400, hop_length=160, center=True, normalized=False, onesided=True) + (frontend): Frontend() + (logmel): LogMel(sr=16000, n_fft=512, n_mels=80, fmin=0, fmax=8000.0, htk=False) + ) + (normalize): UtteranceMVN(norm_means=True, norm_vars=False) + (encoder): VGGRNNEncoder( + (enc): ModuleList( + (0): VGG2L( + (conv1_1): Conv2d(1, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv1_2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_1): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (1): RNNP( + (birnn0): LSTM(2560, 2, batch_first=True, bidirectional=True) + (bt0): Linear(in_features=4, out_features=2, bias=True) + ) + ) + ) + (decoder): RNNDecoder( + (embed): Embedding(30, 2) + (dropout_emb): Dropout(p=0.0, inplace=False) + (decoder): ModuleList( + (0): LSTMCell(4, 2) + ) + (dropout_dec): ModuleList( + (0): Dropout(p=0.0, inplace=False) + ) + (output): Linear(in_features=2, out_features=30, bias=True) + (att_list): ModuleList( + (0): AttLoc( + (mlp_enc): Linear(in_features=2, out_features=320, bias=True) + (mlp_dec): Linear(in_features=2, out_features=320, bias=False) + (mlp_att): Linear(in_features=10, out_features=320, bias=False) + (loc_conv): Conv2d(1, 10, kernel_size=(1, 201), stride=(1, 1), padding=(0, 100), bias=False) + (gvec): Linear(in_features=320, out_features=1, bias=True) + ) + ) + ) + (criterion_att): LabelSmoothingLoss( + (criterion): KLDivLoss() + ) + (ctc): CTC( + (ctc_lo): Linear(in_features=2, out_features=30, bias=True) + (ctc_loss): CTCLoss() + ) +) +2026-01-08 19:08:33 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:155 | GPU available: True (cuda), used: True +2026-01-08 19:08:33 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:158 | TPU available: False, using: 0 TPU cores +2026-01-08 19:08:33 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_train_batches=1)` was configured so 1 batch per epoch will be used. +2026-01-08 19:08:33 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_val_batches=1)` was configured so 1 batch will be used. +2026-01-08 19:08:33 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:08:33 | ERROR | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:70 | Stage 'collect_stats' failed after 8.50s +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py", line 61, in run_stages + fn() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py", line 84, in collect_stats + return collect_stats(self.train_config) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 69, in collect_stats + trainer.collect_stats() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/training/trainer.py", line 205, in collect_stats + return self.model.collect_stats(*args, **kwargs) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/modeling/model.py", line 444, in collect_stats + collect_stats( + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 512, in collect_stats + sum_dict, sq_dict, count_dict = _collect_stats_common( + ^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 375, in _collect_stats_common + results = runner(index_batches) + ^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 340, in __call__ + return self._run_local(indices) + ^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 209, in _run_local + return [f(i, **env) for i in tqdm(indices, total=len(indices))] + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 209, in + return [f(i, **env) for i in tqdm(indices, total=len(indices))] + ^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 328, in forward + return batch_collect_stats( + ^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 44, in batch_collect_stats + item = dataset[i] + ~~~~~~~^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/dataset.py", line 151, in __getitem__ + transformed = self.transforms[i][1](str(idx), transformed) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/train/preprocessor.py", line 547, in __call__ + data = self._speech_process(data) + ^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/train/preprocessor.py", line 451, in _speech_process + data[self.speech_name] = self.data_aug( + ^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/layers/augmentation.py", line 100, in __call__ + if isinstance(effect[1], list): + ~~~~~~^^^ +IndexError: list index out of range +2026-01-08 19:16:30 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:152 | === ESPnet3 run started: 2026-01-08T19:16:30.139396 === +2026-01-08 19:16:30 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:153 | Command: /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin/python run.py --train_config conf/train_asr_rnn_data_aug_debug.yaml --infer_config conf/infer.yaml --measure_config conf/measure.yaml +2026-01-08 19:16:30 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:156 | Working directory: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr +2026-01-08 19:16:30 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | train config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/train_asr_rnn_data_aug_debug.yaml +2026-01-08 19:16:30 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | infer config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/infer.yaml +2026-01-08 19:16:30 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | measure config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/measure.yaml +2026-01-08 19:16:43 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:167 | Git: commit=7fae474de17d0a228f7ebb269ada1103e8014e6c, short_commit=7fae474de1, branch=espnet3/integration_test, worktree=dirty +2026-01-08 19:16:43 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:250 | Cluster env: +(none) +2026-01-08 19:16:43 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:251 | Runtime env: +LD_LIBRARY_PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/usr/local/cuda-10.1/lib64 +PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/ffmpeg-release:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/festival/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/MBROLA/Bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/BeamformIt:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kenlm/build/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/PESQ/P862_annex_A_2005_CD/source:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/nkf/nkf-2.1.4:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/tokenizer:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/generic:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/tools/moses/scripts/recaser:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/training:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/mwerSegmenter:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sctk/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sph2pipe:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sentencepiece_commands:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/chainbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/featbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fstbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/gmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/ivectorbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/kwsbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/latbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/lmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet3bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnetbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/online2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/onlinebin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/rnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmm2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/tfrnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudadecoderbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudafeatbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin:/home/masao/.local/bin:/home/masao/utils:/home/masao/git/SCTK/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/usr/lib/wsl/lib:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/debugCommand:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/copilotCli:/mnt/c/Windows/system32:/mnt/c/Windows:/mnt/c/Windows/System32/Wbem:/mnt/c/Windows/System32/WindowsPowerShell/v1.0/:/mnt/c/Windows/System32/OpenSSH/:/mnt/c/Program Files (x86)/NVIDIA Corporation/PhysX/Common:/mnt/c/Program Files/NVIDIA Corporation/NVIDIA NvDLISR:/mnt/c/Program Files/dotnet/:/mnt/c/Program Files/Git/cmd:/mnt/c/Program Files/Tailscale/:/mnt/c/Users/might/AppData/Local/Microsoft/WindowsApps:/mnt/c/Users/might/AppData/Local/Programs/Microsoft VS Code/bin:/mnt/c/Users/might/AppData/Local/Muse Hub/lib:/mnt/c/Software/cmake-3.30.2-windows-x86_64/bin:/mnt/c/Software/flutter/bin:/mnt/c/Users/might/.vscode/extensions/ms-python.debugpy-2025.18.0-win32-x64/bundled/scripts/noConfigScripts:/snap/bin:/mnt/c/Software/flutter/bin +PYTHONPATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models:../../../:../../TEMPLATE/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr: +2026-01-08 19:16:43 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:140 | Train config content: +num_device: 1 +num_nodes: 1 +task: espnet3.systems.asr.task.ASRTask +recipe_dir: . +data_dir: ./data +exp_tag: train_asr_rnn_data_aug_debug +exp_dir: ./exp/train_asr_rnn_data_aug_debug +stats_dir: ./exp/stats +decode_dir: ./exp/train_asr_rnn_data_aug_debug/decode +dataset_dir: ./data/mini_an4 +create_dataset: + func: src.create_dataset.create_dataset + dataset_dir: ./data/mini_an4 + archive_path: ./../../egs2/mini_an4/asr1/downloads.tar.gz +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + train: + - name: train_nodev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv + valid: + - name: train_dev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_dev.tsv + preprocessor: + _target_: espnet2.train.preprocessor.CommonPreprocessor + _convert_: all + fs: 16000 + train: true + data_aug_effects: + - - 0.1 + - contrast + - enhancement_amount: 75.0 + - - 0.1 + - highpass + - cutoff_freq: 5000 + Q: 0.707 + - - 0.1 + - equalization + - center_freq: 1000 + gain: 0 + Q: 0.707 + - - 0.1 + - - - 0.3 + - speed_perturb + - factor: 0.9 + - - 0.3 + - speed_perturb + - factor: 1.1 + - - 0.3 + - speed_perturb + - factor: 1.3 + data_aug_num: + - 1 + - 4 + data_aug_prob: 1.0 +parallel: + env: local + n_workers: 1 +dataloader: + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + train: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: true + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + num_workers: 0 + batches: + type: folded + shape_files: + - ./exp/stats/train/feats_shape + batch_size: 2 + batch_bins: 200000 + valid: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: false + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + batches: + type: folded + shape_files: + - ./exp/stats/valid/feats_shape + batch_size: 2 + batch_bins: 200000 +optim: + _target_: torch.optim.Adam + lr: 0.001 + weight_decay: 0.0 +scheduler: + _target_: torch.optim.lr_scheduler.ReduceLROnPlateau + mode: min + factor: 0.5 + patience: 1 +val_scheduler_criterion: +- valid +- loss +best_model_criterion: +- - valid/acc + - 1 + - max +trainer: + accelerator: auto + devices: 1 + num_nodes: 1 + accumulate_grad_batches: 1 + check_val_every_n_epoch: 1 + gradient_clip_val: 1.0 + log_every_n_steps: 1 + max_epochs: 1 + limit_train_batches: 1 + limit_val_batches: 1 + precision: 32 + logger: + - _target_: lightning.pytorch.loggers.TensorBoardLogger + save_dir: ./exp/train_asr_rnn_data_aug_debug/tensorboard + name: tb_logger + strategy: auto +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + text_builder: + func: src.tokenizer.gather_training_text + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv +model: + vocab_size: 30 + token_list: ./data/bpe_30/tokens.txt + encoder: vgg_rnn + encoder_conf: + num_layers: 1 + hidden_size: 2 + output_size: 2 + decoder: rnn + decoder_conf: + hidden_size: 2 + normalize: utterance_mvn + normalize_conf: {} + model_conf: + ctc_weight: 0.3 + lsm_weight: 0.1 + length_normalized_loss: false + frontend: default + frontend_conf: + n_fft: 512 + win_length: 400 + hop_length: 160 + +2026-01-08 19:16:43 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:144 | Infer config content: +num_device: 1 +num_nodes: 1 +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +parallel: + env: local + n_workers: 1 +model: + _target_: espnet2.bin.asr_inference.Speech2Text + asr_train_config: ./exp/mini_an4_asr_debug/config.yaml + asr_model_file: ./exp/mini_an4_asr_debug/last.ckpt + beam_size: 1 + ctc_weight: 0.3 +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + +2026-01-08 19:16:43 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:148 | Measure config content: +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +metrics: +- metric: + _target_: espnet3.systems.asr.metrics.wer.WER + clean_types: null +- metric: + _target_: espnet3.systems.asr.metrics.cer.CER + clean_types: null + +2026-01-08 19:16:43 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:49 | Initialized ASRSystem with train_config=True infer_config=True measure_config=True exp_dir=exp/train_asr_rnn_data_aug_debug +2026-01-08 19:16:43 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:165 | System: ASRSystem +2026-01-08 19:16:43 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:166 | Requested stages: ['all'] +2026-01-08 19:16:43 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:167 | Resolved stages: ['create_dataset', 'train_tokenizer', 'collect_stats', 'train', 'infer', 'measure', 'publish'] +2026-01-08 19:16:43 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: create_dataset === +2026-01-08 19:16:43 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:54 | ASRSystem.create_dataset(): starting dataset creation process +2026-01-08 19:16:43 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:63 | Creating dataset with function src.create_dataset.create_dataset +2026-01-08 19:16:44 | INFO | src.create_dataset | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/src/create_dataset.py:148 | Prepared Mini AN4 manifests under data/mini_an4/manifest +2026-01-08 19:16:44 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:65 | Dataset creation completed in 0.20s using src.create_dataset.create_dataset +2026-01-08 19:16:44 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: create_dataset (0.20s) === +2026-01-08 19:16:44 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: train_tokenizer === +2026-01-08 19:16:44 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:115 | Tokenizer already exists. Skipping train_tokenizer(). +2026-01-08 19:16:44 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: train_tokenizer (0.00s) === +2026-01-08 19:16:44 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: collect_stats === +2026-01-08 19:16:44 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:79 | Collecting stats | exp_dir=./exp/train_asr_rnn_data_aug_debug stats_dir=./exp/stats +2026-01-08 19:16:51 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:16:51 | INFO | espnet3.systems.base.train | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py:33 | Model: +ESPnetASRModel( + (frontend): DefaultFrontend( + (stft): Stft(n_fft=512, win_length=400, hop_length=160, center=True, normalized=False, onesided=True) + (frontend): Frontend() + (logmel): LogMel(sr=16000, n_fft=512, n_mels=80, fmin=0, fmax=8000.0, htk=False) + ) + (normalize): UtteranceMVN(norm_means=True, norm_vars=False) + (encoder): VGGRNNEncoder( + (enc): ModuleList( + (0): VGG2L( + (conv1_1): Conv2d(1, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv1_2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_1): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (1): RNNP( + (birnn0): LSTM(2560, 2, batch_first=True, bidirectional=True) + (bt0): Linear(in_features=4, out_features=2, bias=True) + ) + ) + ) + (decoder): RNNDecoder( + (embed): Embedding(30, 2) + (dropout_emb): Dropout(p=0.0, inplace=False) + (decoder): ModuleList( + (0): LSTMCell(4, 2) + ) + (dropout_dec): ModuleList( + (0): Dropout(p=0.0, inplace=False) + ) + (output): Linear(in_features=2, out_features=30, bias=True) + (att_list): ModuleList( + (0): AttLoc( + (mlp_enc): Linear(in_features=2, out_features=320, bias=True) + (mlp_dec): Linear(in_features=2, out_features=320, bias=False) + (mlp_att): Linear(in_features=10, out_features=320, bias=False) + (loc_conv): Conv2d(1, 10, kernel_size=(1, 201), stride=(1, 1), padding=(0, 100), bias=False) + (gvec): Linear(in_features=320, out_features=1, bias=True) + ) + ) + ) + (criterion_att): LabelSmoothingLoss( + (criterion): KLDivLoss() + ) + (ctc): CTC( + (ctc_lo): Linear(in_features=2, out_features=30, bias=True) + (ctc_loss): CTCLoss() + ) +) +2026-01-08 19:16:51 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:155 | GPU available: True (cuda), used: True +2026-01-08 19:16:51 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:158 | TPU available: False, using: 0 TPU cores +2026-01-08 19:16:51 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_train_batches=1)` was configured so 1 batch per epoch will be used. +2026-01-08 19:16:51 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_val_batches=1)` was configured so 1 batch will be used. +2026-01-08 19:16:52 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:16:52 | ERROR | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:70 | Stage 'collect_stats' failed after 8.42s +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py", line 61, in run_stages + fn() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py", line 84, in collect_stats + return collect_stats(self.train_config) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 69, in collect_stats + trainer.collect_stats() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/training/trainer.py", line 205, in collect_stats + return self.model.collect_stats(*args, **kwargs) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/modeling/model.py", line 444, in collect_stats + collect_stats( + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 512, in collect_stats + sum_dict, sq_dict, count_dict = _collect_stats_common( + ^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 375, in _collect_stats_common + results = runner(index_batches) + ^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 340, in __call__ + return self._run_local(indices) + ^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 209, in _run_local + return [f(i, **env) for i in tqdm(indices, total=len(indices))] + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 209, in + return [f(i, **env) for i in tqdm(indices, total=len(indices))] + ^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 328, in forward + return batch_collect_stats( + ^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 56, in batch_collect_stats + batch = collate_fn(structured_items) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/train/collate_fn.py", line 38, in __call__ + return common_collate_fn( + ^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/train/collate_fn.py", line 404, in common_collate_fn + if data[0][key].dtype.kind == "i": + ^^^^^^^^^^^^^^^^^^ +AttributeError: 'str' object has no attribute 'dtype' +2026-01-08 19:22:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:152 | === ESPnet3 run started: 2026-01-08T19:22:11.289407 === +2026-01-08 19:22:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:153 | Command: /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin/python run.py --train_config conf/train_asr_rnn_data_aug_debug.yaml --infer_config conf/infer.yaml --measure_config conf/measure.yaml +2026-01-08 19:22:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:156 | Working directory: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr +2026-01-08 19:22:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | train config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/train_asr_rnn_data_aug_debug.yaml +2026-01-08 19:22:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | infer config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/infer.yaml +2026-01-08 19:22:11 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | measure config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/measure.yaml +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:167 | Git: commit=7fae474de17d0a228f7ebb269ada1103e8014e6c, short_commit=7fae474de1, branch=espnet3/integration_test, worktree=dirty +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:250 | Cluster env: +(none) +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:251 | Runtime env: +LD_LIBRARY_PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/usr/local/cuda-10.1/lib64 +PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/ffmpeg-release:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/festival/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/MBROLA/Bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/BeamformIt:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kenlm/build/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/PESQ/P862_annex_A_2005_CD/source:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/nkf/nkf-2.1.4:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/tokenizer:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/generic:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/tools/moses/scripts/recaser:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/training:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/mwerSegmenter:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sctk/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sph2pipe:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sentencepiece_commands:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/chainbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/featbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fstbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/gmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/ivectorbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/kwsbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/latbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/lmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet3bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnetbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/online2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/onlinebin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/rnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmm2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/tfrnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudadecoderbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudafeatbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin:/home/masao/.local/bin:/home/masao/utils:/home/masao/git/SCTK/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/usr/lib/wsl/lib:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/debugCommand:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/copilotCli:/mnt/c/Windows/system32:/mnt/c/Windows:/mnt/c/Windows/System32/Wbem:/mnt/c/Windows/System32/WindowsPowerShell/v1.0/:/mnt/c/Windows/System32/OpenSSH/:/mnt/c/Program Files (x86)/NVIDIA Corporation/PhysX/Common:/mnt/c/Program Files/NVIDIA Corporation/NVIDIA NvDLISR:/mnt/c/Program Files/dotnet/:/mnt/c/Program Files/Git/cmd:/mnt/c/Program Files/Tailscale/:/mnt/c/Users/might/AppData/Local/Microsoft/WindowsApps:/mnt/c/Users/might/AppData/Local/Programs/Microsoft VS Code/bin:/mnt/c/Users/might/AppData/Local/Muse Hub/lib:/mnt/c/Software/cmake-3.30.2-windows-x86_64/bin:/mnt/c/Software/flutter/bin:/mnt/c/Users/might/.vscode/extensions/ms-python.debugpy-2025.18.0-win32-x64/bundled/scripts/noConfigScripts:/snap/bin:/mnt/c/Software/flutter/bin +PYTHONPATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models:../../../:../../TEMPLATE/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr: +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:140 | Train config content: +num_device: 1 +num_nodes: 1 +task: espnet3.systems.asr.task.ASRTask +recipe_dir: . +data_dir: ./data +exp_tag: train_asr_rnn_data_aug_debug +exp_dir: ./exp/train_asr_rnn_data_aug_debug +stats_dir: ./exp/stats +decode_dir: ./exp/train_asr_rnn_data_aug_debug/decode +dataset_dir: ./data/mini_an4 +create_dataset: + func: src.create_dataset.create_dataset + dataset_dir: ./data/mini_an4 + archive_path: ./../../egs2/mini_an4/asr1/downloads.tar.gz +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + train: + - name: train_nodev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv + valid: + - name: train_dev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_dev.tsv + preprocessor: + _target_: espnet2.train.preprocessor.CommonPreprocessor + _convert_: all + fs: 16000 + train: true + data_aug_effects: + - - 0.1 + - contrast + - enhancement_amount: 75.0 + - - 0.1 + - highpass + - cutoff_freq: 5000 + Q: 0.707 + - - 0.1 + - equalization + - center_freq: 1000 + gain: 0 + Q: 0.707 + - - 0.1 + - - - 0.3 + - speed_perturb + - factor: 0.9 + - - 0.3 + - speed_perturb + - factor: 1.1 + - - 0.3 + - speed_perturb + - factor: 1.3 + data_aug_num: + - 1 + - 4 + data_aug_prob: 1.0 +parallel: + env: local + n_workers: 1 +dataloader: + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + train: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: true + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + num_workers: 0 + batches: + type: folded + shape_files: + - ./exp/stats/train/feats_shape + batch_size: 2 + batch_bins: 200000 + valid: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: false + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + batches: + type: folded + shape_files: + - ./exp/stats/valid/feats_shape + batch_size: 2 + batch_bins: 200000 +optim: + _target_: torch.optim.Adam + lr: 0.001 + weight_decay: 0.0 +scheduler: + _target_: torch.optim.lr_scheduler.ReduceLROnPlateau + mode: min + factor: 0.5 + patience: 1 +val_scheduler_criterion: +- valid +- loss +best_model_criterion: +- - valid/acc + - 1 + - max +trainer: + accelerator: auto + devices: 1 + num_nodes: 1 + accumulate_grad_batches: 1 + check_val_every_n_epoch: 1 + gradient_clip_val: 1.0 + log_every_n_steps: 1 + max_epochs: 1 + limit_train_batches: 1 + limit_val_batches: 1 + precision: 32 + logger: + - _target_: lightning.pytorch.loggers.TensorBoardLogger + save_dir: ./exp/train_asr_rnn_data_aug_debug/tensorboard + name: tb_logger + strategy: auto +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + text_builder: + func: src.tokenizer.gather_training_text + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv +model: + vocab_size: 30 + token_list: ./data/bpe_30/tokens.txt + encoder: vgg_rnn + encoder_conf: + num_layers: 1 + hidden_size: 2 + output_size: 2 + decoder: rnn + decoder_conf: + hidden_size: 2 + normalize: utterance_mvn + normalize_conf: {} + model_conf: + ctc_weight: 0.3 + lsm_weight: 0.1 + length_normalized_loss: false + frontend: default + frontend_conf: + n_fft: 512 + win_length: 400 + hop_length: 160 + +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:144 | Infer config content: +num_device: 1 +num_nodes: 1 +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +parallel: + env: local + n_workers: 1 +model: + _target_: espnet2.bin.asr_inference.Speech2Text + asr_train_config: ./exp/mini_an4_asr_debug/config.yaml + asr_model_file: ./exp/mini_an4_asr_debug/last.ckpt + beam_size: 1 + ctc_weight: 0.3 +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:148 | Measure config content: +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +metrics: +- metric: + _target_: espnet3.systems.asr.metrics.wer.WER + clean_types: null +- metric: + _target_: espnet3.systems.asr.metrics.cer.CER + clean_types: null + +2026-01-08 19:22:24 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:49 | Initialized ASRSystem with train_config=True infer_config=True measure_config=True exp_dir=exp/train_asr_rnn_data_aug_debug +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:165 | System: ASRSystem +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:166 | Requested stages: ['all'] +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:167 | Resolved stages: ['create_dataset', 'train_tokenizer', 'collect_stats', 'train', 'infer', 'measure', 'publish'] +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: create_dataset === +2026-01-08 19:22:24 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:54 | ASRSystem.create_dataset(): starting dataset creation process +2026-01-08 19:22:24 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:63 | Creating dataset with function src.create_dataset.create_dataset +2026-01-08 19:22:24 | INFO | src.create_dataset | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/src/create_dataset.py:148 | Prepared Mini AN4 manifests under data/mini_an4/manifest +2026-01-08 19:22:24 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:65 | Dataset creation completed in 0.18s using src.create_dataset.create_dataset +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: create_dataset (0.18s) === +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: train_tokenizer === +2026-01-08 19:22:24 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:115 | Tokenizer already exists. Skipping train_tokenizer(). +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: train_tokenizer (0.00s) === +2026-01-08 19:22:24 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: collect_stats === +2026-01-08 19:22:24 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:79 | Collecting stats | exp_dir=./exp/train_asr_rnn_data_aug_debug stats_dir=./exp/stats +2026-01-08 19:22:32 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:22:33 | INFO | espnet3.systems.base.train | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py:33 | Model: +ESPnetASRModel( + (frontend): DefaultFrontend( + (stft): Stft(n_fft=512, win_length=400, hop_length=160, center=True, normalized=False, onesided=True) + (frontend): Frontend() + (logmel): LogMel(sr=16000, n_fft=512, n_mels=80, fmin=0, fmax=8000.0, htk=False) + ) + (normalize): UtteranceMVN(norm_means=True, norm_vars=False) + (encoder): VGGRNNEncoder( + (enc): ModuleList( + (0): VGG2L( + (conv1_1): Conv2d(1, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv1_2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_1): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (1): RNNP( + (birnn0): LSTM(2560, 2, batch_first=True, bidirectional=True) + (bt0): Linear(in_features=4, out_features=2, bias=True) + ) + ) + ) + (decoder): RNNDecoder( + (embed): Embedding(30, 2) + (dropout_emb): Dropout(p=0.0, inplace=False) + (decoder): ModuleList( + (0): LSTMCell(4, 2) + ) + (dropout_dec): ModuleList( + (0): Dropout(p=0.0, inplace=False) + ) + (output): Linear(in_features=2, out_features=30, bias=True) + (att_list): ModuleList( + (0): AttLoc( + (mlp_enc): Linear(in_features=2, out_features=320, bias=True) + (mlp_dec): Linear(in_features=2, out_features=320, bias=False) + (mlp_att): Linear(in_features=10, out_features=320, bias=False) + (loc_conv): Conv2d(1, 10, kernel_size=(1, 201), stride=(1, 1), padding=(0, 100), bias=False) + (gvec): Linear(in_features=320, out_features=1, bias=True) + ) + ) + ) + (criterion_att): LabelSmoothingLoss( + (criterion): KLDivLoss() + ) + (ctc): CTC( + (ctc_lo): Linear(in_features=2, out_features=30, bias=True) + (ctc_loss): CTCLoss() + ) +) +2026-01-08 19:22:33 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:155 | GPU available: True (cuda), used: True +2026-01-08 19:22:33 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:158 | TPU available: False, using: 0 TPU cores +2026-01-08 19:22:33 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_train_batches=1)` was configured so 1 batch per epoch will be used. +2026-01-08 19:22:33 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_val_batches=1)` was configured so 1 batch will be used. +2026-01-08 19:22:33 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:22:33 | ERROR | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:70 | Stage 'collect_stats' failed after 9.07s +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py", line 61, in run_stages + fn() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py", line 84, in collect_stats + return collect_stats(self.train_config) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 69, in collect_stats + trainer.collect_stats() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/training/trainer.py", line 205, in collect_stats + return self.model.collect_stats(*args, **kwargs) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/modeling/model.py", line 444, in collect_stats + collect_stats( + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 512, in collect_stats + sum_dict, sq_dict, count_dict = _collect_stats_common( + ^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 375, in _collect_stats_common + results = runner(index_batches) + ^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 340, in __call__ + return self._run_local(indices) + ^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 209, in _run_local + return [f(i, **env) for i in tqdm(indices, total=len(indices))] + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/parallel/base_runner.py", line 209, in + return [f(i, **env) for i in tqdm(indices, total=len(indices))] + ^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 328, in forward + return batch_collect_stats( + ^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/data/collect_stats.py", line 56, in batch_collect_stats + batch = collate_fn(structured_items) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/train/collate_fn.py", line 38, in __call__ + return common_collate_fn( + ^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet2/train/collate_fn.py", line 405, in common_collate_fn + if data[0][key].dtype.kind == "i": + ^^^^^^^^^^^^^^^^^^ +AttributeError: 'str' object has no attribute 'dtype' +2026-01-08 19:24:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:152 | === ESPnet3 run started: 2026-01-08T19:24:25.834405 === +2026-01-08 19:24:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:153 | Command: /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin/python run.py --train_config conf/train_asr_rnn_data_aug_debug.yaml --infer_config conf/infer.yaml --measure_config conf/measure.yaml +2026-01-08 19:24:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:156 | Working directory: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr +2026-01-08 19:24:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | train config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/train_asr_rnn_data_aug_debug.yaml +2026-01-08 19:24:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | infer config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/infer.yaml +2026-01-08 19:24:25 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:162 | measure config: /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/conf/measure.yaml +2026-01-08 19:24:38 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:167 | Git: commit=7fae474de17d0a228f7ebb269ada1103e8014e6c, short_commit=7fae474de1, branch=espnet3/integration_test, worktree=dirty +2026-01-08 19:24:38 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:250 | Cluster env: +(none) +2026-01-08 19:24:38 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/logging.py:251 | Runtime env: +LD_LIBRARY_PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/lib64:/usr/local/cuda-10.1/lib64 +PATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/ffmpeg-release:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/festival/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/MBROLA/Bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/espeak-ng/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/BeamformIt:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kenlm/build/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/PESQ/P862_annex_A_2005_CD/source:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/nkf/nkf-2.1.4:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/tokenizer:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/generic:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/tools/moses/scripts/recaser:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/moses/scripts/training:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/mwerSegmenter:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sctk/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sph2pipe:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/sentencepiece_commands:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/chainbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/featbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/fstbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/gmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/ivectorbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/kwsbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/latbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/lmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnet3bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/nnetbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/online2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/onlinebin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/rnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmm2bin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/sgmmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/tfrnnlmbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudadecoderbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/kaldi/src/cudafeatbin:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/bin:/home/masao/.local/bin:/home/masao/utils:/home/masao/git/SCTK/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/usr/lib/wsl/lib:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/debugCommand:/mnt/c/Users/might/AppData/Roaming/Code/User/globalStorage/github.copilot-chat/copilotCli:/mnt/c/Windows/system32:/mnt/c/Windows:/mnt/c/Windows/System32/Wbem:/mnt/c/Windows/System32/WindowsPowerShell/v1.0/:/mnt/c/Windows/System32/OpenSSH/:/mnt/c/Program Files (x86)/NVIDIA Corporation/PhysX/Common:/mnt/c/Program Files/NVIDIA Corporation/NVIDIA NvDLISR:/mnt/c/Program Files/dotnet/:/mnt/c/Program Files/Git/cmd:/mnt/c/Program Files/Tailscale/:/mnt/c/Users/might/AppData/Local/Microsoft/WindowsApps:/mnt/c/Users/might/AppData/Local/Programs/Microsoft VS Code/bin:/mnt/c/Users/might/AppData/Local/Muse Hub/lib:/mnt/c/Software/cmake-3.30.2-windows-x86_64/bin:/mnt/c/Software/flutter/bin:/mnt/c/Users/might/.vscode/extensions/ms-python.debugpy-2025.18.0-win32-x64/bundled/scripts/noConfigScripts:/snap/bin:/mnt/c/Software/flutter/bin +PYTHONPATH=/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3:/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/RawNet/python/RawNet3/models:../../../:../../TEMPLATE/asr:/mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr: +2026-01-08 19:24:38 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:140 | Train config content: +num_device: 1 +num_nodes: 1 +task: espnet3.systems.asr.task.ASRTask +recipe_dir: . +data_dir: ./data +exp_tag: train_asr_rnn_data_aug_debug +exp_dir: ./exp/train_asr_rnn_data_aug_debug +stats_dir: ./exp/stats +decode_dir: ./exp/train_asr_rnn_data_aug_debug/decode +dataset_dir: ./data/mini_an4 +create_dataset: + func: src.create_dataset.create_dataset + dataset_dir: ./data/mini_an4 + archive_path: ./../../egs2/mini_an4/asr1/downloads.tar.gz +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + train: + - name: train_nodev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv + valid: + - name: train_dev + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/train_dev.tsv + preprocessor: + _target_: espnet2.train.preprocessor.CommonPreprocessor + _convert_: all + fs: 16000 + train: true + data_aug_effects: + - - 0.1 + - contrast + - enhancement_amount: 75.0 + - - 0.1 + - highpass + - cutoff_freq: 5000 + Q: 0.707 + - - 0.1 + - equalization + - center_freq: 1000 + gain: 0 + Q: 0.707 + - - 0.1 + - - - 0.3 + - speed_perturb + - factor: 0.9 + - - 0.3 + - speed_perturb + - factor: 1.1 + - - 0.3 + - speed_perturb + - factor: 1.3 + data_aug_num: + - 1 + - 4 + data_aug_prob: 1.0 + token_type: bpe + token_list: ./data/bpe_30/tokens.txt + bpemodel: ./data/bpe_30/bpe.model +parallel: + env: local + n_workers: 1 +dataloader: + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + train: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: true + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + num_workers: 0 + batches: + type: folded + shape_files: + - ./exp/stats/train/feats_shape + batch_size: 2 + batch_bins: 200000 + valid: + multiple_iterator: false + num_shards: 1 + iter_factory: + _target_: espnet2.iterators.sequence_iter_factory.SequenceIterFactory + shuffle: false + collate_fn: + _target_: espnet2.train.collate_fn.CommonCollateFn + int_pad_value: -1 + batches: + type: folded + shape_files: + - ./exp/stats/valid/feats_shape + batch_size: 2 + batch_bins: 200000 +optim: + _target_: torch.optim.Adam + lr: 0.001 + weight_decay: 0.0 +scheduler: + _target_: torch.optim.lr_scheduler.ReduceLROnPlateau + mode: min + factor: 0.5 + patience: 1 +val_scheduler_criterion: +- valid +- loss +best_model_criterion: +- - valid/acc + - 1 + - max +trainer: + accelerator: auto + devices: 1 + num_nodes: 1 + accumulate_grad_batches: 1 + check_val_every_n_epoch: 1 + gradient_clip_val: 1.0 + log_every_n_steps: 1 + max_epochs: 1 + limit_train_batches: 1 + limit_val_batches: 1 + precision: 32 + logger: + - _target_: lightning.pytorch.loggers.TensorBoardLogger + save_dir: ./exp/train_asr_rnn_data_aug_debug/tensorboard + name: tb_logger + strategy: auto +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + text_builder: + func: src.tokenizer.gather_training_text + manifest_path: ./data/mini_an4/manifest/train_nodev.tsv +model: + vocab_size: 30 + token_list: ./data/bpe_30/tokens.txt + encoder: vgg_rnn + encoder_conf: + num_layers: 1 + hidden_size: 2 + output_size: 2 + decoder: rnn + decoder_conf: + hidden_size: 2 + normalize: utterance_mvn + normalize_conf: {} + model_conf: + ctc_weight: 0.3 + lsm_weight: 0.1 + length_normalized_loss: false + frontend: default + frontend_conf: + n_fft: 512 + win_length: 400 + hop_length: 160 + +2026-01-08 19:24:38 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:144 | Infer config content: +num_device: 1 +num_nodes: 1 +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +parallel: + env: local + n_workers: 1 +model: + _target_: espnet2.bin.asr_inference.Speech2Text + asr_train_config: ./exp/mini_an4_asr_debug/config.yaml + asr_model_file: ./exp/mini_an4_asr_debug/last.ckpt + beam_size: 1 + ctc_weight: 0.3 +tokenizer: + vocab_size: 30 + character_coverage: 1.0 + model_type: bpe + save_path: ./data/bpe_30 + +2026-01-08 19:24:38 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:148 | Measure config content: +recipe_dir: . +data_dir: ./data +exp_tag: mini_an4_asr_debug +exp_dir: ./exp/mini_an4_asr_debug +stats_dir: ./exp/stats +decode_dir: ./exp/mini_an4_asr_debug/decode +dataset_dir: ./data/mini_an4 +dataset: + _target_: espnet3.components.data.data_organizer.DataOrganizer + test: + - name: test + dataset: + _target_: src.dataset.MiniAN4Dataset + manifest_path: ./data/mini_an4/manifest/test.tsv +metrics: +- metric: + _target_: espnet3.systems.asr.metrics.wer.WER + clean_types: null +- metric: + _target_: espnet3.systems.asr.metrics.cer.CER + clean_types: null + +2026-01-08 19:24:38 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:49 | Initialized ASRSystem with train_config=True infer_config=True measure_config=True exp_dir=exp/train_asr_rnn_data_aug_debug +2026-01-08 19:24:38 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:165 | System: ASRSystem +2026-01-08 19:24:38 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:166 | Requested stages: ['all'] +2026-01-08 19:24:38 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/TEMPLATE/asr/run.py:167 | Resolved stages: ['create_dataset', 'train_tokenizer', 'collect_stats', 'train', 'infer', 'measure', 'publish'] +2026-01-08 19:24:38 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: create_dataset === +2026-01-08 19:24:38 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:54 | ASRSystem.create_dataset(): starting dataset creation process +2026-01-08 19:24:38 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:63 | Creating dataset with function src.create_dataset.create_dataset +2026-01-08 19:24:39 | INFO | src.create_dataset | /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/src/create_dataset.py:148 | Prepared Mini AN4 manifests under data/mini_an4/manifest +2026-01-08 19:24:39 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:65 | Dataset creation completed in 0.16s using src.create_dataset.create_dataset +2026-01-08 19:24:39 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: create_dataset (0.16s) === +2026-01-08 19:24:39 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: train_tokenizer === +2026-01-08 19:24:39 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:115 | Tokenizer already exists. Skipping train_tokenizer(). +2026-01-08 19:24:39 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: train_tokenizer (0.00s) === +2026-01-08 19:24:39 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: collect_stats === +2026-01-08 19:24:39 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:79 | Collecting stats | exp_dir=./exp/train_asr_rnn_data_aug_debug stats_dir=./exp/stats +2026-01-08 19:24:46 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:24:46 | INFO | espnet3.systems.base.train | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py:33 | Model: +ESPnetASRModel( + (frontend): DefaultFrontend( + (stft): Stft(n_fft=512, win_length=400, hop_length=160, center=True, normalized=False, onesided=True) + (frontend): Frontend() + (logmel): LogMel(sr=16000, n_fft=512, n_mels=80, fmin=0, fmax=8000.0, htk=False) + ) + (normalize): UtteranceMVN(norm_means=True, norm_vars=False) + (encoder): VGGRNNEncoder( + (enc): ModuleList( + (0): VGG2L( + (conv1_1): Conv2d(1, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv1_2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_1): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (1): RNNP( + (birnn0): LSTM(2560, 2, batch_first=True, bidirectional=True) + (bt0): Linear(in_features=4, out_features=2, bias=True) + ) + ) + ) + (decoder): RNNDecoder( + (embed): Embedding(30, 2) + (dropout_emb): Dropout(p=0.0, inplace=False) + (decoder): ModuleList( + (0): LSTMCell(4, 2) + ) + (dropout_dec): ModuleList( + (0): Dropout(p=0.0, inplace=False) + ) + (output): Linear(in_features=2, out_features=30, bias=True) + (att_list): ModuleList( + (0): AttLoc( + (mlp_enc): Linear(in_features=2, out_features=320, bias=True) + (mlp_dec): Linear(in_features=2, out_features=320, bias=False) + (mlp_att): Linear(in_features=10, out_features=320, bias=False) + (loc_conv): Conv2d(1, 10, kernel_size=(1, 201), stride=(1, 1), padding=(0, 100), bias=False) + (gvec): Linear(in_features=320, out_features=1, bias=True) + ) + ) + ) + (criterion_att): LabelSmoothingLoss( + (criterion): KLDivLoss() + ) + (ctc): CTC( + (ctc_lo): Linear(in_features=2, out_features=30, bias=True) + (ctc_loss): CTCLoss() + ) +) +2026-01-08 19:24:46 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:155 | GPU available: True (cuda), used: True +2026-01-08 19:24:46 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:158 | TPU available: False, using: 0 TPU cores +2026-01-08 19:24:46 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_train_batches=1)` was configured so 1 batch per epoch will be used. +2026-01-08 19:24:46 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_val_batches=1)` was configured so 1 batch will be used. +2026-01-08 19:24:47 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:24:48 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:24:48 | INFO | espnet3.systems.base.train | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py:70 | Collect stats finished in 9.26s | exp_dir=./exp/train_asr_rnn_data_aug_debug stats_dir=./exp/stats +2026-01-08 19:24:48 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:74 | === [DONE] stage: collect_stats (9.27s) === +2026-01-08 19:24:48 | INFO | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:59 | === [START] stage: train === +2026-01-08 19:24:48 | INFO | espnet3.systems.asr.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py:82 | ASRSystem.train(): starting training process +2026-01-08 19:24:48 | INFO | espnet3.systems.base.system | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py:94 | Training start | exp_dir=./exp/train_asr_rnn_data_aug_debug model= +2026-01-08 19:24:48 | INFO | root | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/task.py:548 | Vocabulary size: 30 +2026-01-08 19:24:48 | INFO | espnet3.systems.base.train | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py:33 | Model: +ESPnetASRModel( + (frontend): DefaultFrontend( + (stft): Stft(n_fft=512, win_length=400, hop_length=160, center=True, normalized=False, onesided=True) + (frontend): Frontend() + (logmel): LogMel(sr=16000, n_fft=512, n_mels=80, fmin=0, fmax=8000.0, htk=False) + ) + (normalize): UtteranceMVN(norm_means=True, norm_vars=False) + (encoder): VGGRNNEncoder( + (enc): ModuleList( + (0): VGG2L( + (conv1_1): Conv2d(1, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv1_2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_1): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (conv2_2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (1): RNNP( + (birnn0): LSTM(2560, 2, batch_first=True, bidirectional=True) + (bt0): Linear(in_features=4, out_features=2, bias=True) + ) + ) + ) + (decoder): RNNDecoder( + (embed): Embedding(30, 2) + (dropout_emb): Dropout(p=0.0, inplace=False) + (decoder): ModuleList( + (0): LSTMCell(4, 2) + ) + (dropout_dec): ModuleList( + (0): Dropout(p=0.0, inplace=False) + ) + (output): Linear(in_features=2, out_features=30, bias=True) + (att_list): ModuleList( + (0): AttLoc( + (mlp_enc): Linear(in_features=2, out_features=320, bias=True) + (mlp_dec): Linear(in_features=2, out_features=320, bias=False) + (mlp_att): Linear(in_features=10, out_features=320, bias=False) + (loc_conv): Conv2d(1, 10, kernel_size=(1, 201), stride=(1, 1), padding=(0, 100), bias=False) + (gvec): Linear(in_features=320, out_features=1, bias=True) + ) + ) + ) + (criterion_att): LabelSmoothingLoss( + (criterion): KLDivLoss() + ) + (ctc): CTC( + (ctc_lo): Linear(in_features=2, out_features=30, bias=True) + (ctc_loss): CTCLoss() + ) +) +2026-01-08 19:24:48 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:155 | GPU available: True (cuda), used: True +2026-01-08 19:24:48 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:158 | TPU available: False, using: 0 TPU cores +2026-01-08 19:24:48 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_train_batches=1)` was configured so 1 batch per epoch will be used. +2026-01-08 19:24:48 | INFO | lightning.pytorch.utilities.rank_zero | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/setup.py:105 | `Trainer(limit_val_batches=1)` was configured so 1 batch will be used. +2026-01-08 19:24:52 | WARNING | py.warnings | /home/masao/.local/share/uv/python/cpython-3.11.13-linux-x86_64-gnu/lib/python3.11/warnings.py:110 | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/callbacks/model_checkpoint.py:751: Checkpoint directory /mnt/c/Users/might/Documents/git/espnets/espnet3/egs3/mini_an4/asr/exp/train_asr_rnn_data_aug_debug exists and is not empty. + +2026-01-08 19:24:52 | INFO | lightning.pytorch.accelerators.cuda | /mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/accelerators/cuda.py:61 | LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0] +2026-01-08 19:24:52 | ERROR | espnet3 | /mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py:70 | Stage 'train' failed after 3.81s +Traceback (most recent call last): + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/utils/stages.py", line 61, in run_stages + fn() + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/asr/system.py", line 93, in train + return super().train() + ^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/system.py", line 99, in train + return train(self.train_config) + ^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/systems/base/train.py", line 101, in train + trainer.fit(**fit_kwargs) + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/training/trainer.py", line 175, in fit + self.trainer.fit( + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/trainer.py", line 560, in fit + call._call_and_handle_interrupt( + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/call.py", line 49, in _call_and_handle_interrupt + return trainer_fn(*args, **kwargs) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/trainer.py", line 598, in _fit_impl + self._run(model, ckpt_path=ckpt_path) + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/trainer.py", line 987, in _run + self.strategy.setup(self) + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/strategies/strategy.py", line 159, in setup + self.setup_optimizers(trainer) + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/strategies/strategy.py", line 139, in setup_optimizers + self.optimizers, self.lr_scheduler_configs = _init_optimizers_and_lr_schedulers(self.lightning_module) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/core/optimizer.py", line 180, in _init_optimizers_and_lr_schedulers + optim_conf = call._call_lightning_module_hook(model.trainer, "configure_optimizers", pl_module=model) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/tools/.venv/lib/python3.11/site-packages/lightning/pytorch/trainer/call.py", line 177, in _call_lightning_module_hook + output = fn(*args, **kwargs) + ^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/modeling/model.py", line 367, in configure_optimizers + lr_scheduler = _build_lr_scheduler_config(scheduler) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/modeling/model.py", line 358, in _build_lr_scheduler_config + monitor = _get_val_scheduler_monitor() + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/c/Users/might/Documents/git/espnets/espnet3/espnet3/components/modeling/model.py", line 250, in _get_val_scheduler_monitor + raise ValueError("val_scheduler_criterion must be a string like 'valid/loss'") +ValueError: val_scheduler_criterion must be a string like 'valid/loss'