add dinoSR and SpidR

Files changed (16) hide show

DinoSR_original/config.yaml +74 -0
DinoSR_original/round_0/E1_best.pt +3 -0
DinoSR_original/round_0/E1_last.pt +3 -0
DinoSR_original/round_0/tensorboard/events.out.tfevents.1774341402.node20.1724484.0 +3 -0
DinoSR_reproduced/config.yaml +74 -0
DinoSR_reproduced/round_0/E1_best.pt +3 -0
DinoSR_reproduced/round_0/E1_last.pt +3 -0
DinoSR_reproduced/round_0/tensorboard/events.out.tfevents.1774341408.node21.246280.0 +3 -0
SpidR/256/config.yaml +74 -0
SpidR/256/round_0/E1_best.pt +3 -0
SpidR/256/round_0/E1_last.pt +3 -0
SpidR/256/round_0/tensorboard/events.out.tfevents.1774296494.node16.189390.0 +3 -0
SpidR/256_no_extra_augs/config.yaml +74 -0
SpidR/256_no_extra_augs/round_0/E1_best.pt +3 -0
SpidR/256_no_extra_augs/round_0/E1_last.pt +3 -0
SpidR/256_no_extra_augs/round_0/tensorboard/events.out.tfevents.1774345454.node47.1425577.0 +3 -0

DinoSR_original/config.yaml ADDED Viewed

	@@ -0,0 +1,74 @@

+training:
+  run_name: dinosr_base_original
+  epochs: 150
+  learning_rate: 0.0001
+  log_interval: 100
+  checkpoint_dir: null
+  resume_from: /home/infres/abrik-22/snlp_project/outputs/dinosr_base_original/2026-03-23/09-35-33/round_0/E1_last.pt
+  n_iterative_pseudolabeling: 3
+  lr_scheduler:
+    _target_: torch.optim.lr_scheduler.CosineAnnealingLR
+    T_max: ${training.epochs}
+    eta_min: 1.0e-06
+  lr_scheduler_start_epoch: 150
+dataset:
+  root: data/LibriSpeech
+  train_split: train-clean-100
+  test_split: test-clean
+  batch_size: 32
+  num_workers: 1
+  noise_dir: noise_fullband
+  max_audio_length: 160000
+  augmentations:
+    max_augs: 4
+    time_stretch: true
+    pitch_shift: true
+    reverberation: true
+    noise: true
+    rir_dir: data/rirs
+    activate_extra_augs: true
+    echo:
+      enabled: true
+      volume_range:
+      - 0.1
+      - 0.5
+      duration_range:
+      - 0.1
+      - 0.5
+    random_noise:
+      enabled: true
+      noise_std: 0.001
+    pink_noise:
+      enabled: true
+      noise_std: 0.01
+    lowpass_filter:
+      enabled: true
+      cutoff_freq: 5000
+    highpass_filter:
+      enabled: true
+      cutoff_freq: 500
+    bandpass_filter:
+      enabled: true
+      cutoff_freq_low: 300
+      cutoff_freq_high: 8000
+    smooth:
+      enabled: true
+      window_size_range:
+      - 2
+      - 10
+    boost_audio:
+      enabled: true
+      amount: 20
+    duck_audio:
+      enabled: true
+      amount: 20
+    updownresample:
+      enabled: true
+      intermediate_freq: 32000
+model:
+  name: dinosr_base_original
+  layer: 5
+  vocab_size: 256
+  kind_kmeans: kmeans
+  quantizer:
+    hidden_dim: 256

DinoSR_original/round_0/E1_best.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ebba1a60f7464cc06a2b38222f07471b2856ee58aafbdbbbf2906ec92b690c9
+size 3961480

DinoSR_original/round_0/E1_last.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:df12f6bd780bdae783bdf453a3e64db055aa36f833332e5ec995c4549d49a501
+size 3961480

DinoSR_original/round_0/tensorboard/events.out.tfevents.1774341402.node20.1724484.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:42b81295047bef9b42ae3f165cdf91c3cedc09223d3c8259e2c8ff55d9a54bfd
+size 8152

DinoSR_reproduced/config.yaml ADDED Viewed

	@@ -0,0 +1,74 @@

+training:
+  run_name: dinosr_base_reproduced
+  epochs: 150
+  learning_rate: 0.0001
+  log_interval: 100
+  checkpoint_dir: null
+  resume_from: /home/infres/abrik-22/snlp_project/outputs/dinosr_base_reproduced/2026-03-23/09-34-30/round_0/E1_last.pt
+  n_iterative_pseudolabeling: 3
+  lr_scheduler:
+    _target_: torch.optim.lr_scheduler.CosineAnnealingLR
+    T_max: ${training.epochs}
+    eta_min: 1.0e-06
+  lr_scheduler_start_epoch: 150
+dataset:
+  root: data/LibriSpeech
+  train_split: train-clean-100
+  test_split: test-clean
+  batch_size: 32
+  num_workers: 1
+  noise_dir: noise_fullband
+  max_audio_length: 160000
+  augmentations:
+    max_augs: 4
+    time_stretch: true
+    pitch_shift: true
+    reverberation: true
+    noise: true
+    rir_dir: data/rirs
+    activate_extra_augs: true
+    echo:
+      enabled: true
+      volume_range:
+      - 0.1
+      - 0.5
+      duration_range:
+      - 0.1
+      - 0.5
+    random_noise:
+      enabled: true
+      noise_std: 0.001
+    pink_noise:
+      enabled: true
+      noise_std: 0.01
+    lowpass_filter:
+      enabled: true
+      cutoff_freq: 5000
+    highpass_filter:
+      enabled: true
+      cutoff_freq: 500
+    bandpass_filter:
+      enabled: true
+      cutoff_freq_low: 300
+      cutoff_freq_high: 8000
+    smooth:
+      enabled: true
+      window_size_range:
+      - 2
+      - 10
+    boost_audio:
+      enabled: true
+      amount: 20
+    duck_audio:
+      enabled: true
+      amount: 20
+    updownresample:
+      enabled: true
+      intermediate_freq: 32000
+model:
+  name: dinosr_base_reproduced
+  layer: 5
+  vocab_size: 256
+  kind_kmeans: kmeans
+  quantizer:
+    hidden_dim: 256

DinoSR_reproduced/round_0/E1_best.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2150f0bdc702335f6793473834b6603b57af0ef4c212a2dcbf3c992304915334
+size 3961544

DinoSR_reproduced/round_0/E1_last.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2314b20a8f777ad78c5ecd3043e1da9252c286b3d63039f100a3ce4d3d7aa95a
+size 3961544

DinoSR_reproduced/round_0/tensorboard/events.out.tfevents.1774341408.node21.246280.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eb9d9ed16084d176fd4fcecafb3608b5f4970f19faacefff99067021db6528bc
+size 7712

SpidR/256/config.yaml ADDED Viewed

	@@ -0,0 +1,74 @@

+training:
+  run_name: spidr
+  epochs: 150
+  learning_rate: 0.0001
+  log_interval: 100
+  checkpoint_dir: null
+  resume_from: /home/infres/abrik-22/snlp_project/outputs/256/2026-03-22/18-41-33/round_0/E1_last.pt
+  n_iterative_pseudolabeling: 3
+  lr_scheduler:
+    _target_: torch.optim.lr_scheduler.CosineAnnealingLR
+    T_max: ${training.epochs}
+    eta_min: 1.0e-06
+  lr_scheduler_start_epoch: 150
+dataset:
+  root: data/LibriSpeech
+  train_split: train-clean-100
+  test_split: test-clean
+  batch_size: 32
+  num_workers: 1
+  noise_dir: noise_fullband
+  max_audio_length: 160000
+  augmentations:
+    max_augs: 4
+    time_stretch: true
+    pitch_shift: true
+    reverberation: true
+    noise: true
+    rir_dir: data/rirs
+    activate_extra_augs: true
+    echo:
+      enabled: true
+      volume_range:
+      - 0.1
+      - 0.5
+      duration_range:
+      - 0.1
+      - 0.5
+    random_noise:
+      enabled: true
+      noise_std: 0.001
+    pink_noise:
+      enabled: true
+      noise_std: 0.01
+    lowpass_filter:
+      enabled: true
+      cutoff_freq: 5000
+    highpass_filter:
+      enabled: true
+      cutoff_freq: 500
+    bandpass_filter:
+      enabled: true
+      cutoff_freq_low: 300
+      cutoff_freq_high: 8000
+    smooth:
+      enabled: true
+      window_size_range:
+      - 2
+      - 10
+    boost_audio:
+      enabled: true
+      amount: 20
+    duck_audio:
+      enabled: true
+      amount: 20
+    updownresample:
+      enabled: true
+      intermediate_freq: 32000
+model:
+  name: spidr_base
+  layer: 6
+  vocab_size: 256
+  kind_kmeans: kmeans
+  quantizer:
+    hidden_dim: 256

SpidR/256/round_0/E1_best.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:060e9fad2b4a5f9262485c582518b28145c51161e5bf54798492aac004813649
+size 3961544

SpidR/256/round_0/E1_last.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:884c648614fd0ba0826a5d7a84c8a20c10ca3a5428a80ffdd5a8072ce7875cfd
+size 3961544

SpidR/256/round_0/tensorboard/events.out.tfevents.1774296494.node16.189390.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:67b5d59c76d66df40fad02b56b65224fef5b3975147de09c5568b59768cc6595
+size 15116

SpidR/256_no_extra_augs/config.yaml ADDED Viewed

	@@ -0,0 +1,74 @@

+training:
+  run_name: spidr_base
+  epochs: 150
+  learning_rate: 0.0001
+  log_interval: 100
+  checkpoint_dir: null
+  resume_from: /home/infres/abrik-22/snlp_project/outputs/spidr_base/2026-03-23/22-15-04/round_0/E1_last.pt
+  n_iterative_pseudolabeling: 3
+  lr_scheduler:
+    _target_: torch.optim.lr_scheduler.CosineAnnealingLR
+    T_max: ${training.epochs}
+    eta_min: 1.0e-06
+  lr_scheduler_start_epoch: 150
+dataset:
+  root: data/LibriSpeech
+  train_split: train-clean-100
+  test_split: test-clean
+  batch_size: 32
+  num_workers: 1
+  noise_dir: noise_fullband
+  max_audio_length: 160000
+  augmentations:
+    max_augs: 1
+    time_stretch: true
+    pitch_shift: true
+    reverberation: true
+    noise: true
+    rir_dir: data/rirs
+    activate_extra_augs: false
+    echo:
+      enabled: true
+      volume_range:
+      - 0.1
+      - 0.5
+      duration_range:
+      - 0.1
+      - 0.5
+    random_noise:
+      enabled: true
+      noise_std: 0.001
+    pink_noise:
+      enabled: true
+      noise_std: 0.01
+    lowpass_filter:
+      enabled: true
+      cutoff_freq: 5000
+    highpass_filter:
+      enabled: true
+      cutoff_freq: 500
+    bandpass_filter:
+      enabled: true
+      cutoff_freq_low: 300
+      cutoff_freq_high: 8000
+    smooth:
+      enabled: true
+      window_size_range:
+      - 2
+      - 10
+    boost_audio:
+      enabled: true
+      amount: 20
+    duck_audio:
+      enabled: true
+      amount: 20
+    updownresample:
+      enabled: true
+      intermediate_freq: 32000
+model:
+  name: spidr_base
+  layer: 6
+  vocab_size: 256
+  kind_kmeans: kmeans
+  quantizer:
+    hidden_dim: 256

SpidR/256_no_extra_augs/round_0/E1_best.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a2a2d11d84fd6eeaf38325341a90b02e18c30506fc527655c1667f2f50cc058
+size 3961608

SpidR/256_no_extra_augs/round_0/E1_last.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cae54872e8b5f7a7efa3d120fdc456b6ce375e4f024bd226cde2e4e51db0007e
+size 3961608

SpidR/256_no_extra_augs/round_0/tensorboard/events.out.tfevents.1774345454.node47.1425577.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9b24e73db74ad8005cca1f249be0c046d577920fe06b0db057cd2617e7c95c04
+size 9060