tky823 committed on
Commit
3f89dd5
·
verified ·
1 Parent(s): 264eca2

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/README.md +5 -0
  2. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/log/20250429-091735/.hydra/config.yaml +221 -0
  3. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/log/20250429-091735/.hydra/hydra.yaml +189 -0
  4. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/log/20250429-091735/.hydra/overrides.yaml +16 -0
  5. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/log/20250429-091735/.hydra/resolved_config.yaml +280 -0
  6. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/log/20250429-091735/train.log +0 -0
  7. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/model/best_epoch.pth +3 -0
  8. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/model/last.pth +3 -0
  9. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/log/20250429-174603/.hydra/config.yaml +223 -0
  10. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/log/20250429-174603/.hydra/hydra.yaml +189 -0
  11. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/log/20250429-174603/.hydra/overrides.yaml +16 -0
  12. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/log/20250429-174603/.hydra/resolved_config.yaml +282 -0
  13. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/log/20250429-174603/train.log +0 -0
  14. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/model/best_epoch.pth +3 -0
  15. recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/model/last.pth +3 -0
  16. recipes/BirdCLEF2025/ConvNeXtTiny/tensorboard/20250429-091731/events.out.tfevents.1746371437.MacBook-Pro-2.local.7605.0 +3 -0
  17. recipes/BirdCLEF2025/ConvNeXtTiny/tensorboard/20250429-174600/events.out.tfevents.1746371438.MacBook-Pro-2.local.7605.1 +3 -0
  18. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/README.md +7 -0
  19. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/log/20250427-104218/.hydra/config.yaml +219 -0
  20. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/log/20250427-104218/.hydra/hydra.yaml +189 -0
  21. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/log/20250427-104218/.hydra/overrides.yaml +16 -0
  22. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/log/20250427-104218/.hydra/resolved_config.yaml +278 -0
  23. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/log/20250427-104218/train.log +0 -0
  24. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/model/best_epoch.pth +3 -0
  25. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/model/last.pth +3 -0
  26. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/README.md +7 -0
  27. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/log/20250427-115147/.hydra/config.yaml +219 -0
  28. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/log/20250427-115147/.hydra/hydra.yaml +189 -0
  29. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/log/20250427-115147/.hydra/overrides.yaml +16 -0
  30. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/log/20250427-115147/.hydra/resolved_config.yaml +278 -0
  31. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/log/20250427-115147/train.log +0 -0
  32. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/model/best_epoch.pth +3 -0
  33. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/model/last.pth +3 -0
  34. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/README.md +7 -0
  35. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/log/20250427-133047/.hydra/config.yaml +221 -0
  36. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/log/20250427-133047/.hydra/hydra.yaml +189 -0
  37. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/log/20250427-133047/.hydra/overrides.yaml +16 -0
  38. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/log/20250427-133047/.hydra/resolved_config.yaml +280 -0
  39. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/log/20250427-133047/train.log +0 -0
  40. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/model/best_epoch.pth +3 -0
  41. recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/model/last.pth +3 -0
  42. recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/README.md +7 -0
  43. recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/log/20250428-032425/.hydra/config.yaml +221 -0
  44. recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/log/20250428-032425/.hydra/hydra.yaml +189 -0
  45. recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/log/20250428-032425/.hydra/overrides.yaml +16 -0
  46. recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/log/20250428-032425/.hydra/resolved_config.yaml +280 -0
  47. recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/log/20250428-032425/train.log +0 -0
  48. recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/model/best_epoch.pth +3 -0
  49. recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/model/last.pth +3 -0
  50. recipes/BirdCLEF2025/EfficientNetB0/exp/20250429-075315/README.md +7 -0
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/README.md ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ system=default_seed-0
2
+ data=birdclef2025_15s
3
+ train=birdclef2025_convnext_tiny
4
+ model=birdclef2025_convnext_tiny
5
+ criterion=birdclef2025_categorical_cross_entropy
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/log/20250429-091735/.hydra/config.yaml ADDED
@@ -0,0 +1,221 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: null
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: null
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 15
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: ${..audio.sample_rate}
47
+ hop_length: 1253
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_15s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_15s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: ${..train.audio_key}
86
+ sample_rate_key: ${..train.sample_rate_key}
87
+ label_name_key: ${..train.label_name_key}
88
+ filename_key: ${..train.filename_key}
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelComposer
98
+ melspectrogram_transform: ${data.melspectrogram}
99
+ audio_key: audio
100
+ sample_rate_key: sample_rate
101
+ label_name_key: primary_label
102
+ filename_key: filename
103
+ waveform_key: waveform
104
+ melspectrogram_key: log_melspectrogram
105
+ label_index_key: label_index
106
+ sample_rate: ${data.audio.sample_rate}
107
+ duration: ${data.audio.duration}
108
+ decode_audio_as_waveform: true
109
+ decode_audio_as_monoral: true
110
+ training: true
111
+ melspectrogram_key: ${.composer.melspectrogram_key}
112
+ label_index_key: ${.composer.label_index_key}
113
+ alpha: 0.4
114
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
115
+ validation:
116
+ _target_: torch.utils.data.DataLoader
117
+ batch_size: 64
118
+ shuffle: false
119
+ collate_fn:
120
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
121
+ composer:
122
+ _target_: ${....train.collate_fn.composer._target_}
123
+ melspectrogram_transform: ${....train.collate_fn.composer.melspectrogram_transform}
124
+ audio_key: ${....train.collate_fn.composer.audio_key}
125
+ sample_rate_key: ${....train.collate_fn.composer.sample_rate_key}
126
+ label_name_key: ${....train.collate_fn.composer.label_name_key}
127
+ filename_key: ${....train.collate_fn.composer.filename_key}
128
+ waveform_key: ${....train.collate_fn.composer.waveform_key}
129
+ melspectrogram_key: ${....train.collate_fn.composer.melspectrogram_key}
130
+ label_index_key: ${....train.collate_fn.composer.label_index_key}
131
+ sample_rate: ${....train.collate_fn.composer.sample_rate}
132
+ duration: ${....train.collate_fn.composer.duration}
133
+ decode_audio_as_waveform: ${....train.collate_fn.composer.decode_audio_as_waveform}
134
+ decode_audio_as_monoral: ${....train.collate_fn.composer.decode_audio_as_monoral}
135
+ training: false
136
+ melspectrogram_key: ${...train.collate_fn.composer.melspectrogram_key}
137
+ label_index_key: ${...train.collate_fn.composer.label_index_key}
138
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
139
+ clip_gradient: {}
140
+ record: {}
141
+ trainer:
142
+ _target_: birdclef2025.utils.driver.BaseTrainer
143
+ key_mapping:
144
+ train:
145
+ input:
146
+ input: ${....dataloader.train.collate_fn.composer.melspectrogram_key}
147
+ output: logit
148
+ validation: ${.train}
149
+ inference: ${.validation}
150
+ ddp_kwargs: null
151
+ resume:
152
+ continue_from: ''
153
+ output:
154
+ exp_dir: ./exp/20250429-091731
155
+ tensorboard_dir: ./tensorboard/20250429-091731
156
+ save_checkpoint:
157
+ iteration:
158
+ every: 1000
159
+ path: ${...exp_dir}/model/iteration{iteration}.pth
160
+ epoch:
161
+ every: 1
162
+ path: ${...exp_dir}/model/epoch{epoch}.pth
163
+ last:
164
+ path: ${...exp_dir}/model/last.pth
165
+ best_epoch:
166
+ path: ${...exp_dir}/model/best_epoch.pth
167
+ steps:
168
+ epochs: 10
169
+ iterations: null
170
+ lr_scheduler: epoch
171
+ test:
172
+ dataset:
173
+ test:
174
+ _target_: torch.utils.data.Dataset
175
+ dataloader:
176
+ test:
177
+ _target_: torch.utils.data.DataLoader
178
+ batch_size: 1
179
+ shuffle: false
180
+ key_mapping:
181
+ inference:
182
+ input: null
183
+ output: null
184
+ identifier: null
185
+ checkpoint: null
186
+ remove_weight_norm: null
187
+ output:
188
+ exp_dir: ./exp
189
+ inference_dir: ${.exp_dir}/inference
190
+ audio:
191
+ sample_rate: ${data.audio.sample_rate}
192
+ key_mapping:
193
+ inference:
194
+ output: null
195
+ reference: null
196
+ transforms:
197
+ inference:
198
+ output: null
199
+ reference: null
200
+ model:
201
+ _target_: birdclef2025.models.ConvNeXtTiny
202
+ weights: ${const:torchvision.models.ConvNeXt_Tiny_Weights.IMAGENET1K_V1}
203
+ num_classes: ${const:birdclef2025.utils.data.birdclef.num_birdclef2025_primary_labels}
204
+ optimizer:
205
+ _target_: torch.optim.AdamW
206
+ lr: 0.0001
207
+ weight_decay: 0.05
208
+ lr_scheduler: {}
209
+ criterion:
210
+ _target_: audyn.criterion.MultiCriteria
211
+ cross_entropy:
212
+ _target_: audyn.criterion.BaseCriterionWrapper
213
+ criterion:
214
+ _target_: torch.nn.CrossEntropyLoss
215
+ reduction: mean
216
+ weight: 1
217
+ key_mapping:
218
+ estimated:
219
+ input: logit
220
+ target:
221
+ target: ${train.dataloader.train.collate_fn.composer.label_index_key}
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/log/20250429-091735/.hydra/hydra.yaml ADDED
@@ -0,0 +1,189 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ hydra:
2
+ run:
3
+ dir: ./exp/20250429-091731/log/20250429-091735
4
+ sweep:
5
+ dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
6
+ subdir: ${hydra.job.num}
7
+ launcher:
8
+ _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
9
+ sweeper:
10
+ _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
11
+ max_batch_size: null
12
+ params: null
13
+ help:
14
+ app_name: ${hydra.job.name}
15
+ header: '${hydra.help.app_name} is powered by Hydra.
16
+
17
+ '
18
+ footer: 'Powered by Hydra (https://hydra.cc)
19
+
20
+ Use --hydra-help to view Hydra specific help
21
+
22
+ '
23
+ template: '${hydra.help.header}
24
+
25
+ == Configuration groups ==
26
+
27
+ Compose your configuration from those groups (group=option)
28
+
29
+
30
+ $APP_CONFIG_GROUPS
31
+
32
+
33
+ == Config ==
34
+
35
+ Override anything in the config (foo.bar=value)
36
+
37
+
38
+ $CONFIG
39
+
40
+
41
+ ${hydra.help.footer}
42
+
43
+ '
44
+ hydra_help:
45
+ template: 'Hydra (${hydra.runtime.version})
46
+
47
+ See https://hydra.cc for more info.
48
+
49
+
50
+ == Flags ==
51
+
52
+ $FLAGS_HELP
53
+
54
+
55
+ == Configuration groups ==
56
+
57
+ Compose your configuration from those groups (For example, append hydra/job_logging=disabled
58
+ to command line)
59
+
60
+
61
+ $HYDRA_CONFIG_GROUPS
62
+
63
+
64
+ Use ''--cfg hydra'' to Show the Hydra config.
65
+
66
+ '
67
+ hydra_help: ???
68
+ hydra_logging:
69
+ version: 1
70
+ formatters:
71
+ simple:
72
+ format: '[%(asctime)s][HYDRA] %(message)s'
73
+ handlers:
74
+ console:
75
+ class: logging.StreamHandler
76
+ formatter: simple
77
+ stream: ext://sys.stdout
78
+ root:
79
+ level: INFO
80
+ handlers:
81
+ - console
82
+ loggers:
83
+ logging_example:
84
+ level: DEBUG
85
+ disable_existing_loggers: false
86
+ job_logging:
87
+ version: 1
88
+ formatters:
89
+ simple:
90
+ format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
91
+ handlers:
92
+ console:
93
+ class: logging.StreamHandler
94
+ formatter: simple
95
+ stream: ext://sys.stdout
96
+ file:
97
+ class: logging.FileHandler
98
+ formatter: simple
99
+ filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
100
+ root:
101
+ level: INFO
102
+ handlers:
103
+ - console
104
+ - file
105
+ disable_existing_loggers: false
106
+ env: {}
107
+ mode: RUN
108
+ searchpath: []
109
+ callbacks: {}
110
+ output_subdir: .hydra
111
+ overrides:
112
+ hydra:
113
+ - hydra.run.dir=./exp/20250429-091731/log/20250429-091735
114
+ - hydra.mode=RUN
115
+ task:
116
+ - system=cuda
117
+ - preprocess=birdclef2025
118
+ - data=birdclef2025_15s
119
+ - train=birdclef2025_convnext_tiny
120
+ - model=birdclef2025_convnext_tiny
121
+ - optimizer=adamw_1e-4_decay_5e-2
122
+ - lr_scheduler=none
123
+ - criterion=birdclef2025_categorical_cross_entropy
124
+ - preprocess.dump_format=birdclef2025
125
+ - train.dataset.train.list_path=dump/birdclef2025_15s/list/train.txt
126
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
127
+ - train.dataset.validation.list_path=dump/birdclef2025_15s/list/validation.txt
128
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
129
+ - train.resume.continue_from=
130
+ - train.output.exp_dir=./exp/20250429-091731
131
+ - train.output.tensorboard_dir=./tensorboard/20250429-091731
132
+ job:
133
+ name: train
134
+ chdir: false
135
+ override_dirname: criterion=birdclef2025_categorical_cross_entropy,data=birdclef2025_15s,lr_scheduler=none,model=birdclef2025_convnext_tiny,optimizer=adamw_1e-4_decay_5e-2,preprocess.dump_format=birdclef2025,preprocess=birdclef2025,system=cuda,train.dataset.train.feature_dir=/kaggle/input/birdclef-2025,train.dataset.train.list_path=dump/birdclef2025_15s/list/train.txt,train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025,train.dataset.validation.list_path=dump/birdclef2025_15s/list/validation.txt,train.output.exp_dir=./exp/20250429-091731,train.output.tensorboard_dir=./tensorboard/20250429-091731,train.resume.continue_from=,train=birdclef2025_convnext_tiny
136
+ id: ???
137
+ num: ???
138
+ config_name: config
139
+ env_set: {}
140
+ env_copy: []
141
+ config:
142
+ override_dirname:
143
+ kv_sep: '='
144
+ item_sep: ','
145
+ exclude_keys: []
146
+ runtime:
147
+ version: 1.3.2
148
+ version_base: '1.2'
149
+ cwd: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/ConvNeXtTiny
150
+ config_sources:
151
+ - path: hydra.conf
152
+ schema: pkg
153
+ provider: hydra
154
+ - path: /usr/local/lib/python3.10/dist-packages/audyn/configs
155
+ schema: file
156
+ provider: main
157
+ - path: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/ConvNeXtTiny/conf
158
+ schema: file
159
+ provider: command-line
160
+ - path: ''
161
+ schema: structured
162
+ provider: schema
163
+ output_dir: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/log/20250429-091735
164
+ choices:
165
+ criterion: birdclef2025_categorical_cross_entropy
166
+ lr_scheduler: none
167
+ optimizer: adamw_1e-4_decay_5e-2
168
+ model: birdclef2025_convnext_tiny
169
+ test: default
170
+ test/dataloader: default
171
+ test/dataset: default
172
+ train: birdclef2025_convnext_tiny
173
+ train/record: default
174
+ train/clip_gradient: default
175
+ train/dataloader: default
176
+ train/dataset: birdclef2025_primary-label
177
+ data: birdclef2025_15s
178
+ preprocess: birdclef2025
179
+ system: cuda
180
+ hydra/env: default
181
+ hydra/callbacks: null
182
+ hydra/job_logging: default
183
+ hydra/hydra_logging: default
184
+ hydra/hydra_help: default
185
+ hydra/help: default
186
+ hydra/sweeper: basic
187
+ hydra/launcher: basic
188
+ hydra/output: default
189
+ verbose: false
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/log/20250429-091735/.hydra/overrides.yaml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - system=cuda
2
+ - preprocess=birdclef2025
3
+ - data=birdclef2025_15s
4
+ - train=birdclef2025_convnext_tiny
5
+ - model=birdclef2025_convnext_tiny
6
+ - optimizer=adamw_1e-4_decay_5e-2
7
+ - lr_scheduler=none
8
+ - criterion=birdclef2025_categorical_cross_entropy
9
+ - preprocess.dump_format=birdclef2025
10
+ - train.dataset.train.list_path=dump/birdclef2025_15s/list/train.txt
11
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
12
+ - train.dataset.validation.list_path=dump/birdclef2025_15s/list/validation.txt
13
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
14
+ - train.resume.continue_from=
15
+ - train.output.exp_dir=./exp/20250429-091731
16
+ - train.output.tensorboard_dir=./tensorboard/20250429-091731
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/log/20250429-091735/.hydra/resolved_config.yaml ADDED
@@ -0,0 +1,280 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: false
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: 2
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 15
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: 32000
47
+ hop_length: 1253
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_15s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_15s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: audio
86
+ sample_rate_key: sample_rate
87
+ label_name_key: primary_label
88
+ filename_key: filename
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelComposer
98
+ melspectrogram_transform:
99
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
100
+ sample_rate: 32000
101
+ hop_length: 1253
102
+ f_min: 20
103
+ f_max: 16000
104
+ pad: 0
105
+ n_mels: 128
106
+ window_fn:
107
+ _target_: torch.hann_window
108
+ _partial_: true
109
+ power: 1.0
110
+ normalized: false
111
+ wkwargs: null
112
+ center: true
113
+ pad_mode: constant
114
+ onesided: null
115
+ norm: slaney
116
+ mel_scale: slaney
117
+ take_log: true
118
+ freq_mask_param:
119
+ - 0.06
120
+ - 0.1
121
+ time_mask_param:
122
+ - 0.06
123
+ - 0.12
124
+ eps: null
125
+ audio_key: audio
126
+ sample_rate_key: sample_rate
127
+ label_name_key: primary_label
128
+ filename_key: filename
129
+ waveform_key: waveform
130
+ melspectrogram_key: log_melspectrogram
131
+ label_index_key: label_index
132
+ sample_rate: 32000
133
+ duration: 15
134
+ decode_audio_as_waveform: true
135
+ decode_audio_as_monoral: true
136
+ training: true
137
+ melspectrogram_key: log_melspectrogram
138
+ label_index_key: label_index
139
+ alpha: 0.4
140
+ num_workers: 2
141
+ validation:
142
+ _target_: torch.utils.data.DataLoader
143
+ batch_size: 64
144
+ shuffle: false
145
+ collate_fn:
146
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
147
+ composer:
148
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelComposer
149
+ melspectrogram_transform:
150
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
151
+ sample_rate: 32000
152
+ hop_length: 1253
153
+ f_min: 20
154
+ f_max: 16000
155
+ pad: 0
156
+ n_mels: 128
157
+ window_fn:
158
+ _target_: torch.hann_window
159
+ _partial_: true
160
+ power: 1.0
161
+ normalized: false
162
+ wkwargs: null
163
+ center: true
164
+ pad_mode: constant
165
+ onesided: null
166
+ norm: slaney
167
+ mel_scale: slaney
168
+ take_log: true
169
+ freq_mask_param:
170
+ - 0.06
171
+ - 0.1
172
+ time_mask_param:
173
+ - 0.06
174
+ - 0.12
175
+ eps: null
176
+ audio_key: audio
177
+ sample_rate_key: sample_rate
178
+ label_name_key: primary_label
179
+ filename_key: filename
180
+ waveform_key: waveform
181
+ melspectrogram_key: log_melspectrogram
182
+ label_index_key: label_index
183
+ sample_rate: 32000
184
+ duration: 15
185
+ decode_audio_as_waveform: true
186
+ decode_audio_as_monoral: true
187
+ training: false
188
+ melspectrogram_key: log_melspectrogram
189
+ label_index_key: label_index
190
+ num_workers: 2
191
+ clip_gradient: {}
192
+ record: {}
193
+ trainer:
194
+ _target_: birdclef2025.utils.driver.BaseTrainer
195
+ key_mapping:
196
+ train:
197
+ input:
198
+ input: log_melspectrogram
199
+ output: logit
200
+ validation:
201
+ input:
202
+ input: log_melspectrogram
203
+ output: logit
204
+ inference:
205
+ input:
206
+ input: log_melspectrogram
207
+ output: logit
208
+ ddp_kwargs: null
209
+ resume:
210
+ continue_from: ''
211
+ output:
212
+ exp_dir: ./exp/20250429-091731
213
+ tensorboard_dir: ./tensorboard/20250429-091731
214
+ save_checkpoint:
215
+ iteration:
216
+ every: 1000
217
+ path: ./exp/20250429-091731/model/iteration{iteration}.pth
218
+ epoch:
219
+ every: 1
220
+ path: ./exp/20250429-091731/model/epoch{epoch}.pth
221
+ last:
222
+ path: ./exp/20250429-091731/model/last.pth
223
+ best_epoch:
224
+ path: ./exp/20250429-091731/model/best_epoch.pth
225
+ steps:
226
+ epochs: 10
227
+ iterations: null
228
+ lr_scheduler: epoch
229
+ test:
230
+ dataset:
231
+ test:
232
+ _target_: torch.utils.data.Dataset
233
+ dataloader:
234
+ test:
235
+ _target_: torch.utils.data.DataLoader
236
+ batch_size: 1
237
+ shuffle: false
238
+ key_mapping:
239
+ inference:
240
+ input: null
241
+ output: null
242
+ identifier: null
243
+ checkpoint: null
244
+ remove_weight_norm: null
245
+ output:
246
+ exp_dir: ./exp
247
+ inference_dir: ./exp/inference
248
+ audio:
249
+ sample_rate: 32000
250
+ key_mapping:
251
+ inference:
252
+ output: null
253
+ reference: null
254
+ transforms:
255
+ inference:
256
+ output: null
257
+ reference: null
258
+ ddp_kwargs: null
259
+ model:
260
+ _target_: birdclef2025.models.ConvNeXtTiny
261
+ weights: IMAGENET1K_V1
262
+ num_classes: 206
263
+ optimizer:
264
+ _target_: torch.optim.AdamW
265
+ lr: 0.0001
266
+ weight_decay: 0.05
267
+ lr_scheduler: {}
268
+ criterion:
269
+ _target_: audyn.criterion.MultiCriteria
270
+ cross_entropy:
271
+ _target_: audyn.criterion.BaseCriterionWrapper
272
+ criterion:
273
+ _target_: torch.nn.CrossEntropyLoss
274
+ reduction: mean
275
+ weight: 1
276
+ key_mapping:
277
+ estimated:
278
+ input: logit
279
+ target:
280
+ target: label_index
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/log/20250429-091735/train.log ADDED
The diff for this file is too large to render. See raw diff
 
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/model/best_epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c8c76a73f858b31c3e5e91cedb5bec0403da0ca62ebdd29cf069f83c4e130ff
3
+ size 335992470
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-091731/model/last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eaca39c63d46df4018baadf070d222fdf55f1e611da5930fc7c02009442a642
3
+ size 335953326
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/log/20250429-174603/.hydra/config.yaml ADDED
@@ -0,0 +1,223 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: null
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: null
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 15
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: ${..audio.sample_rate}
47
+ hop_length: 512
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_reshape_15s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_reshape_15s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: ${..train.audio_key}
86
+ sample_rate_key: ${..train.sample_rate_key}
87
+ label_name_key: ${..train.label_name_key}
88
+ filename_key: ${..train.filename_key}
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025ReshapePrimaryLabelComposer
98
+ melspectrogram_transform: ${data.melspectrogram}
99
+ audio_key: audio
100
+ sample_rate_key: sample_rate
101
+ label_name_key: primary_label
102
+ filename_key: filename
103
+ waveform_key: waveform
104
+ melspectrogram_key: log_melspectrogram
105
+ label_index_key: label_index
106
+ sample_rate: ${data.audio.sample_rate}
107
+ duration: ${data.audio.duration}
108
+ decode_audio_as_waveform: true
109
+ decode_audio_as_monoral: true
110
+ training: true
111
+ target_shape: 256
112
+ melspectrogram_key: ${.composer.melspectrogram_key}
113
+ label_index_key: ${.composer.label_index_key}
114
+ alpha: 0.4
115
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
116
+ validation:
117
+ _target_: torch.utils.data.DataLoader
118
+ batch_size: 64
119
+ shuffle: false
120
+ collate_fn:
121
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
122
+ composer:
123
+ _target_: ${....train.collate_fn.composer._target_}
124
+ melspectrogram_transform: ${....train.collate_fn.composer.melspectrogram_transform}
125
+ audio_key: ${....train.collate_fn.composer.audio_key}
126
+ sample_rate_key: ${....train.collate_fn.composer.sample_rate_key}
127
+ label_name_key: ${....train.collate_fn.composer.label_name_key}
128
+ filename_key: ${....train.collate_fn.composer.filename_key}
129
+ waveform_key: ${....train.collate_fn.composer.waveform_key}
130
+ melspectrogram_key: ${....train.collate_fn.composer.melspectrogram_key}
131
+ label_index_key: ${....train.collate_fn.composer.label_index_key}
132
+ sample_rate: ${....train.collate_fn.composer.sample_rate}
133
+ duration: ${....train.collate_fn.composer.duration}
134
+ decode_audio_as_waveform: ${....train.collate_fn.composer.decode_audio_as_waveform}
135
+ decode_audio_as_monoral: ${....train.collate_fn.composer.decode_audio_as_monoral}
136
+ training: false
137
+ target_shape: ${....train.collate_fn.composer.target_shape}
138
+ melspectrogram_key: ${...train.collate_fn.composer.melspectrogram_key}
139
+ label_index_key: ${...train.collate_fn.composer.label_index_key}
140
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
141
+ clip_gradient: {}
142
+ record: {}
143
+ trainer:
144
+ _target_: birdclef2025.utils.driver.BaseTrainer
145
+ key_mapping:
146
+ train:
147
+ input:
148
+ input: ${....dataloader.train.collate_fn.composer.melspectrogram_key}
149
+ output: logit
150
+ validation: ${.train}
151
+ inference: ${.validation}
152
+ ddp_kwargs: null
153
+ resume:
154
+ continue_from: ''
155
+ output:
156
+ exp_dir: ./exp/20250429-174600
157
+ tensorboard_dir: ./tensorboard/20250429-174600
158
+ save_checkpoint:
159
+ iteration:
160
+ every: 1000
161
+ path: ${...exp_dir}/model/iteration{iteration}.pth
162
+ epoch:
163
+ every: 1
164
+ path: ${...exp_dir}/model/epoch{epoch}.pth
165
+ last:
166
+ path: ${...exp_dir}/model/last.pth
167
+ best_epoch:
168
+ path: ${...exp_dir}/model/best_epoch.pth
169
+ steps:
170
+ epochs: 10
171
+ iterations: null
172
+ lr_scheduler: epoch
173
+ test:
174
+ dataset:
175
+ test:
176
+ _target_: torch.utils.data.Dataset
177
+ dataloader:
178
+ test:
179
+ _target_: torch.utils.data.DataLoader
180
+ batch_size: 1
181
+ shuffle: false
182
+ key_mapping:
183
+ inference:
184
+ input: null
185
+ output: null
186
+ identifier: null
187
+ checkpoint: null
188
+ remove_weight_norm: null
189
+ output:
190
+ exp_dir: ./exp
191
+ inference_dir: ${.exp_dir}/inference
192
+ audio:
193
+ sample_rate: ${data.audio.sample_rate}
194
+ key_mapping:
195
+ inference:
196
+ output: null
197
+ reference: null
198
+ transforms:
199
+ inference:
200
+ output: null
201
+ reference: null
202
+ model:
203
+ _target_: birdclef2025.models.ConvNeXtTiny
204
+ weights: ${const:torchvision.models.ConvNeXt_Tiny_Weights.IMAGENET1K_V1}
205
+ num_classes: ${const:birdclef2025.utils.data.birdclef.num_birdclef2025_primary_labels}
206
+ optimizer:
207
+ _target_: torch.optim.AdamW
208
+ lr: 0.0001
209
+ weight_decay: 0.05
210
+ lr_scheduler: {}
211
+ criterion:
212
+ _target_: audyn.criterion.MultiCriteria
213
+ cross_entropy:
214
+ _target_: audyn.criterion.BaseCriterionWrapper
215
+ criterion:
216
+ _target_: torch.nn.CrossEntropyLoss
217
+ reduction: mean
218
+ weight: 1
219
+ key_mapping:
220
+ estimated:
221
+ input: logit
222
+ target:
223
+ target: ${train.dataloader.train.collate_fn.composer.label_index_key}
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/log/20250429-174603/.hydra/hydra.yaml ADDED
@@ -0,0 +1,189 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ hydra:
2
+ run:
3
+ dir: ./exp/20250429-174600/log/20250429-174603
4
+ sweep:
5
+ dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
6
+ subdir: ${hydra.job.num}
7
+ launcher:
8
+ _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
9
+ sweeper:
10
+ _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
11
+ max_batch_size: null
12
+ params: null
13
+ help:
14
+ app_name: ${hydra.job.name}
15
+ header: '${hydra.help.app_name} is powered by Hydra.
16
+
17
+ '
18
+ footer: 'Powered by Hydra (https://hydra.cc)
19
+
20
+ Use --hydra-help to view Hydra specific help
21
+
22
+ '
23
+ template: '${hydra.help.header}
24
+
25
+ == Configuration groups ==
26
+
27
+ Compose your configuration from those groups (group=option)
28
+
29
+
30
+ $APP_CONFIG_GROUPS
31
+
32
+
33
+ == Config ==
34
+
35
+ Override anything in the config (foo.bar=value)
36
+
37
+
38
+ $CONFIG
39
+
40
+
41
+ ${hydra.help.footer}
42
+
43
+ '
44
+ hydra_help:
45
+ template: 'Hydra (${hydra.runtime.version})
46
+
47
+ See https://hydra.cc for more info.
48
+
49
+
50
+ == Flags ==
51
+
52
+ $FLAGS_HELP
53
+
54
+
55
+ == Configuration groups ==
56
+
57
+ Compose your configuration from those groups (For example, append hydra/job_logging=disabled
58
+ to command line)
59
+
60
+
61
+ $HYDRA_CONFIG_GROUPS
62
+
63
+
64
+ Use ''--cfg hydra'' to Show the Hydra config.
65
+
66
+ '
67
+ hydra_help: ???
68
+ hydra_logging:
69
+ version: 1
70
+ formatters:
71
+ simple:
72
+ format: '[%(asctime)s][HYDRA] %(message)s'
73
+ handlers:
74
+ console:
75
+ class: logging.StreamHandler
76
+ formatter: simple
77
+ stream: ext://sys.stdout
78
+ root:
79
+ level: INFO
80
+ handlers:
81
+ - console
82
+ loggers:
83
+ logging_example:
84
+ level: DEBUG
85
+ disable_existing_loggers: false
86
+ job_logging:
87
+ version: 1
88
+ formatters:
89
+ simple:
90
+ format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
91
+ handlers:
92
+ console:
93
+ class: logging.StreamHandler
94
+ formatter: simple
95
+ stream: ext://sys.stdout
96
+ file:
97
+ class: logging.FileHandler
98
+ formatter: simple
99
+ filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
100
+ root:
101
+ level: INFO
102
+ handlers:
103
+ - console
104
+ - file
105
+ disable_existing_loggers: false
106
+ env: {}
107
+ mode: RUN
108
+ searchpath: []
109
+ callbacks: {}
110
+ output_subdir: .hydra
111
+ overrides:
112
+ hydra:
113
+ - hydra.run.dir=./exp/20250429-174600/log/20250429-174603
114
+ - hydra.mode=RUN
115
+ task:
116
+ - system=cuda
117
+ - preprocess=birdclef2025
118
+ - data=birdclef2025_reshape_15s
119
+ - train=birdclef2025_reshape_convnext_tiny
120
+ - model=birdclef2025_convnext_tiny
121
+ - optimizer=adamw_1e-4_decay_5e-2
122
+ - lr_scheduler=none
123
+ - criterion=birdclef2025_categorical_cross_entropy
124
+ - preprocess.dump_format=birdclef2025
125
+ - train.dataset.train.list_path=dump/birdclef2025_reshape_15s/list/train.txt
126
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
127
+ - train.dataset.validation.list_path=dump/birdclef2025_reshape_15s/list/validation.txt
128
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
129
+ - train.resume.continue_from=
130
+ - train.output.exp_dir=./exp/20250429-174600
131
+ - train.output.tensorboard_dir=./tensorboard/20250429-174600
132
+ job:
133
+ name: train
134
+ chdir: false
135
+ override_dirname: criterion=birdclef2025_categorical_cross_entropy,data=birdclef2025_reshape_15s,lr_scheduler=none,model=birdclef2025_convnext_tiny,optimizer=adamw_1e-4_decay_5e-2,preprocess.dump_format=birdclef2025,preprocess=birdclef2025,system=cuda,train.dataset.train.feature_dir=/kaggle/input/birdclef-2025,train.dataset.train.list_path=dump/birdclef2025_reshape_15s/list/train.txt,train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025,train.dataset.validation.list_path=dump/birdclef2025_reshape_15s/list/validation.txt,train.output.exp_dir=./exp/20250429-174600,train.output.tensorboard_dir=./tensorboard/20250429-174600,train.resume.continue_from=,train=birdclef2025_reshape_convnext_tiny
136
+ id: ???
137
+ num: ???
138
+ config_name: config
139
+ env_set: {}
140
+ env_copy: []
141
+ config:
142
+ override_dirname:
143
+ kv_sep: '='
144
+ item_sep: ','
145
+ exclude_keys: []
146
+ runtime:
147
+ version: 1.3.2
148
+ version_base: '1.2'
149
+ cwd: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/ConvNeXtTiny
150
+ config_sources:
151
+ - path: hydra.conf
152
+ schema: pkg
153
+ provider: hydra
154
+ - path: /usr/local/lib/python3.10/dist-packages/audyn/configs
155
+ schema: file
156
+ provider: main
157
+ - path: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/ConvNeXtTiny/conf
158
+ schema: file
159
+ provider: command-line
160
+ - path: ''
161
+ schema: structured
162
+ provider: schema
163
+ output_dir: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/log/20250429-174603
164
+ choices:
165
+ criterion: birdclef2025_categorical_cross_entropy
166
+ lr_scheduler: none
167
+ optimizer: adamw_1e-4_decay_5e-2
168
+ model: birdclef2025_convnext_tiny
169
+ test: default
170
+ test/dataloader: default
171
+ test/dataset: default
172
+ train: birdclef2025_reshape_convnext_tiny
173
+ train/record: default
174
+ train/clip_gradient: default
175
+ train/dataloader: default
176
+ train/dataset: birdclef2025_primary-label
177
+ data: birdclef2025_reshape_15s
178
+ preprocess: birdclef2025
179
+ system: cuda
180
+ hydra/env: default
181
+ hydra/callbacks: null
182
+ hydra/job_logging: default
183
+ hydra/hydra_logging: default
184
+ hydra/hydra_help: default
185
+ hydra/help: default
186
+ hydra/sweeper: basic
187
+ hydra/launcher: basic
188
+ hydra/output: default
189
+ verbose: false
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/log/20250429-174603/.hydra/overrides.yaml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - system=cuda
2
+ - preprocess=birdclef2025
3
+ - data=birdclef2025_reshape_15s
4
+ - train=birdclef2025_reshape_convnext_tiny
5
+ - model=birdclef2025_convnext_tiny
6
+ - optimizer=adamw_1e-4_decay_5e-2
7
+ - lr_scheduler=none
8
+ - criterion=birdclef2025_categorical_cross_entropy
9
+ - preprocess.dump_format=birdclef2025
10
+ - train.dataset.train.list_path=dump/birdclef2025_reshape_15s/list/train.txt
11
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
12
+ - train.dataset.validation.list_path=dump/birdclef2025_reshape_15s/list/validation.txt
13
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
14
+ - train.resume.continue_from=
15
+ - train.output.exp_dir=./exp/20250429-174600
16
+ - train.output.tensorboard_dir=./tensorboard/20250429-174600
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/log/20250429-174603/.hydra/resolved_config.yaml ADDED
@@ -0,0 +1,282 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: false
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: 2
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 15
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: 32000
47
+ hop_length: 512
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_reshape_15s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_reshape_15s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: audio
86
+ sample_rate_key: sample_rate
87
+ label_name_key: primary_label
88
+ filename_key: filename
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025ReshapePrimaryLabelComposer
98
+ melspectrogram_transform:
99
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
100
+ sample_rate: 32000
101
+ hop_length: 512
102
+ f_min: 20
103
+ f_max: 16000
104
+ pad: 0
105
+ n_mels: 128
106
+ window_fn:
107
+ _target_: torch.hann_window
108
+ _partial_: true
109
+ power: 1.0
110
+ normalized: false
111
+ wkwargs: null
112
+ center: true
113
+ pad_mode: constant
114
+ onesided: null
115
+ norm: slaney
116
+ mel_scale: slaney
117
+ take_log: true
118
+ freq_mask_param:
119
+ - 0.06
120
+ - 0.1
121
+ time_mask_param:
122
+ - 0.06
123
+ - 0.12
124
+ eps: null
125
+ audio_key: audio
126
+ sample_rate_key: sample_rate
127
+ label_name_key: primary_label
128
+ filename_key: filename
129
+ waveform_key: waveform
130
+ melspectrogram_key: log_melspectrogram
131
+ label_index_key: label_index
132
+ sample_rate: 32000
133
+ duration: 15
134
+ decode_audio_as_waveform: true
135
+ decode_audio_as_monoral: true
136
+ training: true
137
+ target_shape: 256
138
+ melspectrogram_key: log_melspectrogram
139
+ label_index_key: label_index
140
+ alpha: 0.4
141
+ num_workers: 2
142
+ validation:
143
+ _target_: torch.utils.data.DataLoader
144
+ batch_size: 64
145
+ shuffle: false
146
+ collate_fn:
147
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
148
+ composer:
149
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025ReshapePrimaryLabelComposer
150
+ melspectrogram_transform:
151
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
152
+ sample_rate: 32000
153
+ hop_length: 512
154
+ f_min: 20
155
+ f_max: 16000
156
+ pad: 0
157
+ n_mels: 128
158
+ window_fn:
159
+ _target_: torch.hann_window
160
+ _partial_: true
161
+ power: 1.0
162
+ normalized: false
163
+ wkwargs: null
164
+ center: true
165
+ pad_mode: constant
166
+ onesided: null
167
+ norm: slaney
168
+ mel_scale: slaney
169
+ take_log: true
170
+ freq_mask_param:
171
+ - 0.06
172
+ - 0.1
173
+ time_mask_param:
174
+ - 0.06
175
+ - 0.12
176
+ eps: null
177
+ audio_key: audio
178
+ sample_rate_key: sample_rate
179
+ label_name_key: primary_label
180
+ filename_key: filename
181
+ waveform_key: waveform
182
+ melspectrogram_key: log_melspectrogram
183
+ label_index_key: label_index
184
+ sample_rate: 32000
185
+ duration: 15
186
+ decode_audio_as_waveform: true
187
+ decode_audio_as_monoral: true
188
+ training: false
189
+ target_shape: 256
190
+ melspectrogram_key: log_melspectrogram
191
+ label_index_key: label_index
192
+ num_workers: 2
193
+ clip_gradient: {}
194
+ record: {}
195
+ trainer:
196
+ _target_: birdclef2025.utils.driver.BaseTrainer
197
+ key_mapping:
198
+ train:
199
+ input:
200
+ input: log_melspectrogram
201
+ output: logit
202
+ validation:
203
+ input:
204
+ input: log_melspectrogram
205
+ output: logit
206
+ inference:
207
+ input:
208
+ input: log_melspectrogram
209
+ output: logit
210
+ ddp_kwargs: null
211
+ resume:
212
+ continue_from: ''
213
+ output:
214
+ exp_dir: ./exp/20250429-174600
215
+ tensorboard_dir: ./tensorboard/20250429-174600
216
+ save_checkpoint:
217
+ iteration:
218
+ every: 1000
219
+ path: ./exp/20250429-174600/model/iteration{iteration}.pth
220
+ epoch:
221
+ every: 1
222
+ path: ./exp/20250429-174600/model/epoch{epoch}.pth
223
+ last:
224
+ path: ./exp/20250429-174600/model/last.pth
225
+ best_epoch:
226
+ path: ./exp/20250429-174600/model/best_epoch.pth
227
+ steps:
228
+ epochs: 10
229
+ iterations: null
230
+ lr_scheduler: epoch
231
+ test:
232
+ dataset:
233
+ test:
234
+ _target_: torch.utils.data.Dataset
235
+ dataloader:
236
+ test:
237
+ _target_: torch.utils.data.DataLoader
238
+ batch_size: 1
239
+ shuffle: false
240
+ key_mapping:
241
+ inference:
242
+ input: null
243
+ output: null
244
+ identifier: null
245
+ checkpoint: null
246
+ remove_weight_norm: null
247
+ output:
248
+ exp_dir: ./exp
249
+ inference_dir: ./exp/inference
250
+ audio:
251
+ sample_rate: 32000
252
+ key_mapping:
253
+ inference:
254
+ output: null
255
+ reference: null
256
+ transforms:
257
+ inference:
258
+ output: null
259
+ reference: null
260
+ ddp_kwargs: null
261
+ model:
262
+ _target_: birdclef2025.models.ConvNeXtTiny
263
+ weights: IMAGENET1K_V1
264
+ num_classes: 206
265
+ optimizer:
266
+ _target_: torch.optim.AdamW
267
+ lr: 0.0001
268
+ weight_decay: 0.05
269
+ lr_scheduler: {}
270
+ criterion:
271
+ _target_: audyn.criterion.MultiCriteria
272
+ cross_entropy:
273
+ _target_: audyn.criterion.BaseCriterionWrapper
274
+ criterion:
275
+ _target_: torch.nn.CrossEntropyLoss
276
+ reduction: mean
277
+ weight: 1
278
+ key_mapping:
279
+ estimated:
280
+ input: logit
281
+ target:
282
+ target: label_index
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/log/20250429-174603/train.log ADDED
The diff for this file is too large to render. See raw diff
 
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/model/best_epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86838ad0507b599924a8eca92c0e9295cbd0fdd4858fd662153e1bdd4f710914
3
+ size 335992534
recipes/BirdCLEF2025/ConvNeXtTiny/exp/20250429-174600/model/last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e05e2aaadfca28516aeda2d907ddcba8accdb5118e03ce38f63ff28395b8a155
3
+ size 335953390
recipes/BirdCLEF2025/ConvNeXtTiny/tensorboard/20250429-091731/events.out.tfevents.1746371437.MacBook-Pro-2.local.7605.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:123ef3c4dcd02d0f1242a960e9c030ab8bddee904817d8759f7f1f2022f6dde1
3
+ size 472294
recipes/BirdCLEF2025/ConvNeXtTiny/tensorboard/20250429-174600/events.out.tfevents.1746371438.MacBook-Pro-2.local.7605.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dc80cd9207cda3799c3d6d15f9d93126653ea9174346166bb454b8c60954e6e
3
+ size 472294
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/README.md ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ system=default_seed-0
2
+ data=birdclef2025_5s
3
+ train=birdclef2025_efficientnet_b0
4
+ model=birdclef2025_efficientnet_b0
5
+ criterion=birdclef2025_categorical_cross_entropy
6
+
7
+ public_score: 0.479
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/log/20250427-104218/.hydra/config.yaml ADDED
@@ -0,0 +1,219 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: null
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: null
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 5
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: ${..audio.sample_rate}
47
+ hop_length: 1253
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_5s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_5s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: ${..train.audio_key}
86
+ sample_rate_key: ${..train.sample_rate_key}
87
+ label_name_key: ${..train.label_name_key}
88
+ filename_key: ${..train.filename_key}
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelComposer
98
+ melspectrogram_transform: ${data.melspectrogram}
99
+ audio_key: audio
100
+ sample_rate_key: sample_rate
101
+ label_name_key: primary_label
102
+ filename_key: filename
103
+ waveform_key: waveform
104
+ melspectrogram_key: log_melspectrogram
105
+ label_index_key: label_index
106
+ sample_rate: ${data.audio.sample_rate}
107
+ duration: ${data.audio.duration}
108
+ decode_audio_as_waveform: true
109
+ decode_audio_as_monoral: true
110
+ training: true
111
+ melspectrogram_key: ${.composer.melspectrogram_key}
112
+ label_index_key: ${.composer.label_index_key}
113
+ alpha: 0.4
114
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
115
+ validation:
116
+ _target_: torch.utils.data.DataLoader
117
+ batch_size: 64
118
+ shuffle: false
119
+ collate_fn:
120
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
121
+ composer:
122
+ _target_: ${....train.collate_fn.composer._target_}
123
+ melspectrogram_transform: ${....train.collate_fn.composer.melspectrogram_transform}
124
+ audio_key: ${....train.collate_fn.composer.audio_key}
125
+ sample_rate_key: ${....train.collate_fn.composer.sample_rate_key}
126
+ label_name_key: ${....train.collate_fn.composer.label_name_key}
127
+ filename_key: ${....train.collate_fn.composer.filename_key}
128
+ waveform_key: ${....train.collate_fn.composer.waveform_key}
129
+ melspectrogram_key: ${....train.collate_fn.composer.melspectrogram_key}
130
+ label_index_key: ${....train.collate_fn.composer.label_index_key}
131
+ sample_rate: ${....train.collate_fn.composer.sample_rate}
132
+ duration: ${....train.collate_fn.composer.duration}
133
+ decode_audio_as_waveform: ${....train.collate_fn.composer.decode_audio_as_waveform}
134
+ decode_audio_as_monoral: ${....train.collate_fn.composer.decode_audio_as_monoral}
135
+ training: false
136
+ melspectrogram_key: ${...train.collate_fn.composer.melspectrogram_key}
137
+ label_index_key: ${...train.collate_fn.composer.label_index_key}
138
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
139
+ clip_gradient: {}
140
+ record: {}
141
+ trainer:
142
+ _target_: birdclef2025.utils.driver.BaseTrainer
143
+ key_mapping:
144
+ train:
145
+ input:
146
+ input: ${....dataloader.train.collate_fn.composer.melspectrogram_key}
147
+ output: logit
148
+ validation: ${.train}
149
+ inference: ${.validation}
150
+ ddp_kwargs: null
151
+ resume:
152
+ continue_from: ''
153
+ output:
154
+ exp_dir: ./exp/20250427-104215
155
+ tensorboard_dir: ./tensorboard/20250427-104215
156
+ save_checkpoint:
157
+ iteration:
158
+ every: 1000
159
+ path: ${...exp_dir}/model/iteration{iteration}.pth
160
+ epoch:
161
+ every: 1
162
+ path: ${...exp_dir}/model/epoch{epoch}.pth
163
+ last:
164
+ path: ${...exp_dir}/model/last.pth
165
+ best_epoch:
166
+ path: ${...exp_dir}/model/best_epoch.pth
167
+ steps:
168
+ epochs: 10
169
+ iterations: null
170
+ lr_scheduler: epoch
171
+ test:
172
+ dataset:
173
+ test:
174
+ _target_: torch.utils.data.Dataset
175
+ dataloader:
176
+ test:
177
+ _target_: torch.utils.data.DataLoader
178
+ batch_size: 1
179
+ shuffle: false
180
+ key_mapping:
181
+ inference:
182
+ input: null
183
+ output: null
184
+ identifier: null
185
+ checkpoint: null
186
+ remove_weight_norm: null
187
+ output:
188
+ exp_dir: ./exp
189
+ inference_dir: ${.exp_dir}/inference
190
+ audio:
191
+ sample_rate: ${data.audio.sample_rate}
192
+ key_mapping:
193
+ inference:
194
+ output: null
195
+ reference: null
196
+ transforms:
197
+ inference:
198
+ output: null
199
+ reference: null
200
+ model:
201
+ _target_: birdclef2025.models.EfficientNetB0
202
+ weights: ${const:torchvision.models.EfficientNet_B0_Weights.IMAGENET1K_V1}
203
+ num_classes: ${const:birdclef2025.utils.data.birdclef.num_birdclef2025_primary_labels}
204
+ optimizer:
205
+ _target_: torch.optim.Adam
206
+ lr_scheduler: {}
207
+ criterion:
208
+ _target_: audyn.criterion.MultiCriteria
209
+ cross_entropy:
210
+ _target_: audyn.criterion.BaseCriterionWrapper
211
+ criterion:
212
+ _target_: torch.nn.CrossEntropyLoss
213
+ reduction: mean
214
+ weight: 1
215
+ key_mapping:
216
+ estimated:
217
+ input: logit
218
+ target:
219
+ target: ${train.dataloader.train.collate_fn.composer.label_index_key}
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/log/20250427-104218/.hydra/hydra.yaml ADDED
@@ -0,0 +1,189 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ hydra:
2
+ run:
3
+ dir: ./exp/20250427-104215/log/20250427-104218
4
+ sweep:
5
+ dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
6
+ subdir: ${hydra.job.num}
7
+ launcher:
8
+ _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
9
+ sweeper:
10
+ _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
11
+ max_batch_size: null
12
+ params: null
13
+ help:
14
+ app_name: ${hydra.job.name}
15
+ header: '${hydra.help.app_name} is powered by Hydra.
16
+
17
+ '
18
+ footer: 'Powered by Hydra (https://hydra.cc)
19
+
20
+ Use --hydra-help to view Hydra specific help
21
+
22
+ '
23
+ template: '${hydra.help.header}
24
+
25
+ == Configuration groups ==
26
+
27
+ Compose your configuration from those groups (group=option)
28
+
29
+
30
+ $APP_CONFIG_GROUPS
31
+
32
+
33
+ == Config ==
34
+
35
+ Override anything in the config (foo.bar=value)
36
+
37
+
38
+ $CONFIG
39
+
40
+
41
+ ${hydra.help.footer}
42
+
43
+ '
44
+ hydra_help:
45
+ template: 'Hydra (${hydra.runtime.version})
46
+
47
+ See https://hydra.cc for more info.
48
+
49
+
50
+ == Flags ==
51
+
52
+ $FLAGS_HELP
53
+
54
+
55
+ == Configuration groups ==
56
+
57
+ Compose your configuration from those groups (For example, append hydra/job_logging=disabled
58
+ to command line)
59
+
60
+
61
+ $HYDRA_CONFIG_GROUPS
62
+
63
+
64
+ Use ''--cfg hydra'' to Show the Hydra config.
65
+
66
+ '
67
+ hydra_help: ???
68
+ hydra_logging:
69
+ version: 1
70
+ formatters:
71
+ simple:
72
+ format: '[%(asctime)s][HYDRA] %(message)s'
73
+ handlers:
74
+ console:
75
+ class: logging.StreamHandler
76
+ formatter: simple
77
+ stream: ext://sys.stdout
78
+ root:
79
+ level: INFO
80
+ handlers:
81
+ - console
82
+ loggers:
83
+ logging_example:
84
+ level: DEBUG
85
+ disable_existing_loggers: false
86
+ job_logging:
87
+ version: 1
88
+ formatters:
89
+ simple:
90
+ format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
91
+ handlers:
92
+ console:
93
+ class: logging.StreamHandler
94
+ formatter: simple
95
+ stream: ext://sys.stdout
96
+ file:
97
+ class: logging.FileHandler
98
+ formatter: simple
99
+ filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
100
+ root:
101
+ level: INFO
102
+ handlers:
103
+ - console
104
+ - file
105
+ disable_existing_loggers: false
106
+ env: {}
107
+ mode: RUN
108
+ searchpath: []
109
+ callbacks: {}
110
+ output_subdir: .hydra
111
+ overrides:
112
+ hydra:
113
+ - hydra.run.dir=./exp/20250427-104215/log/20250427-104218
114
+ - hydra.mode=RUN
115
+ task:
116
+ - system=cuda
117
+ - preprocess=birdclef2025
118
+ - data=birdclef2025_5s
119
+ - train=birdclef2025_efficientnet_b0
120
+ - model=birdclef2025_efficientnet_b0
121
+ - optimizer=adam
122
+ - lr_scheduler=none
123
+ - criterion=birdclef2025_categorical_cross_entropy
124
+ - preprocess.dump_format=birdclef2025
125
+ - train.dataset.train.list_path=dump/birdclef2025_5s/list/train.txt
126
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
127
+ - train.dataset.validation.list_path=dump/birdclef2025_5s/list/validation.txt
128
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
129
+ - train.resume.continue_from=
130
+ - train.output.exp_dir=./exp/20250427-104215
131
+ - train.output.tensorboard_dir=./tensorboard/20250427-104215
132
+ job:
133
+ name: train
134
+ chdir: false
135
+ override_dirname: criterion=birdclef2025_categorical_cross_entropy,data=birdclef2025_5s,lr_scheduler=none,model=birdclef2025_efficientnet_b0,optimizer=adam,preprocess.dump_format=birdclef2025,preprocess=birdclef2025,system=cuda,train.dataset.train.feature_dir=/kaggle/input/birdclef-2025,train.dataset.train.list_path=dump/birdclef2025_5s/list/train.txt,train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025,train.dataset.validation.list_path=dump/birdclef2025_5s/list/validation.txt,train.output.exp_dir=./exp/20250427-104215,train.output.tensorboard_dir=./tensorboard/20250427-104215,train.resume.continue_from=,train=birdclef2025_efficientnet_b0
136
+ id: ???
137
+ num: ???
138
+ config_name: config
139
+ env_set: {}
140
+ env_copy: []
141
+ config:
142
+ override_dirname:
143
+ kv_sep: '='
144
+ item_sep: ','
145
+ exclude_keys: []
146
+ runtime:
147
+ version: 1.3.2
148
+ version_base: '1.2'
149
+ cwd: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0
150
+ config_sources:
151
+ - path: hydra.conf
152
+ schema: pkg
153
+ provider: hydra
154
+ - path: /usr/local/lib/python3.10/dist-packages/audyn/configs
155
+ schema: file
156
+ provider: main
157
+ - path: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0/conf
158
+ schema: file
159
+ provider: command-line
160
+ - path: ''
161
+ schema: structured
162
+ provider: schema
163
+ output_dir: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/log/20250427-104218
164
+ choices:
165
+ criterion: birdclef2025_categorical_cross_entropy
166
+ lr_scheduler: none
167
+ optimizer: adam
168
+ model: birdclef2025_efficientnet_b0
169
+ test: default
170
+ test/dataloader: default
171
+ test/dataset: default
172
+ train: birdclef2025_efficientnet_b0
173
+ train/record: default
174
+ train/clip_gradient: default
175
+ train/dataloader: default
176
+ train/dataset: birdclef2025_primary-label
177
+ data: birdclef2025_5s
178
+ preprocess: birdclef2025
179
+ system: cuda
180
+ hydra/env: default
181
+ hydra/callbacks: null
182
+ hydra/job_logging: default
183
+ hydra/hydra_logging: default
184
+ hydra/hydra_help: default
185
+ hydra/help: default
186
+ hydra/sweeper: basic
187
+ hydra/launcher: basic
188
+ hydra/output: default
189
+ verbose: false
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/log/20250427-104218/.hydra/overrides.yaml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - system=cuda
2
+ - preprocess=birdclef2025
3
+ - data=birdclef2025_5s
4
+ - train=birdclef2025_efficientnet_b0
5
+ - model=birdclef2025_efficientnet_b0
6
+ - optimizer=adam
7
+ - lr_scheduler=none
8
+ - criterion=birdclef2025_categorical_cross_entropy
9
+ - preprocess.dump_format=birdclef2025
10
+ - train.dataset.train.list_path=dump/birdclef2025_5s/list/train.txt
11
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
12
+ - train.dataset.validation.list_path=dump/birdclef2025_5s/list/validation.txt
13
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
14
+ - train.resume.continue_from=
15
+ - train.output.exp_dir=./exp/20250427-104215
16
+ - train.output.tensorboard_dir=./tensorboard/20250427-104215
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/log/20250427-104218/.hydra/resolved_config.yaml ADDED
@@ -0,0 +1,278 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: false
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: 2
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 5
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: 32000
47
+ hop_length: 1253
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_5s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_5s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: audio
86
+ sample_rate_key: sample_rate
87
+ label_name_key: primary_label
88
+ filename_key: filename
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelComposer
98
+ melspectrogram_transform:
99
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
100
+ sample_rate: 32000
101
+ hop_length: 1253
102
+ f_min: 20
103
+ f_max: 16000
104
+ pad: 0
105
+ n_mels: 128
106
+ window_fn:
107
+ _target_: torch.hann_window
108
+ _partial_: true
109
+ power: 1.0
110
+ normalized: false
111
+ wkwargs: null
112
+ center: true
113
+ pad_mode: constant
114
+ onesided: null
115
+ norm: slaney
116
+ mel_scale: slaney
117
+ take_log: true
118
+ freq_mask_param:
119
+ - 0.06
120
+ - 0.1
121
+ time_mask_param:
122
+ - 0.06
123
+ - 0.12
124
+ eps: null
125
+ audio_key: audio
126
+ sample_rate_key: sample_rate
127
+ label_name_key: primary_label
128
+ filename_key: filename
129
+ waveform_key: waveform
130
+ melspectrogram_key: log_melspectrogram
131
+ label_index_key: label_index
132
+ sample_rate: 32000
133
+ duration: 5
134
+ decode_audio_as_waveform: true
135
+ decode_audio_as_monoral: true
136
+ training: true
137
+ melspectrogram_key: log_melspectrogram
138
+ label_index_key: label_index
139
+ alpha: 0.4
140
+ num_workers: 2
141
+ validation:
142
+ _target_: torch.utils.data.DataLoader
143
+ batch_size: 64
144
+ shuffle: false
145
+ collate_fn:
146
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
147
+ composer:
148
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelComposer
149
+ melspectrogram_transform:
150
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
151
+ sample_rate: 32000
152
+ hop_length: 1253
153
+ f_min: 20
154
+ f_max: 16000
155
+ pad: 0
156
+ n_mels: 128
157
+ window_fn:
158
+ _target_: torch.hann_window
159
+ _partial_: true
160
+ power: 1.0
161
+ normalized: false
162
+ wkwargs: null
163
+ center: true
164
+ pad_mode: constant
165
+ onesided: null
166
+ norm: slaney
167
+ mel_scale: slaney
168
+ take_log: true
169
+ freq_mask_param:
170
+ - 0.06
171
+ - 0.1
172
+ time_mask_param:
173
+ - 0.06
174
+ - 0.12
175
+ eps: null
176
+ audio_key: audio
177
+ sample_rate_key: sample_rate
178
+ label_name_key: primary_label
179
+ filename_key: filename
180
+ waveform_key: waveform
181
+ melspectrogram_key: log_melspectrogram
182
+ label_index_key: label_index
183
+ sample_rate: 32000
184
+ duration: 5
185
+ decode_audio_as_waveform: true
186
+ decode_audio_as_monoral: true
187
+ training: false
188
+ melspectrogram_key: log_melspectrogram
189
+ label_index_key: label_index
190
+ num_workers: 2
191
+ clip_gradient: {}
192
+ record: {}
193
+ trainer:
194
+ _target_: birdclef2025.utils.driver.BaseTrainer
195
+ key_mapping:
196
+ train:
197
+ input:
198
+ input: log_melspectrogram
199
+ output: logit
200
+ validation:
201
+ input:
202
+ input: log_melspectrogram
203
+ output: logit
204
+ inference:
205
+ input:
206
+ input: log_melspectrogram
207
+ output: logit
208
+ ddp_kwargs: null
209
+ resume:
210
+ continue_from: ''
211
+ output:
212
+ exp_dir: ./exp/20250427-104215
213
+ tensorboard_dir: ./tensorboard/20250427-104215
214
+ save_checkpoint:
215
+ iteration:
216
+ every: 1000
217
+ path: ./exp/20250427-104215/model/iteration{iteration}.pth
218
+ epoch:
219
+ every: 1
220
+ path: ./exp/20250427-104215/model/epoch{epoch}.pth
221
+ last:
222
+ path: ./exp/20250427-104215/model/last.pth
223
+ best_epoch:
224
+ path: ./exp/20250427-104215/model/best_epoch.pth
225
+ steps:
226
+ epochs: 10
227
+ iterations: null
228
+ lr_scheduler: epoch
229
+ test:
230
+ dataset:
231
+ test:
232
+ _target_: torch.utils.data.Dataset
233
+ dataloader:
234
+ test:
235
+ _target_: torch.utils.data.DataLoader
236
+ batch_size: 1
237
+ shuffle: false
238
+ key_mapping:
239
+ inference:
240
+ input: null
241
+ output: null
242
+ identifier: null
243
+ checkpoint: null
244
+ remove_weight_norm: null
245
+ output:
246
+ exp_dir: ./exp
247
+ inference_dir: ./exp/inference
248
+ audio:
249
+ sample_rate: 32000
250
+ key_mapping:
251
+ inference:
252
+ output: null
253
+ reference: null
254
+ transforms:
255
+ inference:
256
+ output: null
257
+ reference: null
258
+ ddp_kwargs: null
259
+ model:
260
+ _target_: birdclef2025.models.EfficientNetB0
261
+ weights: IMAGENET1K_V1
262
+ num_classes: 206
263
+ optimizer:
264
+ _target_: torch.optim.Adam
265
+ lr_scheduler: {}
266
+ criterion:
267
+ _target_: audyn.criterion.MultiCriteria
268
+ cross_entropy:
269
+ _target_: audyn.criterion.BaseCriterionWrapper
270
+ criterion:
271
+ _target_: torch.nn.CrossEntropyLoss
272
+ reduction: mean
273
+ weight: 1
274
+ key_mapping:
275
+ estimated:
276
+ input: logit
277
+ target:
278
+ target: label_index
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/log/20250427-104218/train.log ADDED
The diff for this file is too large to render. See raw diff
 
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/model/best_epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bb7d8a078a4012e5dbad69974508f0e16913dddec612232a155ee5790805be2
3
+ size 51764901
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-104215/model/last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:415711e50672e84febe12d7b656dd86d47ef46da0e9670c05bcab58a4e3b9a0d
3
+ size 51716259
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/README.md ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ system=default_seed-0
2
+ data=birdclef2025_15s
3
+ train=birdclef2025_efficientnet_b0
4
+ model=birdclef2025_efficientnet_b0
5
+ criterion=birdclef2025_categorical_cross_entropy
6
+
7
+ public_score: 0.476
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/log/20250427-115147/.hydra/config.yaml ADDED
@@ -0,0 +1,219 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: null
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: null
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 15
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: ${..audio.sample_rate}
47
+ hop_length: 1253
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_15s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_15s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: ${..train.audio_key}
86
+ sample_rate_key: ${..train.sample_rate_key}
87
+ label_name_key: ${..train.label_name_key}
88
+ filename_key: ${..train.filename_key}
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelComposer
98
+ melspectrogram_transform: ${data.melspectrogram}
99
+ audio_key: audio
100
+ sample_rate_key: sample_rate
101
+ label_name_key: primary_label
102
+ filename_key: filename
103
+ waveform_key: waveform
104
+ melspectrogram_key: log_melspectrogram
105
+ label_index_key: label_index
106
+ sample_rate: ${data.audio.sample_rate}
107
+ duration: ${data.audio.duration}
108
+ decode_audio_as_waveform: true
109
+ decode_audio_as_monoral: true
110
+ training: true
111
+ melspectrogram_key: ${.composer.melspectrogram_key}
112
+ label_index_key: ${.composer.label_index_key}
113
+ alpha: 0.4
114
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
115
+ validation:
116
+ _target_: torch.utils.data.DataLoader
117
+ batch_size: 64
118
+ shuffle: false
119
+ collate_fn:
120
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
121
+ composer:
122
+ _target_: ${....train.collate_fn.composer._target_}
123
+ melspectrogram_transform: ${....train.collate_fn.composer.melspectrogram_transform}
124
+ audio_key: ${....train.collate_fn.composer.audio_key}
125
+ sample_rate_key: ${....train.collate_fn.composer.sample_rate_key}
126
+ label_name_key: ${....train.collate_fn.composer.label_name_key}
127
+ filename_key: ${....train.collate_fn.composer.filename_key}
128
+ waveform_key: ${....train.collate_fn.composer.waveform_key}
129
+ melspectrogram_key: ${....train.collate_fn.composer.melspectrogram_key}
130
+ label_index_key: ${....train.collate_fn.composer.label_index_key}
131
+ sample_rate: ${....train.collate_fn.composer.sample_rate}
132
+ duration: ${....train.collate_fn.composer.duration}
133
+ decode_audio_as_waveform: ${....train.collate_fn.composer.decode_audio_as_waveform}
134
+ decode_audio_as_monoral: ${....train.collate_fn.composer.decode_audio_as_monoral}
135
+ training: false
136
+ melspectrogram_key: ${...train.collate_fn.composer.melspectrogram_key}
137
+ label_index_key: ${...train.collate_fn.composer.label_index_key}
138
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
139
+ clip_gradient: {}
140
+ record: {}
141
+ trainer:
142
+ _target_: birdclef2025.utils.driver.BaseTrainer
143
+ key_mapping:
144
+ train:
145
+ input:
146
+ input: ${....dataloader.train.collate_fn.composer.melspectrogram_key}
147
+ output: logit
148
+ validation: ${.train}
149
+ inference: ${.validation}
150
+ ddp_kwargs: null
151
+ resume:
152
+ continue_from: ''
153
+ output:
154
+ exp_dir: ./exp/20250427-115144
155
+ tensorboard_dir: ./tensorboard/20250427-115144
156
+ save_checkpoint:
157
+ iteration:
158
+ every: 1000
159
+ path: ${...exp_dir}/model/iteration{iteration}.pth
160
+ epoch:
161
+ every: 1
162
+ path: ${...exp_dir}/model/epoch{epoch}.pth
163
+ last:
164
+ path: ${...exp_dir}/model/last.pth
165
+ best_epoch:
166
+ path: ${...exp_dir}/model/best_epoch.pth
167
+ steps:
168
+ epochs: 10
169
+ iterations: null
170
+ lr_scheduler: epoch
171
+ test:
172
+ dataset:
173
+ test:
174
+ _target_: torch.utils.data.Dataset
175
+ dataloader:
176
+ test:
177
+ _target_: torch.utils.data.DataLoader
178
+ batch_size: 1
179
+ shuffle: false
180
+ key_mapping:
181
+ inference:
182
+ input: null
183
+ output: null
184
+ identifier: null
185
+ checkpoint: null
186
+ remove_weight_norm: null
187
+ output:
188
+ exp_dir: ./exp
189
+ inference_dir: ${.exp_dir}/inference
190
+ audio:
191
+ sample_rate: ${data.audio.sample_rate}
192
+ key_mapping:
193
+ inference:
194
+ output: null
195
+ reference: null
196
+ transforms:
197
+ inference:
198
+ output: null
199
+ reference: null
200
+ model:
201
+ _target_: birdclef2025.models.EfficientNetB0
202
+ weights: ${const:torchvision.models.EfficientNet_B0_Weights.IMAGENET1K_V1}
203
+ num_classes: ${const:birdclef2025.utils.data.birdclef.num_birdclef2025_primary_labels}
204
+ optimizer:
205
+ _target_: torch.optim.Adam
206
+ lr_scheduler: {}
207
+ criterion:
208
+ _target_: audyn.criterion.MultiCriteria
209
+ cross_entropy:
210
+ _target_: audyn.criterion.BaseCriterionWrapper
211
+ criterion:
212
+ _target_: torch.nn.CrossEntropyLoss
213
+ reduction: mean
214
+ weight: 1
215
+ key_mapping:
216
+ estimated:
217
+ input: logit
218
+ target:
219
+ target: ${train.dataloader.train.collate_fn.composer.label_index_key}
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/log/20250427-115147/.hydra/hydra.yaml ADDED
@@ -0,0 +1,189 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ hydra:
2
+ run:
3
+ dir: ./exp/20250427-115144/log/20250427-115147
4
+ sweep:
5
+ dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
6
+ subdir: ${hydra.job.num}
7
+ launcher:
8
+ _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
9
+ sweeper:
10
+ _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
11
+ max_batch_size: null
12
+ params: null
13
+ help:
14
+ app_name: ${hydra.job.name}
15
+ header: '${hydra.help.app_name} is powered by Hydra.
16
+
17
+ '
18
+ footer: 'Powered by Hydra (https://hydra.cc)
19
+
20
+ Use --hydra-help to view Hydra specific help
21
+
22
+ '
23
+ template: '${hydra.help.header}
24
+
25
+ == Configuration groups ==
26
+
27
+ Compose your configuration from those groups (group=option)
28
+
29
+
30
+ $APP_CONFIG_GROUPS
31
+
32
+
33
+ == Config ==
34
+
35
+ Override anything in the config (foo.bar=value)
36
+
37
+
38
+ $CONFIG
39
+
40
+
41
+ ${hydra.help.footer}
42
+
43
+ '
44
+ hydra_help:
45
+ template: 'Hydra (${hydra.runtime.version})
46
+
47
+ See https://hydra.cc for more info.
48
+
49
+
50
+ == Flags ==
51
+
52
+ $FLAGS_HELP
53
+
54
+
55
+ == Configuration groups ==
56
+
57
+ Compose your configuration from those groups (For example, append hydra/job_logging=disabled
58
+ to command line)
59
+
60
+
61
+ $HYDRA_CONFIG_GROUPS
62
+
63
+
64
+ Use ''--cfg hydra'' to Show the Hydra config.
65
+
66
+ '
67
+ hydra_help: ???
68
+ hydra_logging:
69
+ version: 1
70
+ formatters:
71
+ simple:
72
+ format: '[%(asctime)s][HYDRA] %(message)s'
73
+ handlers:
74
+ console:
75
+ class: logging.StreamHandler
76
+ formatter: simple
77
+ stream: ext://sys.stdout
78
+ root:
79
+ level: INFO
80
+ handlers:
81
+ - console
82
+ loggers:
83
+ logging_example:
84
+ level: DEBUG
85
+ disable_existing_loggers: false
86
+ job_logging:
87
+ version: 1
88
+ formatters:
89
+ simple:
90
+ format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
91
+ handlers:
92
+ console:
93
+ class: logging.StreamHandler
94
+ formatter: simple
95
+ stream: ext://sys.stdout
96
+ file:
97
+ class: logging.FileHandler
98
+ formatter: simple
99
+ filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
100
+ root:
101
+ level: INFO
102
+ handlers:
103
+ - console
104
+ - file
105
+ disable_existing_loggers: false
106
+ env: {}
107
+ mode: RUN
108
+ searchpath: []
109
+ callbacks: {}
110
+ output_subdir: .hydra
111
+ overrides:
112
+ hydra:
113
+ - hydra.run.dir=./exp/20250427-115144/log/20250427-115147
114
+ - hydra.mode=RUN
115
+ task:
116
+ - system=cuda
117
+ - preprocess=birdclef2025
118
+ - data=birdclef2025_15s
119
+ - train=birdclef2025_efficientnet_b0
120
+ - model=birdclef2025_efficientnet_b0
121
+ - optimizer=adam
122
+ - lr_scheduler=none
123
+ - criterion=birdclef2025_categorical_cross_entropy
124
+ - preprocess.dump_format=birdclef2025
125
+ - train.dataset.train.list_path=dump/birdclef2025_15s/list/train.txt
126
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
127
+ - train.dataset.validation.list_path=dump/birdclef2025_15s/list/validation.txt
128
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
129
+ - train.resume.continue_from=
130
+ - train.output.exp_dir=./exp/20250427-115144
131
+ - train.output.tensorboard_dir=./tensorboard/20250427-115144
132
+ job:
133
+ name: train
134
+ chdir: false
135
+ override_dirname: criterion=birdclef2025_categorical_cross_entropy,data=birdclef2025_15s,lr_scheduler=none,model=birdclef2025_efficientnet_b0,optimizer=adam,preprocess.dump_format=birdclef2025,preprocess=birdclef2025,system=cuda,train.dataset.train.feature_dir=/kaggle/input/birdclef-2025,train.dataset.train.list_path=dump/birdclef2025_15s/list/train.txt,train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025,train.dataset.validation.list_path=dump/birdclef2025_15s/list/validation.txt,train.output.exp_dir=./exp/20250427-115144,train.output.tensorboard_dir=./tensorboard/20250427-115144,train.resume.continue_from=,train=birdclef2025_efficientnet_b0
136
+ id: ???
137
+ num: ???
138
+ config_name: config
139
+ env_set: {}
140
+ env_copy: []
141
+ config:
142
+ override_dirname:
143
+ kv_sep: '='
144
+ item_sep: ','
145
+ exclude_keys: []
146
+ runtime:
147
+ version: 1.3.2
148
+ version_base: '1.2'
149
+ cwd: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0
150
+ config_sources:
151
+ - path: hydra.conf
152
+ schema: pkg
153
+ provider: hydra
154
+ - path: /usr/local/lib/python3.10/dist-packages/audyn/configs
155
+ schema: file
156
+ provider: main
157
+ - path: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0/conf
158
+ schema: file
159
+ provider: command-line
160
+ - path: ''
161
+ schema: structured
162
+ provider: schema
163
+ output_dir: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/log/20250427-115147
164
+ choices:
165
+ criterion: birdclef2025_categorical_cross_entropy
166
+ lr_scheduler: none
167
+ optimizer: adam
168
+ model: birdclef2025_efficientnet_b0
169
+ test: default
170
+ test/dataloader: default
171
+ test/dataset: default
172
+ train: birdclef2025_efficientnet_b0
173
+ train/record: default
174
+ train/clip_gradient: default
175
+ train/dataloader: default
176
+ train/dataset: birdclef2025_primary-label
177
+ data: birdclef2025_15s
178
+ preprocess: birdclef2025
179
+ system: cuda
180
+ hydra/env: default
181
+ hydra/callbacks: null
182
+ hydra/job_logging: default
183
+ hydra/hydra_logging: default
184
+ hydra/hydra_help: default
185
+ hydra/help: default
186
+ hydra/sweeper: basic
187
+ hydra/launcher: basic
188
+ hydra/output: default
189
+ verbose: false
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/log/20250427-115147/.hydra/overrides.yaml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - system=cuda
2
+ - preprocess=birdclef2025
3
+ - data=birdclef2025_15s
4
+ - train=birdclef2025_efficientnet_b0
5
+ - model=birdclef2025_efficientnet_b0
6
+ - optimizer=adam
7
+ - lr_scheduler=none
8
+ - criterion=birdclef2025_categorical_cross_entropy
9
+ - preprocess.dump_format=birdclef2025
10
+ - train.dataset.train.list_path=dump/birdclef2025_15s/list/train.txt
11
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
12
+ - train.dataset.validation.list_path=dump/birdclef2025_15s/list/validation.txt
13
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
14
+ - train.resume.continue_from=
15
+ - train.output.exp_dir=./exp/20250427-115144
16
+ - train.output.tensorboard_dir=./tensorboard/20250427-115144
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/log/20250427-115147/.hydra/resolved_config.yaml ADDED
@@ -0,0 +1,278 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: false
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: 2
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 15
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: 32000
47
+ hop_length: 1253
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_15s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_15s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: audio
86
+ sample_rate_key: sample_rate
87
+ label_name_key: primary_label
88
+ filename_key: filename
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelComposer
98
+ melspectrogram_transform:
99
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
100
+ sample_rate: 32000
101
+ hop_length: 1253
102
+ f_min: 20
103
+ f_max: 16000
104
+ pad: 0
105
+ n_mels: 128
106
+ window_fn:
107
+ _target_: torch.hann_window
108
+ _partial_: true
109
+ power: 1.0
110
+ normalized: false
111
+ wkwargs: null
112
+ center: true
113
+ pad_mode: constant
114
+ onesided: null
115
+ norm: slaney
116
+ mel_scale: slaney
117
+ take_log: true
118
+ freq_mask_param:
119
+ - 0.06
120
+ - 0.1
121
+ time_mask_param:
122
+ - 0.06
123
+ - 0.12
124
+ eps: null
125
+ audio_key: audio
126
+ sample_rate_key: sample_rate
127
+ label_name_key: primary_label
128
+ filename_key: filename
129
+ waveform_key: waveform
130
+ melspectrogram_key: log_melspectrogram
131
+ label_index_key: label_index
132
+ sample_rate: 32000
133
+ duration: 15
134
+ decode_audio_as_waveform: true
135
+ decode_audio_as_monoral: true
136
+ training: true
137
+ melspectrogram_key: log_melspectrogram
138
+ label_index_key: label_index
139
+ alpha: 0.4
140
+ num_workers: 2
141
+ validation:
142
+ _target_: torch.utils.data.DataLoader
143
+ batch_size: 64
144
+ shuffle: false
145
+ collate_fn:
146
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
147
+ composer:
148
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelComposer
149
+ melspectrogram_transform:
150
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
151
+ sample_rate: 32000
152
+ hop_length: 1253
153
+ f_min: 20
154
+ f_max: 16000
155
+ pad: 0
156
+ n_mels: 128
157
+ window_fn:
158
+ _target_: torch.hann_window
159
+ _partial_: true
160
+ power: 1.0
161
+ normalized: false
162
+ wkwargs: null
163
+ center: true
164
+ pad_mode: constant
165
+ onesided: null
166
+ norm: slaney
167
+ mel_scale: slaney
168
+ take_log: true
169
+ freq_mask_param:
170
+ - 0.06
171
+ - 0.1
172
+ time_mask_param:
173
+ - 0.06
174
+ - 0.12
175
+ eps: null
176
+ audio_key: audio
177
+ sample_rate_key: sample_rate
178
+ label_name_key: primary_label
179
+ filename_key: filename
180
+ waveform_key: waveform
181
+ melspectrogram_key: log_melspectrogram
182
+ label_index_key: label_index
183
+ sample_rate: 32000
184
+ duration: 15
185
+ decode_audio_as_waveform: true
186
+ decode_audio_as_monoral: true
187
+ training: false
188
+ melspectrogram_key: log_melspectrogram
189
+ label_index_key: label_index
190
+ num_workers: 2
191
+ clip_gradient: {}
192
+ record: {}
193
+ trainer:
194
+ _target_: birdclef2025.utils.driver.BaseTrainer
195
+ key_mapping:
196
+ train:
197
+ input:
198
+ input: log_melspectrogram
199
+ output: logit
200
+ validation:
201
+ input:
202
+ input: log_melspectrogram
203
+ output: logit
204
+ inference:
205
+ input:
206
+ input: log_melspectrogram
207
+ output: logit
208
+ ddp_kwargs: null
209
+ resume:
210
+ continue_from: ''
211
+ output:
212
+ exp_dir: ./exp/20250427-115144
213
+ tensorboard_dir: ./tensorboard/20250427-115144
214
+ save_checkpoint:
215
+ iteration:
216
+ every: 1000
217
+ path: ./exp/20250427-115144/model/iteration{iteration}.pth
218
+ epoch:
219
+ every: 1
220
+ path: ./exp/20250427-115144/model/epoch{epoch}.pth
221
+ last:
222
+ path: ./exp/20250427-115144/model/last.pth
223
+ best_epoch:
224
+ path: ./exp/20250427-115144/model/best_epoch.pth
225
+ steps:
226
+ epochs: 10
227
+ iterations: null
228
+ lr_scheduler: epoch
229
+ test:
230
+ dataset:
231
+ test:
232
+ _target_: torch.utils.data.Dataset
233
+ dataloader:
234
+ test:
235
+ _target_: torch.utils.data.DataLoader
236
+ batch_size: 1
237
+ shuffle: false
238
+ key_mapping:
239
+ inference:
240
+ input: null
241
+ output: null
242
+ identifier: null
243
+ checkpoint: null
244
+ remove_weight_norm: null
245
+ output:
246
+ exp_dir: ./exp
247
+ inference_dir: ./exp/inference
248
+ audio:
249
+ sample_rate: 32000
250
+ key_mapping:
251
+ inference:
252
+ output: null
253
+ reference: null
254
+ transforms:
255
+ inference:
256
+ output: null
257
+ reference: null
258
+ ddp_kwargs: null
259
+ model:
260
+ _target_: birdclef2025.models.EfficientNetB0
261
+ weights: IMAGENET1K_V1
262
+ num_classes: 206
263
+ optimizer:
264
+ _target_: torch.optim.Adam
265
+ lr_scheduler: {}
266
+ criterion:
267
+ _target_: audyn.criterion.MultiCriteria
268
+ cross_entropy:
269
+ _target_: audyn.criterion.BaseCriterionWrapper
270
+ criterion:
271
+ _target_: torch.nn.CrossEntropyLoss
272
+ reduction: mean
273
+ weight: 1
274
+ key_mapping:
275
+ estimated:
276
+ input: logit
277
+ target:
278
+ target: label_index
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/log/20250427-115147/train.log ADDED
The diff for this file is too large to render. See raw diff
 
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/model/best_epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:887a11993732bc610e1fe1aba1f139ce608e5989ddba7e63575376045cab0511
3
+ size 51764901
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-115144/model/last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4362e841a15c2fb999d73eb4ff6e50b84e2f5ea8822fa594771eab4043fa1d4
3
+ size 51716259
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/README.md ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ system=default_seed-0
2
+ data=birdclef2025_reshape_15s
3
+ train=birdclef2025_reshape_efficientnet_b0
4
+ model=birdclef2025_efficientnet_b0
5
+ criterion=birdclef2025_categorical_cross_entropy
6
+
7
+ public_score: 0.519
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/log/20250427-133047/.hydra/config.yaml ADDED
@@ -0,0 +1,221 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: null
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: null
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 15
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: ${..audio.sample_rate}
47
+ hop_length: 512
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_reshape_15s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_reshape_15s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: ${..train.audio_key}
86
+ sample_rate_key: ${..train.sample_rate_key}
87
+ label_name_key: ${..train.label_name_key}
88
+ filename_key: ${..train.filename_key}
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025ReshapePrimaryLabelComposer
98
+ melspectrogram_transform: ${data.melspectrogram}
99
+ audio_key: audio
100
+ sample_rate_key: sample_rate
101
+ label_name_key: primary_label
102
+ filename_key: filename
103
+ waveform_key: waveform
104
+ melspectrogram_key: log_melspectrogram
105
+ label_index_key: label_index
106
+ sample_rate: ${data.audio.sample_rate}
107
+ duration: ${data.audio.duration}
108
+ decode_audio_as_waveform: true
109
+ decode_audio_as_monoral: true
110
+ training: true
111
+ target_shape: 256
112
+ melspectrogram_key: ${.composer.melspectrogram_key}
113
+ label_index_key: ${.composer.label_index_key}
114
+ alpha: 0.4
115
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
116
+ validation:
117
+ _target_: torch.utils.data.DataLoader
118
+ batch_size: 64
119
+ shuffle: false
120
+ collate_fn:
121
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
122
+ composer:
123
+ _target_: ${....train.collate_fn.composer._target_}
124
+ melspectrogram_transform: ${....train.collate_fn.composer.melspectrogram_transform}
125
+ audio_key: ${....train.collate_fn.composer.audio_key}
126
+ sample_rate_key: ${....train.collate_fn.composer.sample_rate_key}
127
+ label_name_key: ${....train.collate_fn.composer.label_name_key}
128
+ filename_key: ${....train.collate_fn.composer.filename_key}
129
+ waveform_key: ${....train.collate_fn.composer.waveform_key}
130
+ melspectrogram_key: ${....train.collate_fn.composer.melspectrogram_key}
131
+ label_index_key: ${....train.collate_fn.composer.label_index_key}
132
+ sample_rate: ${....train.collate_fn.composer.sample_rate}
133
+ duration: ${....train.collate_fn.composer.duration}
134
+ decode_audio_as_waveform: ${....train.collate_fn.composer.decode_audio_as_waveform}
135
+ decode_audio_as_monoral: ${....train.collate_fn.composer.decode_audio_as_monoral}
136
+ training: false
137
+ target_shape: ${....train.collate_fn.composer.target_shape}
138
+ melspectrogram_key: ${...train.collate_fn.composer.melspectrogram_key}
139
+ label_index_key: ${...train.collate_fn.composer.label_index_key}
140
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
141
+ clip_gradient: {}
142
+ record: {}
143
+ trainer:
144
+ _target_: birdclef2025.utils.driver.BaseTrainer
145
+ key_mapping:
146
+ train:
147
+ input:
148
+ input: ${....dataloader.train.collate_fn.composer.melspectrogram_key}
149
+ output: logit
150
+ validation: ${.train}
151
+ inference: ${.validation}
152
+ ddp_kwargs: null
153
+ resume:
154
+ continue_from: ''
155
+ output:
156
+ exp_dir: ./exp/20250427-133045
157
+ tensorboard_dir: ./tensorboard/20250427-133045
158
+ save_checkpoint:
159
+ iteration:
160
+ every: 1000
161
+ path: ${...exp_dir}/model/iteration{iteration}.pth
162
+ epoch:
163
+ every: 1
164
+ path: ${...exp_dir}/model/epoch{epoch}.pth
165
+ last:
166
+ path: ${...exp_dir}/model/last.pth
167
+ best_epoch:
168
+ path: ${...exp_dir}/model/best_epoch.pth
169
+ steps:
170
+ epochs: 10
171
+ iterations: null
172
+ lr_scheduler: epoch
173
+ test:
174
+ dataset:
175
+ test:
176
+ _target_: torch.utils.data.Dataset
177
+ dataloader:
178
+ test:
179
+ _target_: torch.utils.data.DataLoader
180
+ batch_size: 1
181
+ shuffle: false
182
+ key_mapping:
183
+ inference:
184
+ input: null
185
+ output: null
186
+ identifier: null
187
+ checkpoint: null
188
+ remove_weight_norm: null
189
+ output:
190
+ exp_dir: ./exp
191
+ inference_dir: ${.exp_dir}/inference
192
+ audio:
193
+ sample_rate: ${data.audio.sample_rate}
194
+ key_mapping:
195
+ inference:
196
+ output: null
197
+ reference: null
198
+ transforms:
199
+ inference:
200
+ output: null
201
+ reference: null
202
+ model:
203
+ _target_: birdclef2025.models.EfficientNetB0
204
+ weights: ${const:torchvision.models.EfficientNet_B0_Weights.IMAGENET1K_V1}
205
+ num_classes: ${const:birdclef2025.utils.data.birdclef.num_birdclef2025_primary_labels}
206
+ optimizer:
207
+ _target_: torch.optim.Adam
208
+ lr_scheduler: {}
209
+ criterion:
210
+ _target_: audyn.criterion.MultiCriteria
211
+ cross_entropy:
212
+ _target_: audyn.criterion.BaseCriterionWrapper
213
+ criterion:
214
+ _target_: torch.nn.CrossEntropyLoss
215
+ reduction: mean
216
+ weight: 1
217
+ key_mapping:
218
+ estimated:
219
+ input: logit
220
+ target:
221
+ target: ${train.dataloader.train.collate_fn.composer.label_index_key}
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/log/20250427-133047/.hydra/hydra.yaml ADDED
@@ -0,0 +1,189 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ hydra:
2
+ run:
3
+ dir: ./exp/20250427-133045/log/20250427-133047
4
+ sweep:
5
+ dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
6
+ subdir: ${hydra.job.num}
7
+ launcher:
8
+ _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
9
+ sweeper:
10
+ _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
11
+ max_batch_size: null
12
+ params: null
13
+ help:
14
+ app_name: ${hydra.job.name}
15
+ header: '${hydra.help.app_name} is powered by Hydra.
16
+
17
+ '
18
+ footer: 'Powered by Hydra (https://hydra.cc)
19
+
20
+ Use --hydra-help to view Hydra specific help
21
+
22
+ '
23
+ template: '${hydra.help.header}
24
+
25
+ == Configuration groups ==
26
+
27
+ Compose your configuration from those groups (group=option)
28
+
29
+
30
+ $APP_CONFIG_GROUPS
31
+
32
+
33
+ == Config ==
34
+
35
+ Override anything in the config (foo.bar=value)
36
+
37
+
38
+ $CONFIG
39
+
40
+
41
+ ${hydra.help.footer}
42
+
43
+ '
44
+ hydra_help:
45
+ template: 'Hydra (${hydra.runtime.version})
46
+
47
+ See https://hydra.cc for more info.
48
+
49
+
50
+ == Flags ==
51
+
52
+ $FLAGS_HELP
53
+
54
+
55
+ == Configuration groups ==
56
+
57
+ Compose your configuration from those groups (For example, append hydra/job_logging=disabled
58
+ to command line)
59
+
60
+
61
+ $HYDRA_CONFIG_GROUPS
62
+
63
+
64
+ Use ''--cfg hydra'' to Show the Hydra config.
65
+
66
+ '
67
+ hydra_help: ???
68
+ hydra_logging:
69
+ version: 1
70
+ formatters:
71
+ simple:
72
+ format: '[%(asctime)s][HYDRA] %(message)s'
73
+ handlers:
74
+ console:
75
+ class: logging.StreamHandler
76
+ formatter: simple
77
+ stream: ext://sys.stdout
78
+ root:
79
+ level: INFO
80
+ handlers:
81
+ - console
82
+ loggers:
83
+ logging_example:
84
+ level: DEBUG
85
+ disable_existing_loggers: false
86
+ job_logging:
87
+ version: 1
88
+ formatters:
89
+ simple:
90
+ format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
91
+ handlers:
92
+ console:
93
+ class: logging.StreamHandler
94
+ formatter: simple
95
+ stream: ext://sys.stdout
96
+ file:
97
+ class: logging.FileHandler
98
+ formatter: simple
99
+ filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
100
+ root:
101
+ level: INFO
102
+ handlers:
103
+ - console
104
+ - file
105
+ disable_existing_loggers: false
106
+ env: {}
107
+ mode: RUN
108
+ searchpath: []
109
+ callbacks: {}
110
+ output_subdir: .hydra
111
+ overrides:
112
+ hydra:
113
+ - hydra.run.dir=./exp/20250427-133045/log/20250427-133047
114
+ - hydra.mode=RUN
115
+ task:
116
+ - system=cuda
117
+ - preprocess=birdclef2025
118
+ - data=birdclef2025_reshape_15s
119
+ - train=birdclef2025_reshape_efficientnet_b0
120
+ - model=birdclef2025_efficientnet_b0
121
+ - optimizer=adam
122
+ - lr_scheduler=none
123
+ - criterion=birdclef2025_categorical_cross_entropy
124
+ - preprocess.dump_format=birdclef2025
125
+ - train.dataset.train.list_path=dump/birdclef2025_reshape_15s/list/train.txt
126
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
127
+ - train.dataset.validation.list_path=dump/birdclef2025_reshape_15s/list/validation.txt
128
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
129
+ - train.resume.continue_from=
130
+ - train.output.exp_dir=./exp/20250427-133045
131
+ - train.output.tensorboard_dir=./tensorboard/20250427-133045
132
+ job:
133
+ name: train
134
+ chdir: false
135
+ override_dirname: criterion=birdclef2025_categorical_cross_entropy,data=birdclef2025_reshape_15s,lr_scheduler=none,model=birdclef2025_efficientnet_b0,optimizer=adam,preprocess.dump_format=birdclef2025,preprocess=birdclef2025,system=cuda,train.dataset.train.feature_dir=/kaggle/input/birdclef-2025,train.dataset.train.list_path=dump/birdclef2025_reshape_15s/list/train.txt,train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025,train.dataset.validation.list_path=dump/birdclef2025_reshape_15s/list/validation.txt,train.output.exp_dir=./exp/20250427-133045,train.output.tensorboard_dir=./tensorboard/20250427-133045,train.resume.continue_from=,train=birdclef2025_reshape_efficientnet_b0
136
+ id: ???
137
+ num: ???
138
+ config_name: config
139
+ env_set: {}
140
+ env_copy: []
141
+ config:
142
+ override_dirname:
143
+ kv_sep: '='
144
+ item_sep: ','
145
+ exclude_keys: []
146
+ runtime:
147
+ version: 1.3.2
148
+ version_base: '1.2'
149
+ cwd: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0
150
+ config_sources:
151
+ - path: hydra.conf
152
+ schema: pkg
153
+ provider: hydra
154
+ - path: /usr/local/lib/python3.10/dist-packages/audyn/configs
155
+ schema: file
156
+ provider: main
157
+ - path: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0/conf
158
+ schema: file
159
+ provider: command-line
160
+ - path: ''
161
+ schema: structured
162
+ provider: schema
163
+ output_dir: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/log/20250427-133047
164
+ choices:
165
+ criterion: birdclef2025_categorical_cross_entropy
166
+ lr_scheduler: none
167
+ optimizer: adam
168
+ model: birdclef2025_efficientnet_b0
169
+ test: default
170
+ test/dataloader: default
171
+ test/dataset: default
172
+ train: birdclef2025_reshape_efficientnet_b0
173
+ train/record: default
174
+ train/clip_gradient: default
175
+ train/dataloader: default
176
+ train/dataset: birdclef2025_primary-label
177
+ data: birdclef2025_reshape_15s
178
+ preprocess: birdclef2025
179
+ system: cuda
180
+ hydra/env: default
181
+ hydra/callbacks: null
182
+ hydra/job_logging: default
183
+ hydra/hydra_logging: default
184
+ hydra/hydra_help: default
185
+ hydra/help: default
186
+ hydra/sweeper: basic
187
+ hydra/launcher: basic
188
+ hydra/output: default
189
+ verbose: false
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/log/20250427-133047/.hydra/overrides.yaml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - system=cuda
2
+ - preprocess=birdclef2025
3
+ - data=birdclef2025_reshape_15s
4
+ - train=birdclef2025_reshape_efficientnet_b0
5
+ - model=birdclef2025_efficientnet_b0
6
+ - optimizer=adam
7
+ - lr_scheduler=none
8
+ - criterion=birdclef2025_categorical_cross_entropy
9
+ - preprocess.dump_format=birdclef2025
10
+ - train.dataset.train.list_path=dump/birdclef2025_reshape_15s/list/train.txt
11
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
12
+ - train.dataset.validation.list_path=dump/birdclef2025_reshape_15s/list/validation.txt
13
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
14
+ - train.resume.continue_from=
15
+ - train.output.exp_dir=./exp/20250427-133045
16
+ - train.output.tensorboard_dir=./tensorboard/20250427-133045
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/log/20250427-133047/.hydra/resolved_config.yaml ADDED
@@ -0,0 +1,280 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: false
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: 2
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 15
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: 32000
47
+ hop_length: 512
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_reshape_15s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_reshape_15s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: audio
86
+ sample_rate_key: sample_rate
87
+ label_name_key: primary_label
88
+ filename_key: filename
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025ReshapePrimaryLabelComposer
98
+ melspectrogram_transform:
99
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
100
+ sample_rate: 32000
101
+ hop_length: 512
102
+ f_min: 20
103
+ f_max: 16000
104
+ pad: 0
105
+ n_mels: 128
106
+ window_fn:
107
+ _target_: torch.hann_window
108
+ _partial_: true
109
+ power: 1.0
110
+ normalized: false
111
+ wkwargs: null
112
+ center: true
113
+ pad_mode: constant
114
+ onesided: null
115
+ norm: slaney
116
+ mel_scale: slaney
117
+ take_log: true
118
+ freq_mask_param:
119
+ - 0.06
120
+ - 0.1
121
+ time_mask_param:
122
+ - 0.06
123
+ - 0.12
124
+ eps: null
125
+ audio_key: audio
126
+ sample_rate_key: sample_rate
127
+ label_name_key: primary_label
128
+ filename_key: filename
129
+ waveform_key: waveform
130
+ melspectrogram_key: log_melspectrogram
131
+ label_index_key: label_index
132
+ sample_rate: 32000
133
+ duration: 15
134
+ decode_audio_as_waveform: true
135
+ decode_audio_as_monoral: true
136
+ training: true
137
+ target_shape: 256
138
+ melspectrogram_key: log_melspectrogram
139
+ label_index_key: label_index
140
+ alpha: 0.4
141
+ num_workers: 2
142
+ validation:
143
+ _target_: torch.utils.data.DataLoader
144
+ batch_size: 64
145
+ shuffle: false
146
+ collate_fn:
147
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
148
+ composer:
149
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025ReshapePrimaryLabelComposer
150
+ melspectrogram_transform:
151
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
152
+ sample_rate: 32000
153
+ hop_length: 512
154
+ f_min: 20
155
+ f_max: 16000
156
+ pad: 0
157
+ n_mels: 128
158
+ window_fn:
159
+ _target_: torch.hann_window
160
+ _partial_: true
161
+ power: 1.0
162
+ normalized: false
163
+ wkwargs: null
164
+ center: true
165
+ pad_mode: constant
166
+ onesided: null
167
+ norm: slaney
168
+ mel_scale: slaney
169
+ take_log: true
170
+ freq_mask_param:
171
+ - 0.06
172
+ - 0.1
173
+ time_mask_param:
174
+ - 0.06
175
+ - 0.12
176
+ eps: null
177
+ audio_key: audio
178
+ sample_rate_key: sample_rate
179
+ label_name_key: primary_label
180
+ filename_key: filename
181
+ waveform_key: waveform
182
+ melspectrogram_key: log_melspectrogram
183
+ label_index_key: label_index
184
+ sample_rate: 32000
185
+ duration: 15
186
+ decode_audio_as_waveform: true
187
+ decode_audio_as_monoral: true
188
+ training: false
189
+ target_shape: 256
190
+ melspectrogram_key: log_melspectrogram
191
+ label_index_key: label_index
192
+ num_workers: 2
193
+ clip_gradient: {}
194
+ record: {}
195
+ trainer:
196
+ _target_: birdclef2025.utils.driver.BaseTrainer
197
+ key_mapping:
198
+ train:
199
+ input:
200
+ input: log_melspectrogram
201
+ output: logit
202
+ validation:
203
+ input:
204
+ input: log_melspectrogram
205
+ output: logit
206
+ inference:
207
+ input:
208
+ input: log_melspectrogram
209
+ output: logit
210
+ ddp_kwargs: null
211
+ resume:
212
+ continue_from: ''
213
+ output:
214
+ exp_dir: ./exp/20250427-133045
215
+ tensorboard_dir: ./tensorboard/20250427-133045
216
+ save_checkpoint:
217
+ iteration:
218
+ every: 1000
219
+ path: ./exp/20250427-133045/model/iteration{iteration}.pth
220
+ epoch:
221
+ every: 1
222
+ path: ./exp/20250427-133045/model/epoch{epoch}.pth
223
+ last:
224
+ path: ./exp/20250427-133045/model/last.pth
225
+ best_epoch:
226
+ path: ./exp/20250427-133045/model/best_epoch.pth
227
+ steps:
228
+ epochs: 10
229
+ iterations: null
230
+ lr_scheduler: epoch
231
+ test:
232
+ dataset:
233
+ test:
234
+ _target_: torch.utils.data.Dataset
235
+ dataloader:
236
+ test:
237
+ _target_: torch.utils.data.DataLoader
238
+ batch_size: 1
239
+ shuffle: false
240
+ key_mapping:
241
+ inference:
242
+ input: null
243
+ output: null
244
+ identifier: null
245
+ checkpoint: null
246
+ remove_weight_norm: null
247
+ output:
248
+ exp_dir: ./exp
249
+ inference_dir: ./exp/inference
250
+ audio:
251
+ sample_rate: 32000
252
+ key_mapping:
253
+ inference:
254
+ output: null
255
+ reference: null
256
+ transforms:
257
+ inference:
258
+ output: null
259
+ reference: null
260
+ ddp_kwargs: null
261
+ model:
262
+ _target_: birdclef2025.models.EfficientNetB0
263
+ weights: IMAGENET1K_V1
264
+ num_classes: 206
265
+ optimizer:
266
+ _target_: torch.optim.Adam
267
+ lr_scheduler: {}
268
+ criterion:
269
+ _target_: audyn.criterion.MultiCriteria
270
+ cross_entropy:
271
+ _target_: audyn.criterion.BaseCriterionWrapper
272
+ criterion:
273
+ _target_: torch.nn.CrossEntropyLoss
274
+ reduction: mean
275
+ weight: 1
276
+ key_mapping:
277
+ estimated:
278
+ input: logit
279
+ target:
280
+ target: label_index
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/log/20250427-133047/train.log ADDED
The diff for this file is too large to render. See raw diff
 
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/model/best_epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7dc01e358d6c9cdfe0d88db0cdef138aca9756e3751f8114a599b1a6f82f8ca3
3
+ size 51764965
recipes/BirdCLEF2025/EfficientNetB0/exp/20250427-133045/model/last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab04bd9340de85728e8187eb6f92a7cd4fcc59c6492344fd410665968890aa90
3
+ size 51716323
recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/README.md ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ system=default_seed-0
2
+ data=birdclef2025_reshape_5s
3
+ train=birdclef2025_reshape_efficientnet_b0
4
+ model=birdclef2025_efficientnet_b0
5
+ criterion=birdclef2025_categorical_cross_entropy
6
+
7
+ public_score: 0.490
recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/log/20250428-032425/.hydra/config.yaml ADDED
@@ -0,0 +1,221 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: null
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: null
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 5
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: ${..audio.sample_rate}
47
+ hop_length: 512
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_reshape_5s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_reshape_5s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: ${..train.audio_key}
86
+ sample_rate_key: ${..train.sample_rate_key}
87
+ label_name_key: ${..train.label_name_key}
88
+ filename_key: ${..train.filename_key}
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025ReshapePrimaryLabelComposer
98
+ melspectrogram_transform: ${data.melspectrogram}
99
+ audio_key: audio
100
+ sample_rate_key: sample_rate
101
+ label_name_key: primary_label
102
+ filename_key: filename
103
+ waveform_key: waveform
104
+ melspectrogram_key: log_melspectrogram
105
+ label_index_key: label_index
106
+ sample_rate: ${data.audio.sample_rate}
107
+ duration: ${data.audio.duration}
108
+ decode_audio_as_waveform: true
109
+ decode_audio_as_monoral: true
110
+ training: true
111
+ target_shape: 256
112
+ melspectrogram_key: ${.composer.melspectrogram_key}
113
+ label_index_key: ${.composer.label_index_key}
114
+ alpha: 0.4
115
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
116
+ validation:
117
+ _target_: torch.utils.data.DataLoader
118
+ batch_size: 64
119
+ shuffle: false
120
+ collate_fn:
121
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
122
+ composer:
123
+ _target_: ${....train.collate_fn.composer._target_}
124
+ melspectrogram_transform: ${....train.collate_fn.composer.melspectrogram_transform}
125
+ audio_key: ${....train.collate_fn.composer.audio_key}
126
+ sample_rate_key: ${....train.collate_fn.composer.sample_rate_key}
127
+ label_name_key: ${....train.collate_fn.composer.label_name_key}
128
+ filename_key: ${....train.collate_fn.composer.filename_key}
129
+ waveform_key: ${....train.collate_fn.composer.waveform_key}
130
+ melspectrogram_key: ${....train.collate_fn.composer.melspectrogram_key}
131
+ label_index_key: ${....train.collate_fn.composer.label_index_key}
132
+ sample_rate: ${....train.collate_fn.composer.sample_rate}
133
+ duration: ${....train.collate_fn.composer.duration}
134
+ decode_audio_as_waveform: ${....train.collate_fn.composer.decode_audio_as_waveform}
135
+ decode_audio_as_monoral: ${....train.collate_fn.composer.decode_audio_as_monoral}
136
+ training: false
137
+ target_shape: ${....train.collate_fn.composer.target_shape}
138
+ melspectrogram_key: ${...train.collate_fn.composer.melspectrogram_key}
139
+ label_index_key: ${...train.collate_fn.composer.label_index_key}
140
+ num_workers: ${const:birdclef2025.utils.data.default_num_workers}
141
+ clip_gradient: {}
142
+ record: {}
143
+ trainer:
144
+ _target_: birdclef2025.utils.driver.BaseTrainer
145
+ key_mapping:
146
+ train:
147
+ input:
148
+ input: ${....dataloader.train.collate_fn.composer.melspectrogram_key}
149
+ output: logit
150
+ validation: ${.train}
151
+ inference: ${.validation}
152
+ ddp_kwargs: null
153
+ resume:
154
+ continue_from: ''
155
+ output:
156
+ exp_dir: ./exp/20250428-032422
157
+ tensorboard_dir: ./tensorboard/20250428-032422
158
+ save_checkpoint:
159
+ iteration:
160
+ every: 1000
161
+ path: ${...exp_dir}/model/iteration{iteration}.pth
162
+ epoch:
163
+ every: 1
164
+ path: ${...exp_dir}/model/epoch{epoch}.pth
165
+ last:
166
+ path: ${...exp_dir}/model/last.pth
167
+ best_epoch:
168
+ path: ${...exp_dir}/model/best_epoch.pth
169
+ steps:
170
+ epochs: 10
171
+ iterations: null
172
+ lr_scheduler: epoch
173
+ test:
174
+ dataset:
175
+ test:
176
+ _target_: torch.utils.data.Dataset
177
+ dataloader:
178
+ test:
179
+ _target_: torch.utils.data.DataLoader
180
+ batch_size: 1
181
+ shuffle: false
182
+ key_mapping:
183
+ inference:
184
+ input: null
185
+ output: null
186
+ identifier: null
187
+ checkpoint: null
188
+ remove_weight_norm: null
189
+ output:
190
+ exp_dir: ./exp
191
+ inference_dir: ${.exp_dir}/inference
192
+ audio:
193
+ sample_rate: ${data.audio.sample_rate}
194
+ key_mapping:
195
+ inference:
196
+ output: null
197
+ reference: null
198
+ transforms:
199
+ inference:
200
+ output: null
201
+ reference: null
202
+ model:
203
+ _target_: birdclef2025.models.EfficientNetB0
204
+ weights: ${const:torchvision.models.EfficientNet_B0_Weights.IMAGENET1K_V1}
205
+ num_classes: ${const:birdclef2025.utils.data.birdclef.num_birdclef2025_primary_labels}
206
+ optimizer:
207
+ _target_: torch.optim.Adam
208
+ lr_scheduler: {}
209
+ criterion:
210
+ _target_: audyn.criterion.MultiCriteria
211
+ cross_entropy:
212
+ _target_: audyn.criterion.BaseCriterionWrapper
213
+ criterion:
214
+ _target_: torch.nn.CrossEntropyLoss
215
+ reduction: mean
216
+ weight: 1
217
+ key_mapping:
218
+ estimated:
219
+ input: logit
220
+ target:
221
+ target: ${train.dataloader.train.collate_fn.composer.label_index_key}
recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/log/20250428-032425/.hydra/hydra.yaml ADDED
@@ -0,0 +1,189 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ hydra:
2
+ run:
3
+ dir: ./exp/20250428-032422/log/20250428-032425
4
+ sweep:
5
+ dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
6
+ subdir: ${hydra.job.num}
7
+ launcher:
8
+ _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
9
+ sweeper:
10
+ _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
11
+ max_batch_size: null
12
+ params: null
13
+ help:
14
+ app_name: ${hydra.job.name}
15
+ header: '${hydra.help.app_name} is powered by Hydra.
16
+
17
+ '
18
+ footer: 'Powered by Hydra (https://hydra.cc)
19
+
20
+ Use --hydra-help to view Hydra specific help
21
+
22
+ '
23
+ template: '${hydra.help.header}
24
+
25
+ == Configuration groups ==
26
+
27
+ Compose your configuration from those groups (group=option)
28
+
29
+
30
+ $APP_CONFIG_GROUPS
31
+
32
+
33
+ == Config ==
34
+
35
+ Override anything in the config (foo.bar=value)
36
+
37
+
38
+ $CONFIG
39
+
40
+
41
+ ${hydra.help.footer}
42
+
43
+ '
44
+ hydra_help:
45
+ template: 'Hydra (${hydra.runtime.version})
46
+
47
+ See https://hydra.cc for more info.
48
+
49
+
50
+ == Flags ==
51
+
52
+ $FLAGS_HELP
53
+
54
+
55
+ == Configuration groups ==
56
+
57
+ Compose your configuration from those groups (For example, append hydra/job_logging=disabled
58
+ to command line)
59
+
60
+
61
+ $HYDRA_CONFIG_GROUPS
62
+
63
+
64
+ Use ''--cfg hydra'' to Show the Hydra config.
65
+
66
+ '
67
+ hydra_help: ???
68
+ hydra_logging:
69
+ version: 1
70
+ formatters:
71
+ simple:
72
+ format: '[%(asctime)s][HYDRA] %(message)s'
73
+ handlers:
74
+ console:
75
+ class: logging.StreamHandler
76
+ formatter: simple
77
+ stream: ext://sys.stdout
78
+ root:
79
+ level: INFO
80
+ handlers:
81
+ - console
82
+ loggers:
83
+ logging_example:
84
+ level: DEBUG
85
+ disable_existing_loggers: false
86
+ job_logging:
87
+ version: 1
88
+ formatters:
89
+ simple:
90
+ format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
91
+ handlers:
92
+ console:
93
+ class: logging.StreamHandler
94
+ formatter: simple
95
+ stream: ext://sys.stdout
96
+ file:
97
+ class: logging.FileHandler
98
+ formatter: simple
99
+ filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
100
+ root:
101
+ level: INFO
102
+ handlers:
103
+ - console
104
+ - file
105
+ disable_existing_loggers: false
106
+ env: {}
107
+ mode: RUN
108
+ searchpath: []
109
+ callbacks: {}
110
+ output_subdir: .hydra
111
+ overrides:
112
+ hydra:
113
+ - hydra.run.dir=./exp/20250428-032422/log/20250428-032425
114
+ - hydra.mode=RUN
115
+ task:
116
+ - system=cuda
117
+ - preprocess=birdclef2025
118
+ - data=birdclef2025_reshape_5s
119
+ - train=birdclef2025_reshape_efficientnet_b0
120
+ - model=birdclef2025_efficientnet_b0
121
+ - optimizer=adam
122
+ - lr_scheduler=none
123
+ - criterion=birdclef2025_categorical_cross_entropy
124
+ - preprocess.dump_format=birdclef2025
125
+ - train.dataset.train.list_path=dump/birdclef2025_reshape_5s/list/train.txt
126
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
127
+ - train.dataset.validation.list_path=dump/birdclef2025_reshape_5s/list/validation.txt
128
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
129
+ - train.resume.continue_from=
130
+ - train.output.exp_dir=./exp/20250428-032422
131
+ - train.output.tensorboard_dir=./tensorboard/20250428-032422
132
+ job:
133
+ name: train
134
+ chdir: false
135
+ override_dirname: criterion=birdclef2025_categorical_cross_entropy,data=birdclef2025_reshape_5s,lr_scheduler=none,model=birdclef2025_efficientnet_b0,optimizer=adam,preprocess.dump_format=birdclef2025,preprocess=birdclef2025,system=cuda,train.dataset.train.feature_dir=/kaggle/input/birdclef-2025,train.dataset.train.list_path=dump/birdclef2025_reshape_5s/list/train.txt,train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025,train.dataset.validation.list_path=dump/birdclef2025_reshape_5s/list/validation.txt,train.output.exp_dir=./exp/20250428-032422,train.output.tensorboard_dir=./tensorboard/20250428-032422,train.resume.continue_from=,train=birdclef2025_reshape_efficientnet_b0
136
+ id: ???
137
+ num: ???
138
+ config_name: config
139
+ env_set: {}
140
+ env_copy: []
141
+ config:
142
+ override_dirname:
143
+ kv_sep: '='
144
+ item_sep: ','
145
+ exclude_keys: []
146
+ runtime:
147
+ version: 1.3.2
148
+ version_base: '1.2'
149
+ cwd: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0
150
+ config_sources:
151
+ - path: hydra.conf
152
+ schema: pkg
153
+ provider: hydra
154
+ - path: /usr/local/lib/python3.10/dist-packages/audyn/configs
155
+ schema: file
156
+ provider: main
157
+ - path: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0/conf
158
+ schema: file
159
+ provider: command-line
160
+ - path: ''
161
+ schema: structured
162
+ provider: schema
163
+ output_dir: /kaggle/working/BirdCLEF2025/recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/log/20250428-032425
164
+ choices:
165
+ criterion: birdclef2025_categorical_cross_entropy
166
+ lr_scheduler: none
167
+ optimizer: adam
168
+ model: birdclef2025_efficientnet_b0
169
+ test: default
170
+ test/dataloader: default
171
+ test/dataset: default
172
+ train: birdclef2025_reshape_efficientnet_b0
173
+ train/record: default
174
+ train/clip_gradient: default
175
+ train/dataloader: default
176
+ train/dataset: birdclef2025_primary-label
177
+ data: birdclef2025_reshape_5s
178
+ preprocess: birdclef2025
179
+ system: cuda
180
+ hydra/env: default
181
+ hydra/callbacks: null
182
+ hydra/job_logging: default
183
+ hydra/hydra_logging: default
184
+ hydra/hydra_help: default
185
+ hydra/help: default
186
+ hydra/sweeper: basic
187
+ hydra/launcher: basic
188
+ hydra/output: default
189
+ verbose: false
recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/log/20250428-032425/.hydra/overrides.yaml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - system=cuda
2
+ - preprocess=birdclef2025
3
+ - data=birdclef2025_reshape_5s
4
+ - train=birdclef2025_reshape_efficientnet_b0
5
+ - model=birdclef2025_efficientnet_b0
6
+ - optimizer=adam
7
+ - lr_scheduler=none
8
+ - criterion=birdclef2025_categorical_cross_entropy
9
+ - preprocess.dump_format=birdclef2025
10
+ - train.dataset.train.list_path=dump/birdclef2025_reshape_5s/list/train.txt
11
+ - train.dataset.train.feature_dir=/kaggle/input/birdclef-2025
12
+ - train.dataset.validation.list_path=dump/birdclef2025_reshape_5s/list/validation.txt
13
+ - train.dataset.validation.feature_dir=/kaggle/input/birdclef-2025
14
+ - train.resume.continue_from=
15
+ - train.output.exp_dir=./exp/20250428-032422
16
+ - train.output.tensorboard_dir=./tensorboard/20250428-032422
recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/log/20250428-032425/.hydra/resolved_config.yaml ADDED
@@ -0,0 +1,280 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ system:
2
+ seed: 0
3
+ distributed:
4
+ enable: null
5
+ nodes: null
6
+ nproc_per_node: null
7
+ backend: null
8
+ init_method: null
9
+ rdzv_id: null
10
+ rdzv_backend: null
11
+ rdzv_endpoint: null
12
+ max_restarts: null
13
+ cudnn:
14
+ benchmark: true
15
+ deterministic: false
16
+ amp:
17
+ enable: false
18
+ dtype: null
19
+ accelerator: cuda
20
+ compile:
21
+ enable: false
22
+ kwargs: null
23
+ preprocess:
24
+ dump_format: birdclef2025
25
+ list_path: null
26
+ wav_dir: null
27
+ feature_dir: null
28
+ max_workers: 2
29
+ max_shard_size: 1000000000
30
+ vad:
31
+ raw_root: null
32
+ trimmed_root: null
33
+ threshold: null
34
+ min_duration: 15
35
+ csv_path: ???
36
+ submission_path: ???
37
+ audio_root: ???
38
+ subset: ???
39
+ train_ratio: 0.8
40
+ data:
41
+ audio:
42
+ sample_rate: 32000
43
+ duration: 5
44
+ melspectrogram:
45
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
46
+ sample_rate: 32000
47
+ hop_length: 512
48
+ f_min: 20
49
+ f_max: 16000
50
+ pad: 0
51
+ n_mels: 128
52
+ window_fn:
53
+ _target_: torch.hann_window
54
+ _partial_: true
55
+ power: 1.0
56
+ normalized: false
57
+ wkwargs: null
58
+ center: true
59
+ pad_mode: constant
60
+ onesided: null
61
+ norm: slaney
62
+ mel_scale: slaney
63
+ take_log: true
64
+ freq_mask_param:
65
+ - 0.06
66
+ - 0.1
67
+ time_mask_param:
68
+ - 0.06
69
+ - 0.12
70
+ eps: null
71
+ train:
72
+ dataset:
73
+ train:
74
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
75
+ list_path: dump/birdclef2025_reshape_5s/list/train.txt
76
+ feature_dir: /kaggle/input/birdclef-2025
77
+ audio_key: audio
78
+ sample_rate_key: sample_rate
79
+ label_name_key: primary_label
80
+ filename_key: filename
81
+ validation:
82
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025PrimaryLabelDataset
83
+ list_path: dump/birdclef2025_reshape_5s/list/validation.txt
84
+ feature_dir: /kaggle/input/birdclef-2025
85
+ audio_key: audio
86
+ sample_rate_key: sample_rate
87
+ label_name_key: primary_label
88
+ filename_key: filename
89
+ dataloader:
90
+ train:
91
+ _target_: torch.utils.data.DataLoader
92
+ batch_size: 64
93
+ shuffle: true
94
+ collate_fn:
95
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineCollator
96
+ composer:
97
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025ReshapePrimaryLabelComposer
98
+ melspectrogram_transform:
99
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
100
+ sample_rate: 32000
101
+ hop_length: 512
102
+ f_min: 20
103
+ f_max: 16000
104
+ pad: 0
105
+ n_mels: 128
106
+ window_fn:
107
+ _target_: torch.hann_window
108
+ _partial_: true
109
+ power: 1.0
110
+ normalized: false
111
+ wkwargs: null
112
+ center: true
113
+ pad_mode: constant
114
+ onesided: null
115
+ norm: slaney
116
+ mel_scale: slaney
117
+ take_log: true
118
+ freq_mask_param:
119
+ - 0.06
120
+ - 0.1
121
+ time_mask_param:
122
+ - 0.06
123
+ - 0.12
124
+ eps: null
125
+ audio_key: audio
126
+ sample_rate_key: sample_rate
127
+ label_name_key: primary_label
128
+ filename_key: filename
129
+ waveform_key: waveform
130
+ melspectrogram_key: log_melspectrogram
131
+ label_index_key: label_index
132
+ sample_rate: 32000
133
+ duration: 5
134
+ decode_audio_as_waveform: true
135
+ decode_audio_as_monoral: true
136
+ training: true
137
+ target_shape: 256
138
+ melspectrogram_key: log_melspectrogram
139
+ label_index_key: label_index
140
+ alpha: 0.4
141
+ num_workers: 2
142
+ validation:
143
+ _target_: torch.utils.data.DataLoader
144
+ batch_size: 64
145
+ shuffle: false
146
+ collate_fn:
147
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025BaselineValidationCollator
148
+ composer:
149
+ _target_: birdclef2025.utils.data.birdclef.BirdCLEF2025ReshapePrimaryLabelComposer
150
+ melspectrogram_transform:
151
+ _target_: birdclef2025.transforms.birdclef.BirdCLEF2024BaselineMelSpectrogram
152
+ sample_rate: 32000
153
+ hop_length: 512
154
+ f_min: 20
155
+ f_max: 16000
156
+ pad: 0
157
+ n_mels: 128
158
+ window_fn:
159
+ _target_: torch.hann_window
160
+ _partial_: true
161
+ power: 1.0
162
+ normalized: false
163
+ wkwargs: null
164
+ center: true
165
+ pad_mode: constant
166
+ onesided: null
167
+ norm: slaney
168
+ mel_scale: slaney
169
+ take_log: true
170
+ freq_mask_param:
171
+ - 0.06
172
+ - 0.1
173
+ time_mask_param:
174
+ - 0.06
175
+ - 0.12
176
+ eps: null
177
+ audio_key: audio
178
+ sample_rate_key: sample_rate
179
+ label_name_key: primary_label
180
+ filename_key: filename
181
+ waveform_key: waveform
182
+ melspectrogram_key: log_melspectrogram
183
+ label_index_key: label_index
184
+ sample_rate: 32000
185
+ duration: 5
186
+ decode_audio_as_waveform: true
187
+ decode_audio_as_monoral: true
188
+ training: false
189
+ target_shape: 256
190
+ melspectrogram_key: log_melspectrogram
191
+ label_index_key: label_index
192
+ num_workers: 2
193
+ clip_gradient: {}
194
+ record: {}
195
+ trainer:
196
+ _target_: birdclef2025.utils.driver.BaseTrainer
197
+ key_mapping:
198
+ train:
199
+ input:
200
+ input: log_melspectrogram
201
+ output: logit
202
+ validation:
203
+ input:
204
+ input: log_melspectrogram
205
+ output: logit
206
+ inference:
207
+ input:
208
+ input: log_melspectrogram
209
+ output: logit
210
+ ddp_kwargs: null
211
+ resume:
212
+ continue_from: ''
213
+ output:
214
+ exp_dir: ./exp/20250428-032422
215
+ tensorboard_dir: ./tensorboard/20250428-032422
216
+ save_checkpoint:
217
+ iteration:
218
+ every: 1000
219
+ path: ./exp/20250428-032422/model/iteration{iteration}.pth
220
+ epoch:
221
+ every: 1
222
+ path: ./exp/20250428-032422/model/epoch{epoch}.pth
223
+ last:
224
+ path: ./exp/20250428-032422/model/last.pth
225
+ best_epoch:
226
+ path: ./exp/20250428-032422/model/best_epoch.pth
227
+ steps:
228
+ epochs: 10
229
+ iterations: null
230
+ lr_scheduler: epoch
231
+ test:
232
+ dataset:
233
+ test:
234
+ _target_: torch.utils.data.Dataset
235
+ dataloader:
236
+ test:
237
+ _target_: torch.utils.data.DataLoader
238
+ batch_size: 1
239
+ shuffle: false
240
+ key_mapping:
241
+ inference:
242
+ input: null
243
+ output: null
244
+ identifier: null
245
+ checkpoint: null
246
+ remove_weight_norm: null
247
+ output:
248
+ exp_dir: ./exp
249
+ inference_dir: ./exp/inference
250
+ audio:
251
+ sample_rate: 32000
252
+ key_mapping:
253
+ inference:
254
+ output: null
255
+ reference: null
256
+ transforms:
257
+ inference:
258
+ output: null
259
+ reference: null
260
+ ddp_kwargs: null
261
+ model:
262
+ _target_: birdclef2025.models.EfficientNetB0
263
+ weights: IMAGENET1K_V1
264
+ num_classes: 206
265
+ optimizer:
266
+ _target_: torch.optim.Adam
267
+ lr_scheduler: {}
268
+ criterion:
269
+ _target_: audyn.criterion.MultiCriteria
270
+ cross_entropy:
271
+ _target_: audyn.criterion.BaseCriterionWrapper
272
+ criterion:
273
+ _target_: torch.nn.CrossEntropyLoss
274
+ reduction: mean
275
+ weight: 1
276
+ key_mapping:
277
+ estimated:
278
+ input: logit
279
+ target:
280
+ target: label_index
recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/log/20250428-032425/train.log ADDED
The diff for this file is too large to render. See raw diff
 
recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/model/best_epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58a676b0a4caf0423c81870af00dfc88979e4f52eb499e25bc835d3dcb3ae709
3
+ size 51764965
recipes/BirdCLEF2025/EfficientNetB0/exp/20250428-032422/model/last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cf93364f17ff21617df6fee6c0ae03585377b160ee9e3b2e124ad19c20aef38
3
+ size 51716323
recipes/BirdCLEF2025/EfficientNetB0/exp/20250429-075315/README.md ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ system=default_seed-1
2
+ data=birdclef2025_reshape_15s
3
+ train=birdclef2025_reshape_efficientnet_b0
4
+ model=birdclef2025_efficientnet_b0
5
+ criterion=birdclef2025_categorical_cross_entropy
6
+
7
+ public_score: 0.515