{
  "model_type": "lna",
  "description": "Learning Noise Adapters (LNA) — SepFormer backbone pretrained on 10 noise types (Session 0)",
  "sepformer": {
    "N": 256,
    "L": 16,
    "B": 256,
    "H": 512,
    "num_layers": 8,
    "num_blocks": 2,
    "nhead": 8,
    "d_ffn": 1024,
    "dropout": 0.1,
    "causal": false
  },
  "adapter": {
    "bottleneck_dim": 1,
    "use_ffl_adapter": true,
    "use_mha_adapter": true,
    "activation": "relu",
    "init_scale": 0.01
  },
  "training": {
    "loss": "si_snr",
    "optimizer": "adam",
    "learning_rate": 0.00015,
    "pretrain_epochs": 40,
    "incremental_epochs": 20,
    "sample_rate": 8000
  },
  "session0_noises": [
    "babble", "buccaneer1", "buccaneer2", "destroyerengine",
    "factory1", "factory2", "hfchannel", "leopard", "pink", "white"
  ]
}