audio-spatializer / config.json
soundsol's picture
Upload config.json with huggingface_hub
5b3d971 verified
{
"model_type": "audio-spatializer",
"architecture": "CrossAttnSpatializer",
"sample_rate": 24000,
"n_fft": 1024,
"hop_length": 512,
"n_mels": 128,
"audio_embed_dim": 512,
"text_embed_dim": 512,
"nhead": 8,
"num_layers": 6,
"output_channels": 4,
"output_format": "foa",
"training": {
"framework": "pytorch-lightning",
"final_epoch": 14,
"final_step": 342,
"checkpoint": "epoch=14-step=342.ckpt"
},
"spatial_parameters": {
"direction": ["front", "front-left", "left", "back-left", "back", "back-right", "right", "front-right"],
"elevation": ["down", "level", "up"],
"distance": ["near", "mid", "far"],
"room_size": ["small", "medium", "large"],
"reverb": ["dry", "medium", "wet"]
}
}