{
  "model": {
    "sampling_rate": 44100,
    "block_size": 512,
    "hidden_size": 128,
    "num_layers": 8,
    "spk_embed_dim": 256
  },
  "dataset": {
    "train_path": "dataset/44k/voice_sample",
    "val_path": "dataset/44k/voice_sample"
  }
}
{
  "model": {
    "sampling_rate": 44100,
    "block_size": 512,
    "hidden_size": 128,
    "num_layers": 8,
    "spk_embed_dim": 256
  },
  "dataset": {
    "train_path": "dataset/44k/voice_sample",
    "val_path": "dataset/44k/voice_sample"
  }
}