{ "latent_dim": 256, "n_pitches": 88, "seg_frames": 32, "pitch_min": 21, "pitch_max": 108, "architecture": "CNN-VAE" }