Update config.json
Browse files - config.json +3 -3
config.json
CHANGED
|
@@ -45,7 +45,7 @@
|
|
| 45 |
"latent_dim": 128,
|
| 46 |
"downsampling_ratio": 480,
|
| 47 |
"sample_rate": 24000,
|
| 48 |
-
"pretrained_ckpt": "/
|
| 49 |
"bottleneck": {
|
| 50 |
"_target_": "models.autoencoder.waveform.stable_vae.VAEBottleneck"
|
| 51 |
}
|
|
@@ -90,11 +90,11 @@
|
|
| 90 |
"_target_": "models.content_encoder.caption_encoder.ContentEncoder",
|
| 91 |
"text_encoder": {
|
| 92 |
"_target_": "models.content_encoder.text_encoder.T5TextEncoder",
|
| 93 |
-
"model_name": "/
|
| 94 |
}
|
| 95 |
},
|
| 96 |
"frame_resolution": 0.005,
|
| 97 |
-
"noise_scheduler_name": "
|
| 98 |
"snr_gamma": 5.0,
|
| 99 |
"classifier_free_guidance": true,
|
| 100 |
"cfg_drop_ratio": 0.2,
|
|
|
|
| 45 |
"latent_dim": 128,
|
| 46 |
"downsampling_ratio": 480,
|
| 47 |
"sample_rate": 24000,
|
| 48 |
+
"pretrained_ckpt": "ezaudio_vae/1m.pt",
|
| 49 |
"bottleneck": {
|
| 50 |
"_target_": "models.autoencoder.waveform.stable_vae.VAEBottleneck"
|
| 51 |
}
|
|
|
|
| 90 |
"_target_": "models.content_encoder.caption_encoder.ContentEncoder",
|
| 91 |
"text_encoder": {
|
| 92 |
"_target_": "models.content_encoder.text_encoder.T5TextEncoder",
|
| 93 |
+
"model_name": "google/flan-t5-large"
|
| 94 |
}
|
| 95 |
},
|
| 96 |
"frame_resolution": 0.005,
|
| 97 |
+
"noise_scheduler_name": "stabilityai-stable-diffusion-2-1",
|
| 98 |
"snr_gamma": 5.0,
|
| 99 |
"classifier_free_guidance": true,
|
| 100 |
"cfg_drop_ratio": 0.2,
|