BernardoTorres committed on Oct 13, 2025

Commit

5408758

verified ·

1 Parent(s): 4f561af

Upload folder using huggingface_hub

Files changed (20) hide show

0a3afbec_weights/autoencoder_inference_model_best.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:4311d9460c04b18acde791c4e3348f101e3d971cc78fd27729bbd90b4f145efd
+size 232976270

0a3afbec_weights/autoencoder_inference_model_last.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:60838454393ea3991c000d98c483303607888e7eac013b3d33f7402adea71b97
+size 232976270

0a3afbec_weights/diffusion_kwargs_best.yaml ADDED Viewed

+base_step: 0.1
+end_exp: 2.0
+p_mean: -1.1
+p_std: 2.0
+rho: 7.0
+schedule: exponential
+sigma_data: 0.5
+sigma_max: 80.0
+sigma_min: 0.002
+start_exp: 1.0
+total_iters: 800000
+use_lognormal: true

0a3afbec_weights/diffusion_kwargs_last.yaml ADDED Viewed

+base_step: 0.1
+end_exp: 2.0
+p_mean: -1.1
+p_std: 2.0
+rho: 7.0
+schedule: exponential
+sigma_data: 0.5
+sigma_max: 80.0
+sigma_min: 0.002
+start_exp: 1.0
+total_iters: 800000
+use_lognormal: true

0a3afbec_weights/encoder_inference_model_best.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:4402018f1ffb9ab261bf510fdc6f2d6743d700fc45c772ed8af9567d7157d26c
+size 65100948

0a3afbec_weights/encoder_inference_model_last.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e2ac2a3a9d61eef882dde6224a829b9b6802d543fdb5b50b378329f8cd9161d
+size 65100948

0a3afbec_weights/frontend_kwargs_best.yaml ADDED Viewed

+alpha_rescale: 0.65
+beta_rescale: 0.34
+hop_size: 512
+n_fft_factor: 4
+sample_rate: 44100

0a3afbec_weights/frontend_kwargs_last.yaml ADDED Viewed

+alpha_rescale: 0.65
+beta_rescale: 0.34
+hop_size: 512
+n_fft_factor: 4
+sample_rate: 44100

0a3afbec_weights/generator_kwargs_best.yaml ADDED Viewed

+attention_list:
+- 0
+- 0
+- 1
+- 1
+- 1
+attention_list_encoder:
+- 0
+- 0
+- 1
+- 1
+- 1
+base_channels: 64
+bottleneck_base_channels: 512
+bottleneck_channels: 64
+cond_channels: 256
+data_channels: 2
+dropout_rate: 0.0
+fourier_scale: 0.2
+freq_downsample_list:
+- 1
+- 0
+- 0
+- 0
+frequency_scaling: true
+heads: 4
+hop: 512
+init_as_zero: true
+layers_list:
+- 2
+- 2
+- 2
+- 2
+- 2
+layers_list_encoder:
+- 1
+- 1
+- 1
+- 1
+- 1
+min_res_dropout: 16
+multipliers_list:
+- 1
+- 2
+- 4
+- 4
+- 4
+normalization: true
+num_bottleneck_layers: 4
+pre_normalize_2d_to_1d: true
+pre_normalize_downsampling_encoder: true
+sigma_data: 0.5
+sigma_max: 80.0
+sigma_min: 0.002
+use_fourier: false

0a3afbec_weights/generator_kwargs_last.yaml ADDED Viewed

+attention_list:
+- 0
+- 0
+- 1
+- 1
+- 1
+attention_list_encoder:
+- 0
+- 0
+- 1
+- 1
+- 1
+base_channels: 64
+bottleneck_base_channels: 512
+bottleneck_channels: 64
+cond_channels: 256
+data_channels: 2
+dropout_rate: 0.0
+fourier_scale: 0.2
+freq_downsample_list:
+- 1
+- 0
+- 0
+- 0
+frequency_scaling: true
+heads: 4
+hop: 512
+init_as_zero: true
+layers_list:
+- 2
+- 2
+- 2
+- 2
+- 2
+layers_list_encoder:
+- 1
+- 1
+- 1
+- 1
+- 1
+min_res_dropout: 16
+multipliers_list:
+- 1
+- 2
+- 4
+- 4
+- 4
+normalization: true
+num_bottleneck_layers: 4
+pre_normalize_2d_to_1d: true
+pre_normalize_downsampling_encoder: true
+sigma_data: 0.5
+sigma_max: 80.0
+sigma_min: 0.002
+use_fourier: false

2f4c6d21_weights/autoencoder_inference_model_best.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c0b9e50868159aaa1c96c9b5471154b3e71719f3842e18220a5272dbe27f1274
+size 232976270

2f4c6d21_weights/autoencoder_inference_model_last.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8b817f4f63ad52ec84c36f0c2cb1bd6b3e8e5bc513124a08dcb1eb992bd0986
+size 232976270

2f4c6d21_weights/diffusion_kwargs_best.yaml ADDED Viewed

+base_step: 0.1
+end_exp: 2.0
+p_mean: -1.1
+p_std: 2.0
+rho: 7.0
+schedule: exponential
+sigma_data: 0.5
+sigma_max: 80.0
+sigma_min: 0.002
+start_exp: 1.0
+total_iters: 800000
+use_lognormal: true

2f4c6d21_weights/diffusion_kwargs_last.yaml ADDED Viewed

+base_step: 0.1
+end_exp: 2.0
+p_mean: -1.1
+p_std: 2.0
+rho: 7.0
+schedule: exponential
+sigma_data: 0.5
+sigma_max: 80.0
+sigma_min: 0.002
+start_exp: 1.0
+total_iters: 800000
+use_lognormal: true

2f4c6d21_weights/encoder_inference_model_best.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8c87fd5359299c1f423e331123cb346267a3a68881be3d4586a796d5fcf0b244
+size 65100948

2f4c6d21_weights/encoder_inference_model_last.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:44eaa9e4019aff4b940fec92fbed3d54c40694f66f3ea716d8e7da06d14b13e2
+size 65100948

2f4c6d21_weights/frontend_kwargs_best.yaml ADDED Viewed

+alpha_rescale: 0.65
+beta_rescale: 0.34
+hop_size: 512
+n_fft_factor: 4
+sample_rate: 44100

2f4c6d21_weights/frontend_kwargs_last.yaml ADDED Viewed

+alpha_rescale: 0.65
+beta_rescale: 0.34
+hop_size: 512
+n_fft_factor: 4
+sample_rate: 44100

2f4c6d21_weights/generator_kwargs_best.yaml ADDED Viewed

+attention_list:
+- 0
+- 0
+- 1
+- 1
+- 1
+attention_list_encoder:
+- 0
+- 0
+- 1
+- 1
+- 1
+base_channels: 64
+bottleneck_base_channels: 512
+bottleneck_channels: 64
+cond_channels: 256
+data_channels: 2
+dropout_rate: 0.0
+fourier_scale: 0.2
+freq_downsample_list:
+- 1
+- 0
+- 0
+- 0
+frequency_scaling: true
+heads: 4
+hop: 512
+init_as_zero: true
+layers_list:
+- 2
+- 2
+- 2
+- 2
+- 2
+layers_list_encoder:
+- 1
+- 1
+- 1
+- 1
+- 1
+min_res_dropout: 16
+multipliers_list:
+- 1
+- 2
+- 4
+- 4
+- 4
+normalization: true
+num_bottleneck_layers: 4
+pre_normalize_2d_to_1d: true
+pre_normalize_downsampling_encoder: true
+sigma_data: 0.5
+sigma_max: 80.0
+sigma_min: 0.002
+use_fourier: false

2f4c6d21_weights/generator_kwargs_last.yaml ADDED Viewed

+attention_list:
+- 0
+- 0
+- 1
+- 1
+- 1
+attention_list_encoder:
+- 0
+- 0
+- 1
+- 1
+- 1
+base_channels: 64
+bottleneck_base_channels: 512
+bottleneck_channels: 64
+cond_channels: 256
+data_channels: 2
+dropout_rate: 0.0
+fourier_scale: 0.2
+freq_downsample_list:
+- 1
+- 0
+- 0
+- 0
+frequency_scaling: true
+heads: 4
+hop: 512
+init_as_zero: true
+layers_list:
+- 2
+- 2
+- 2
+- 2
+- 2
+layers_list_encoder:
+- 1
+- 1
+- 1
+- 1
+- 1
+min_res_dropout: 16
+multipliers_list:
+- 1
+- 2
+- 4
+- 4
+- 4
+normalization: true
+num_bottleneck_layers: 4
+pre_normalize_2d_to_1d: true
+pre_normalize_downsampling_encoder: true
+sigma_data: 0.5
+sigma_max: 80.0
+sigma_min: 0.002
+use_fourier: false