benghoula committed on
Commit
1616725
·
verified ·
1 Parent(s): a5f0e9f

Upload model

Browse files
Files changed (2) hide show
  1. config.json +5 -4
  2. model.safetensors +2 -2
config.json CHANGED
@@ -1,7 +1,8 @@
1
  {
 
2
  "activation_dropout": 0.1,
3
  "architectures": [
4
- "VitsModelForPreTraining"
5
  ],
6
  "attention_dropout": 0.1,
7
  "depth_separable_channels": 2,
@@ -51,7 +52,7 @@
51
  "noise_scale_duration": 0.8,
52
  "num_attention_heads": 2,
53
  "num_hidden_layers": 6,
54
- "num_speakers": 1,
55
  "posterior_encoder_num_wavenet_layers": 16,
56
  "prior_encoder_num_flows": 4,
57
  "prior_encoder_num_wavenet_layers": 4,
@@ -79,11 +80,11 @@
79
  ],
80
  "sampling_rate": 16000,
81
  "segment_size": 8192,
82
- "speaker_embedding_size": 0,
83
  "speaking_rate": 1.0,
84
  "spectrogram_bins": 513,
85
  "torch_dtype": "float32",
86
- "transformers_version": "4.43.3",
87
  "upsample_initial_channel": 512,
88
  "upsample_kernel_sizes": [
89
  16,
 
1
  {
2
+ "_name_or_path": "/home/adem/finetuned_tts_tn",
3
  "activation_dropout": 0.1,
4
  "architectures": [
5
+ "VitsModel"
6
  ],
7
  "attention_dropout": 0.1,
8
  "depth_separable_channels": 2,
 
52
  "noise_scale_duration": 0.8,
53
  "num_attention_heads": 2,
54
  "num_hidden_layers": 6,
55
+ "num_speakers": 8,
56
  "posterior_encoder_num_wavenet_layers": 16,
57
  "prior_encoder_num_flows": 4,
58
  "prior_encoder_num_wavenet_layers": 4,
 
80
  ],
81
  "sampling_rate": 16000,
82
  "segment_size": 8192,
83
+ "speaker_embedding_size": 256,
84
  "speaking_rate": 1.0,
85
  "spectrogram_bins": 513,
86
  "torch_dtype": "float32",
87
+ "transformers_version": "4.35.1",
88
  "upsample_initial_channel": 512,
89
  "upsample_kernel_sizes": [
90
  16,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0428f1a559b9eb1140f27dafb70b52964bf54eea7dee78cbf575f1db73fb306d
3
- size 332161480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af1d78e621e71416a1241b32bd65221a0889c57bcbf53943e69314dc6ca733a5
3
+ size 158647032