Chebukkk
/

mansi-xttsv2

Model card Files and versions

Chebukkk committed on Oct 7, 2025

Commit

ab185af

·

verified ·

1 Parent(s): 0eab8a7

Upload config.json

Files changed (1) hide show

config.json +81 -0

config.json ADDED Viewed

	@@ -0,0 +1,81 @@

+{
+  "model_type": "xtts",
+  "audio": {
+    "sample_rate": 22050,
+    "output_sample_rate": 24000,
+    "dvae_sample_rate": 22050
+  },
+  "model_args": {
+    "gpt_batch_size": 1,
+    "enable_redaction": false,
+    "kv_cache": true,
+    "gpt_checkpoint": "model.pth",
+    "clvp_checkpoint": null,
+    "decoder_checkpoint": null,
+    "num_chars": 255,
+    "tokenizer_file": "vocab.json",
+    "gpt_max_audio_tokens": 605,
+    "gpt_max_text_tokens": 402,
+    "gpt_max_prompt_tokens": 70,
+    "gpt_layers": 30,
+    "gpt_n_model_channels": 1024,
+    "gpt_n_heads": 16,
+    "gpt_number_text_tokens": 8456,
+    "gpt_start_text_token": 261,
+    "gpt_stop_text_token": 0,
+    "gpt_num_audio_tokens": 1026,
+    "gpt_start_audio_token": 1024,
+    "gpt_stop_audio_token": 1025,
+    "gpt_code_stride_len": 1024,
+    "gpt_use_masking_gt_prompt_approach": true,
+    "gpt_use_perceiver_resampler": true,
+    "input_sample_rate": 22050,
+    "output_sample_rate": 24000,
+    "output_hop_length": 256,
+    "decoder_input_dim": 1024,
+    "d_vector_dim": 512,
+    "cond_d_vector_in_each_upsampling_layer": true,
+    "duration_const": 102400,
+    "min_conditioning_length": 11025,
+    "max_conditioning_length": 132300,
+    "gpt_loss_text_ce_weight": 0.01,
+    "gpt_loss_mel_ce_weight": 1.0,
+    "debug_loading_failures": false,
+    "max_wav_length": 330750,
+    "max_text_length": 400,
+    "mel_norm_file": "mel_stats.pth",
+    "dvae_checkpoint": "dvae.pth",
+    "xtts_checkpoint": "model.pth",
+    "vocoder": ""
+  },
+  "languages": [
+    "en",
+    "es",
+    "fr",
+    "de",
+    "it",
+    "pt",
+    "pl",
+    "tr",
+    "ru",
+    "nl",
+    "cs",
+    "ar",
+    "zh-cn",
+    "hu",
+    "ko",
+    "ja",
+    "hi",
+    "mns"
+  ],
+  "temperature": 0.75,
+  "length_penalty": 1.0,
+  "repetition_penalty": 5.0,
+  "top_k": 50,
+  "top_p": 0.85,
+  "num_gpt_outputs": 1,
+  "gpt_cond_len": 30,
+  "gpt_cond_chunk_len": 4,
+  "max_ref_len": 30,
+  "sound_norm_refs": false
+}