benjamin-paine committed on
Commit
ddfdb79
·
verified ·
1 Parent(s): a4855ff

Delete speech-synthesis-xtts-v2.py

Browse files
Files changed (1) hide show
  1. speech-synthesis-xtts-v2.py +0 -163
speech-synthesis-xtts-v2.py DELETED
@@ -1,163 +0,0 @@
1
- return {
2
- "config": XttsConfig(
3
- output_path="output",
4
- logger_uri=None,
5
- run_name="run",
6
- project_name=None,
7
- run_description="🐸Coqui trainer run.",
8
- print_step=25,
9
- plot_step=100,
10
- model_param_stats=False,
11
- wandb_entity=None,
12
- dashboard_logger="tensorboard",
13
- save_on_interrupt=True,
14
- log_model_step=None,
15
- save_step=10000,
16
- save_n_checkpoints=5,
17
- save_checkpoints=True,
18
- save_all_best=False,
19
- save_best_after=10000,
20
- target_loss=None,
21
- print_eval=False,
22
- test_delay_epochs=0,
23
- run_eval=True,
24
- run_eval_steps=None,
25
- distributed_backend="nccl",
26
- distributed_url="tcp://localhost:54321",
27
- mixed_precision=False,
28
- precision="fp16",
29
- epochs=1000,
30
- batch_size=32,
31
- eval_batch_size=16,
32
- grad_clip=0.0,
33
- scheduler_after_epoch=True,
34
- lr=0.001,
35
- optimizer="radam",
36
- optimizer_params=None,
37
- lr_scheduler=None,
38
- lr_scheduler_params={},
39
- use_grad_scaler=False,
40
- allow_tf32=False,
41
- cudnn_enable=True,
42
- cudnn_deterministic=False,
43
- cudnn_benchmark=False,
44
- training_seed=54321,
45
- model="xtts",
46
- num_loader_workers=0,
47
- num_eval_loader_workers=0,
48
- use_noise_augment=False,
49
- audio=XttsAudioConfig(sample_rate=22050, output_sample_rate=24000),
50
- use_phonemes=False,
51
- phonemizer=None,
52
- phoneme_language=None,
53
- compute_input_seq_cache=False,
54
- text_cleaner=None,
55
- enable_eos_bos_chars=False,
56
- test_sentences_file="",
57
- phoneme_cache_path=None,
58
- characters=None,
59
- add_blank=False,
60
- batch_group_size=0,
61
- loss_masking=None,
62
- min_audio_len=1,
63
- max_audio_len=inf,
64
- min_text_len=1,
65
- max_text_len=inf,
66
- compute_f0=False,
67
- compute_energy=False,
68
- compute_linear_spec=False,
69
- precompute_num_workers=0,
70
- start_by_longest=False,
71
- shuffle=False,
72
- drop_last=False,
73
- datasets=[
74
- BaseDatasetConfig(
75
- formatter="",
76
- dataset_name="",
77
- path="",
78
- meta_file_train="",
79
- ignored_speakers=None,
80
- language="",
81
- phonemizer="",
82
- meta_file_val="",
83
- meta_file_attn_mask="",
84
- )
85
- ],
86
- test_sentences=[],
87
- eval_split_max_size=None,
88
- eval_split_size=0.01,
89
- use_speaker_weighted_sampler=False,
90
- speaker_weighted_sampler_alpha=1.0,
91
- use_language_weighted_sampler=False,
92
- language_weighted_sampler_alpha=1.0,
93
- use_length_weighted_sampler=False,
94
- length_weighted_sampler_alpha=1.0,
95
- model_args=XttsArgs(
96
- gpt_batch_size=1,
97
- enable_redaction=False,
98
- kv_cache=True,
99
- gpt_checkpoint=None,
100
- clvp_checkpoint=None,
101
- decoder_checkpoint=None,
102
- num_chars=255,
103
- tokenizer_file="",
104
- gpt_max_audio_tokens=605,
105
- gpt_max_text_tokens=402,
106
- gpt_max_prompt_tokens=70,
107
- gpt_layers=30,
108
- gpt_n_model_channels=1024,
109
- gpt_n_heads=16,
110
- gpt_number_text_tokens=6681,
111
- gpt_start_text_token=None,
112
- gpt_stop_text_token=None,
113
- gpt_num_audio_tokens=1026,
114
- gpt_start_audio_token=1024,
115
- gpt_stop_audio_token=1025,
116
- gpt_code_stride_len=1024,
117
- gpt_use_masking_gt_prompt_approach=True,
118
- gpt_use_perceiver_resampler=True,
119
- input_sample_rate=22050,
120
- output_sample_rate=24000,
121
- output_hop_length=256,
122
- decoder_input_dim=1024,
123
- d_vector_dim=512,
124
- cond_d_vector_in_each_upsampling_layer=True,
125
- duration_const=102400,
126
- ),
127
- model_dir=None,
128
- languages=[
129
- "en",
130
- "es",
131
- "fr",
132
- "de",
133
- "it",
134
- "pt",
135
- "pl",
136
- "tr",
137
- "ru",
138
- "nl",
139
- "cs",
140
- "ar",
141
- "zh-cn",
142
- "hu",
143
- "ko",
144
- "ja",
145
- "hi",
146
- ],
147
- temperature=0.75,
148
- length_penalty=1.0,
149
- repetition_penalty=5.0,
150
- top_k=50,
151
- top_p=0.85,
152
- num_gpt_outputs=1,
153
- gpt_cond_len=30,
154
- gpt_cond_chunk_len=4,
155
- max_ref_len=30,
156
- sound_norm_refs=False,
157
- ),
158
- "scaler": None,
159
- "optimizer": None,
160
- "step": 10000000,
161
- "date": "2021-10-20 12:00:00",
162
- "model_loss": None,
163
- }