lucasnewman committed on
Commit
8126572
·
verified ·
1 Parent(s): 3096256

Upload 3 files

Browse files
Files changed (3) hide show
  1. config.json +46 -0
  2. model.safetensors +3 -0
  3. pca_state.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "echo_tts",
3
+ "sample_rate": 44100,
4
+ "max_text_length": 768,
5
+ "max_speaker_latent_length": 6400,
6
+ "audio_downsample_factor": 2048,
7
+ "normalize_text": true,
8
+ "delete_blockwise_modules": false,
9
+ "pca_filename": "pca_state.safetensors",
10
+ "fish_codec_repo": "jordand/fish-s1-dac-min",
11
+ "model_path": "mlx_echo_tts_base",
12
+ "dit": {
13
+ "latent_size": 80,
14
+ "model_size": 2048,
15
+ "num_layers": 24,
16
+ "num_heads": 16,
17
+ "intermediate_size": 5888,
18
+ "norm_eps": 1e-05,
19
+ "text_vocab_size": 256,
20
+ "text_model_size": 1280,
21
+ "text_num_layers": 14,
22
+ "text_num_heads": 10,
23
+ "text_intermediate_size": 3328,
24
+ "speaker_patch_size": 4,
25
+ "speaker_model_size": 1280,
26
+ "speaker_num_layers": 14,
27
+ "speaker_num_heads": 10,
28
+ "speaker_intermediate_size": 3328,
29
+ "timestep_embed_size": 512,
30
+ "adaln_rank": 256
31
+ },
32
+ "sampler": {
33
+ "num_steps": 40,
34
+ "cfg_scale_text": 3.0,
35
+ "cfg_scale_speaker": 8.0,
36
+ "cfg_min_t": 0.5,
37
+ "cfg_max_t": 1.0,
38
+ "truncation_factor": null,
39
+ "rescale_k": null,
40
+ "rescale_sigma": null,
41
+ "speaker_kv_scale": null,
42
+ "speaker_kv_max_layers": null,
43
+ "speaker_kv_min_t": null,
44
+ "sequence_length": 640
45
+ }
46
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9581018e48dc91414dd290d349527e1bd8cac1cb5797ab4df1c1daa04f359a1
3
+ size 5601645999
pca_state.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64f6ca51a4afa9b0e48676dafb2c3190fdbff31fca5983b66f3210350bd8eec9
3
+ size 332044