valhalla committed on
Commit
2dade0b
·
1 Parent(s): 495f99a

add model

Browse files
model_index.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "GradTTS",
3
+ "_diffusers_version": "0.0.3",
4
+ "_module": "pipeline_grad_tts",
5
+ "noise_scheduler": [
6
+ "diffusers",
7
+ "GradTTSScheduler"
8
+ ],
9
+ "text_encoder": [
10
+ "pipeline_grad_tts",
11
+ "TextEncoder"
12
+ ],
13
+ "tokenizer": [
14
+ "grad_tts_utils",
15
+ "GradTTSTokenizer"
16
+ ],
17
+ "unet": [
18
+ "diffusers",
19
+ "UNetGradTTSModel"
20
+ ]
21
+ }
noise_scheduler/scheduler_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "GradTTSScheduler",
3
+ "_diffusers_version": "0.0.3",
4
+ "beta_end": 20.0,
5
+ "beta_start": 0.05,
6
+ "timesteps": 50
7
+ }
text_encoder/config.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "TextEncoder",
3
+ "_diffusers_version": "0.0.3",
4
+ "filter_channels": 768,
5
+ "filter_channels_dp": 256,
6
+ "kernel_size": 3,
7
+ "n_channels": 192,
8
+ "n_feats": 80,
9
+ "n_heads": 2,
10
+ "n_layers": 6,
11
+ "n_spks": 1,
12
+ "n_vocab": 149,
13
+ "name_or_path": "grad-tts/text_encoder",
14
+ "p_dropout": 0.1,
15
+ "spk_emb_dim": 64,
16
+ "window_size": 4
17
+ }
text_encoder/diffusion_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00f47ce1fe4f1f2eee3b3f3716d0382bbfc8c56708887f721a44ff4944cb88f3
3
+ size 28845619
tokenizer/dict_file.txt ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {}
tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "name_or_path": "grad-tts/tokenizer",
3
+ "special_tokens_map_file": "./grad-tts-tokenizer/special_tokens_map.json",
4
+ "tokenizer_class": "GradTTSTokenizer"
5
+ }
unet/config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNetGradTTSModel",
3
+ "_diffusers_version": "0.0.3",
4
+ "dim": 64,
5
+ "dim_mults": [
6
+ 1,
7
+ 2,
8
+ 4
9
+ ],
10
+ "groups": 8,
11
+ "n_feats": 80,
12
+ "n_spks": 247,
13
+ "name_or_path": "grad-tts/unet",
14
+ "pe_scale": 1000,
15
+ "spk_emb_dim": 64
16
+ }
unet/diffusion_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df39c3b01dbc76477f61a5403663a00df92e9c26cbbd6974fce3e8801a5084e4
3
+ size 30816799