ZDisket committed on
Commit
9c95d02
·
verified ·
1 Parent(s): 47ca3e1

Upload 4 files

Browse files
checkpoint_epoch_016.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cee00ed28f365839855dfcd954a671d96ab65dfd3848b69e021f890e7be3e13
3
+ size 565705894
torchscript/model_config.yaml ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ # Configuration for MQGAN training
3
+
4
+ project_name: "MQGAN"
5
+
6
+ data:
7
+ data_dir: '../hifispeech4_CORS'
8
+ output_dir: 'logs/mqgan_speech4_varcrop_newd'
9
+ validation_split: 0.02
10
+ crop_len: [256, 192, 128]
11
+ batch_size: 16
12
+ num_workers: 0
13
+
14
+ model:
15
+ mel_channels: 128 # Number of mel frequency channels
16
+ generator:
17
+ channels: [512, 512, 512, 768]
18
+ kernel_sizes: [3, 3, 5, 7]
19
+ dropout: 0.1
20
+ fsq_levels: [8, 5, 5, 5]
21
+ refiner_base_channels: 64
22
+ refiner_depth: 3
23
+ discriminator_patch:
24
+ hidden_channels: [256, 256, 384, 512, 512]
25
+ kernel_sizes: [5, 5, 5, 3, 3, 3]
26
+ strides: [[1,2], [2,2], [2,2], [2,1], [2,1], [2,1]]
27
+ discriminator_multibin:
28
+ hidden_channels: [128, 128, 256, 256, 384]
29
+ kernel_sizes: [7, 5, 3, 3, 3, 3]
30
+ n_bins: 8
31
+ n_no_strides: 2
32
+
33
+ training:
34
+ num_epochs: 1000
35
+ lr: 0.0001
36
+ beta1: 0.9
37
+ beta2: 0.999
38
+ lr_d_factor: 1.15
39
+ d_beta1: 0.5
40
+ d_beta2: 0.999
41
+ warmup_steps: 1000
42
+ discriminator_train_start_epoch: 10
43
+ loss_weights:
44
+ fm_lambda: 0.25
45
+ Gloss_lambda: 15.0
46
+ recon_lambda: 15.0
47
+ use_fm_loss: False
48
+ seed: 42
49
+ no_cuda: False
50
+ pretrained: null # path to pretrained model, or null
51
+
52
+ logging:
53
+ eval_interval: 2
54
+ save_interval: 2
55
+ num_plot_examples: 10
56
+ wandb:
57
+ entity: null # Your wandb entity
58
+ project: "MQGAN"
torchscript/model_cpu.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbb9e707d46c74c2bae749098eefce5948a8fb074a12dbac293ba0ceb7fba0e6
3
+ size 122733945
torchscript/model_cuda.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32957f617e363ab6dd4754c1aef7cfd51291b8d20b343b6c315fd53a8773be8f
3
+ size 122755366