drakrig committed on
Commit
3d9d4f7
·
verified ·
1 Parent(s): 40bf866

Re-upload v3s weight and config

Browse files

v3s architecture with a Conv1d projection (16 output channels) and GELU activation

scorer_v3s_16_final/configs/vad_train_config.yaml ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ batch_size: 128
2
+ epochs: 20
3
+ learning_rate: 0.00001
4
+ weight_decay: 0.01
5
+
6
+ is_half: false
7
+ num_workers: 8
8
+ pin_memory: true
9
+
10
+ mel_encoder_path: /mnt/ML/models/GPT-SoVITS/vad_specific/ref_enc.pth
11
+ mel_encoder_sr: 32000
12
+ filter_length: 2048
13
+ gin_channels: 1024
14
+ hop_length: 640
15
+ projection_weights_path: /mnt/ML/models/GPT-SoVITS/vad_specific/linear_proj.pth
16
+ prelu_weights_path : /mnt/ML/models/GPT-SoVITS/vad_specific/prelu.pth
17
+ sv_model_path: /mnt/ML/models/GPT-SoVITS/sv/pretrained_eres2netv2w24s4ep4.ckpt
18
+ sv_model_sr: 16000
19
+ use_sv: true
20
+ win_length: 2048
21
+
22
+ shuffle: true
23
+ data_dir: /mnt/ML/Datasets/laions_got_talent_enhanced_flash_annotations_and_long_captions/extracted_audio/
24
+ annotations_file: vad_descriptions_resampled_normalized_v3.csv
25
+ test_size: 10000
26
+ limit_train_samples: -1
27
+ min_samples_threshold: -1
28
+ random_state: 42
29
+
30
+ save_dir: /mnt/ML/models/GPT-SoVITS/vad_specific/vad_scoring_model/scorer/
31
+ save_interval_epoch: 1
32
+ logging_interval: 100
33
+ save_interval_steps: -1
34
+
35
+ model_version: v3s
36
+ model_id: mkrausio/EmoWhisper-AnS-Small-v0.1
37
+ out_channels: 16
38
+
39
+ kl_cycle_length: 1
40
+ kl_max_weight: 1
41
+ kl_min_weight: 1
42
+ mean_loss_weight: 1.0
43
+
44
+ loss_type: kl
scorer_v3s_16_final/vad_model_epoch_10_step_62960.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c35a33c5f7979d94f9b36fb71d5ddae7bdd09c81778a0bb0c710b78a8641b0e9
3
+ size 98373932