AndreasXi committed on
Commit
64a4c0d
·
verified ·
1 Parent(s): 375d324

Upload folder using huggingface_hub

Browse files
Files changed (1) hide show
  1. tinymu.yaml +97 -0
tinymu.yaml ADDED
@@ -0,0 +1,97 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data:
2
+ train_json_files:
3
+ - data/MC/MusicCaps_train.json
4
+ - data/MC/LP_MusicCaps_MC_train.json
5
+ - data/MC/MusicCapsBinary.json
6
+ - data/MC/MusicCapsMCQ.json
7
+ - data/MC/MusicCapsDetailQA.json
8
+ - data/MC/MusicInstruct_train.json
9
+ - data/MC_NEW/MusicCapsMCQ.json
10
+ - data/MTT/LP_MusicCaps_MTT_train.json
11
+ - data/MTT/MTT_Binary.json
12
+ - data/MTT/MTT_MCQ.json
13
+ - data/MTT/OpenMU_MTT_train.json
14
+ - data/MTT_NEW/MTT_MCQ.json
15
+ - data/ASM_NEW/AudioSetMusicBinary.json
16
+ - data/ASM_NEW/AudioSetMusicMCQ.json
17
+ - data/ASM_NEW/AudioSetMusicQA.json
18
+ - data/ASM_NEW/Captioning.json
19
+ - data/FMA/FMA_Caption_Train.json
20
+ - data/FMA/FMA_QA_MIX.json
21
+ - data/FMA/FMA_QA_MIX_Part2.json
22
+ train_audio_dirs:
23
+ - ../../data/LP_MusicCaps_MC/Audio
24
+ - ../../data/LP_MusicCaps_MC/Audio
25
+ - ../../data/LP_MusicCaps_MC/Audio
26
+ - ../../data/LP_MusicCaps_MC/Audio
27
+ - ../../data/LP_MusicCaps_MC/Audio
28
+ - ../../data/LP_MusicCaps_MC/Audio
29
+ - ../../data/LP_MusicCaps_MC/Audio
30
+ - ../../data/LP_MusicCaps_MTT/Audio
31
+ - ../../data/LP_MusicCaps_MTT/Audio
32
+ - ../../data/LP_MusicCaps_MTT/Audio
33
+ - ../../data/LP_MusicCaps_MTT/Audio
34
+ - ../../data/LP_MusicCaps_MTT/Audio
35
+ - /apdcephfs_gy4/share_302507476/xiquanli/data/AudioSet/data/audio
36
+ - /apdcephfs_gy4/share_302507476/xiquanli/data/AudioSet/data/audio
37
+ - /apdcephfs_gy4/share_302507476/xiquanli/data/AudioSet/data/audio
38
+ - /apdcephfs_gy4/share_302507476/xiquanli/data/AudioSet/data/audio
39
+ - /apdcephfs_gy2/share_302507476/0_public_datasets/fma_dataset/fma_split_15s
40
+ - /apdcephfs_gy2/share_302507476/0_public_datasets/fma_dataset/fma_split_15s
41
+ - /apdcephfs_gy2/share_302507476/0_public_datasets/fma_dataset/fma_split_15s
42
+ val_json_files:
43
+ - data/captioning/MusicCaps_test.json
44
+ val_audio_dirs:
45
+ - ../../data/LP_MusicCaps_MC/Audio
46
+ sample_rate: 32000
47
+ max_length: 10
48
+ tokenizer_type: HuggingFaceTB/SmolLM2-135M
49
+ max_text_token_len: 129
50
+ batch_size: 16
51
+ num_workers: 8
52
+ wav_aug: false
53
+ model:
54
+ encoder:
55
+ audioenc_name: MATPAC
56
+ matpac_ckpt_path: ./weights/matpac_plus_as_48_1_map_enconly.pt
57
+ freeze: true
58
+ ds_rate: 1
59
+ c2l_first: true
60
+ wo_repeat: true
61
+ projector:
62
+ proj_name: linearprojector
63
+ d_in: 3840
64
+ d_h: 2048
65
+ d_out: 576
66
+ decoder:
67
+ textdec_name: HuggingFaceTB/SmolLM2-135M
68
+ max_text_token_len: 129
69
+ freeze: false
70
+ use_lora: false
71
+ lora_config:
72
+ r: 32
73
+ lora_alpha: 128
74
+ lora_dropout: 0.1
75
+ bias: none
76
+ target_modules:
77
+ - q_proj
78
+ - v_proj
79
+ model_type: m2t
80
+ training:
81
+ epochs: 3
82
+ clip_grad: 2
83
+ dropout: 0.2
84
+ seed: 42
85
+ device: cuda
86
+ validation_step: 3000
87
+ optim_args:
88
+ lr: 0.0001
89
+ warmup_steps: 0
90
+ scheduler: cosine
91
+ optimizer_name: adam
92
+ betas:
93
+ - 0.9
94
+ - 0.999
95
+ eps: 1.0e-08
96
+ momentum: 0.9
97
+ warmup_ratio: 0.05