andrewqin committed (verified)
Commit 1431c8f · Parent(s): b73ec4e

Upload LoRA adapter

Files changed (1):
  1. adapter_config.json +144 -0
adapter_config.json ADDED
@@ -0,0 +1,144 @@
+{
+  "alpha_pattern": {},
+  "auto_mapping": null,
+  "base_model_name_or_path": "meta-llama/Llama-3.1-8B-Instruct",
+  "bias": "none",
+  "corda_config": null,
+  "eva_config": null,
+  "exclude_modules": null,
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layer_replication": null,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "loftq_config": {},
+  "lora_alpha": 64,
+  "lora_bias": false,
+  "lora_dropout": 0.05,
+  "megatron_config": null,
+  "megatron_core": "megatron.core",
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 32,
+  "rank_pattern": {},
+  "revision": null,
+  "target_modules": [
+    "model.layers.20.self_attn.q_proj",
+    "model.layers.19.mlp.down_proj",
+    "model.layers.24.mlp.down_proj",
+    "model.layers.22.mlp.down_proj",
+    "model.layers.16.mlp.gate_proj",
+    "model.layers.24.self_attn.v_proj",
+    "model.layers.28.mlp.up_proj",
+    "model.layers.28.self_attn.v_proj",
+    "model.layers.23.mlp.up_proj",
+    "model.layers.27.self_attn.k_proj",
+    "model.layers.23.self_attn.v_proj",
+    "model.layers.25.self_attn.o_proj",
+    "model.layers.19.self_attn.q_proj",
+    "model.layers.28.self_attn.k_proj",
+    "model.layers.20.self_attn.k_proj",
+    "model.layers.25.self_attn.v_proj",
+    "model.layers.18.self_attn.o_proj",
+    "model.layers.23.mlp.down_proj",
+    "model.layers.21.self_attn.k_proj",
+    "model.layers.22.mlp.up_proj",
+    "model.layers.22.self_attn.o_proj",
+    "model.layers.26.mlp.up_proj",
+    "model.layers.17.self_attn.v_proj",
+    "model.layers.20.self_attn.v_proj",
+    "model.layers.20.self_attn.o_proj",
+    "model.layers.23.self_attn.q_proj",
+    "model.layers.19.mlp.gate_proj",
+    "model.layers.24.self_attn.q_proj",
+    "model.layers.26.self_attn.o_proj",
+    "model.layers.30.self_attn.v_proj",
+    "model.layers.18.mlp.down_proj",
+    "model.layers.24.self_attn.o_proj",
+    "model.layers.19.self_attn.k_proj",
+    "model.layers.24.mlp.up_proj",
+    "model.layers.16.mlp.up_proj",
+    "model.layers.19.mlp.up_proj",
+    "model.layers.20.mlp.down_proj",
+    "model.layers.26.self_attn.v_proj",
+    "model.layers.29.self_attn.q_proj",
+    "model.layers.17.mlp.up_proj",
+    "model.layers.20.mlp.up_proj",
+    "model.layers.18.self_attn.v_proj",
+    "model.layers.21.mlp.up_proj",
+    "model.layers.29.mlp.up_proj",
+    "model.layers.30.mlp.gate_proj",
+    "model.layers.21.mlp.gate_proj",
+    "model.layers.27.mlp.gate_proj",
+    "model.layers.28.mlp.gate_proj",
+    "model.layers.26.self_attn.q_proj",
+    "model.layers.30.mlp.up_proj",
+    "model.layers.20.mlp.gate_proj",
+    "model.layers.31.mlp.up_proj",
+    "model.layers.28.self_attn.o_proj",
+    "model.layers.16.self_attn.k_proj",
+    "model.layers.25.mlp.up_proj",
+    "model.layers.22.self_attn.v_proj",
+    "model.layers.29.mlp.down_proj",
+    "model.layers.30.self_attn.q_proj",
+    "model.layers.17.self_attn.o_proj",
+    "model.layers.25.mlp.down_proj",
+    "model.layers.17.mlp.down_proj",
+    "model.layers.23.self_attn.k_proj",
+    "model.layers.23.self_attn.o_proj",
+    "model.layers.24.self_attn.k_proj",
+    "model.layers.23.mlp.gate_proj",
+    "model.layers.25.self_attn.k_proj",
+    "model.layers.31.self_attn.q_proj",
+    "model.layers.27.mlp.down_proj",
+    "model.layers.21.self_attn.q_proj",
+    "model.layers.26.mlp.gate_proj",
+    "model.layers.16.self_attn.q_proj",
+    "model.layers.27.self_attn.o_proj",
+    "model.layers.29.mlp.gate_proj",
+    "model.layers.28.mlp.down_proj",
+    "model.layers.22.self_attn.k_proj",
+    "model.layers.27.mlp.up_proj",
+    "model.layers.16.mlp.down_proj",
+    "model.layers.26.self_attn.k_proj",
+    "model.layers.17.mlp.gate_proj",
+    "model.layers.21.self_attn.v_proj",
+    "model.layers.27.self_attn.v_proj",
+    "model.layers.18.self_attn.k_proj",
+    "model.layers.19.self_attn.o_proj",
+    "model.layers.17.self_attn.k_proj",
+    "model.layers.21.mlp.down_proj",
+    "model.layers.17.self_attn.q_proj",
+    "model.layers.29.self_attn.v_proj",
+    "model.layers.31.self_attn.v_proj",
+    "model.layers.31.self_attn.k_proj",
+    "model.layers.31.self_attn.o_proj",
+    "model.layers.18.mlp.up_proj",
+    "model.layers.27.self_attn.q_proj",
+    "model.layers.26.mlp.down_proj",
+    "model.layers.30.self_attn.o_proj",
+    "model.layers.21.self_attn.o_proj",
+    "model.layers.19.self_attn.v_proj",
+    "model.layers.29.self_attn.k_proj",
+    "model.layers.24.mlp.gate_proj",
+    "model.layers.25.mlp.gate_proj",
+    "model.layers.22.self_attn.q_proj",
+    "model.layers.16.self_attn.o_proj",
+    "model.layers.30.self_attn.k_proj",
+    "model.layers.31.mlp.down_proj",
+    "model.layers.30.mlp.down_proj",
+    "model.layers.25.self_attn.q_proj",
+    "model.layers.18.mlp.gate_proj",
+    "model.layers.22.mlp.gate_proj",
+    "model.layers.31.mlp.gate_proj",
+    "model.layers.18.self_attn.q_proj",
+    "model.layers.28.self_attn.q_proj",
+    "model.layers.16.self_attn.v_proj",
+    "model.layers.29.self_attn.o_proj"
+  ],
+  "task_type": "CAUSAL_LM",
+  "trainable_token_indices": null,
+  "use_dora": false,
+  "use_rslora": false
+}
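For context, a minimal sketch of how this config is consumed at inference time with the peft library. The base model id comes from base_model_name_or_path above; the adapter path is a placeholder, since the commit does not show the repo id. Note the effective LoRA scaling here is lora_alpha / r = 64 / 32 = 2, and the 112 target modules cover all seven attention and MLP projections (q/k/v/o, gate/up/down) in layers 16-31 only.

```python
# Minimal sketch: loading this adapter with peft (path is a placeholder).
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer
from peft import PeftModel

base_id = "meta-llama/Llama-3.1-8B-Instruct"  # from base_model_name_or_path
adapter_path = "./lora-adapter"  # placeholder: directory holding adapter_config.json + weights

tokenizer = AutoTokenizer.from_pretrained(base_id)
base = AutoModelForCausalLM.from_pretrained(base_id, torch_dtype=torch.bfloat16)

# PeftModel reads adapter_config.json and injects rank-32 LoRA matrices
# (scaled by lora_alpha / r = 2) into the 112 listed projections,
# all of which sit in the upper half of the network (layers 16-31).
model = PeftModel.from_pretrained(base, adapter_path)
model.eval()  # the config sets inference_mode: true
```

Restricting the adapter to layers 16-31 halves the number of trainable matrices relative to targeting every layer, a common choice when the adaptation is expected to affect higher-level behavior rather than low-level token processing.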