Files changed (1) hide show
  1. config.json +3 -124
config.json CHANGED
@@ -35,130 +35,9 @@
35
  "quantization_config": {
36
  "algo_config": null,
37
  "exclude": [
38
- "model.layers.0.self_attn.indexer.weights_proj.weight",
39
- "model.layers.1.self_attn.indexer.weights_proj.weight",
40
- "model.layers.2.self_attn.indexer.weights_proj.weight",
41
- "model.layers.3.self_attn.indexer.weights_proj.weight",
42
- "model.layers.4.self_attn.indexer.weights_proj.weight",
43
- "model.layers.5.self_attn.indexer.weights_proj.weight",
44
- "model.layers.6.self_attn.indexer.weights_proj.weight",
45
- "model.layers.7.self_attn.indexer.weights_proj.weight",
46
- "model.layers.8.self_attn.indexer.weights_proj.weight",
47
- "model.layers.9.self_attn.indexer.weights_proj.weight",
48
- "model.layers.10.self_attn.indexer.weights_proj.weight",
49
- "model.layers.11.self_attn.indexer.weights_proj.weight",
50
- "model.layers.12.self_attn.indexer.weights_proj.weight",
51
- "model.layers.13.self_attn.indexer.weights_proj.weight",
52
- "model.layers.14.self_attn.indexer.weights_proj.weight",
53
- "model.layers.15.self_attn.indexer.weights_proj.weight",
54
- "model.layers.16.self_attn.indexer.weights_proj.weight",
55
- "model.layers.17.self_attn.indexer.weights_proj.weight",
56
- "model.layers.18.self_attn.indexer.weights_proj.weight",
57
- "model.layers.19.self_attn.indexer.weights_proj.weight",
58
- "model.layers.20.self_attn.indexer.weights_proj.weight",
59
- "model.layers.21.self_attn.indexer.weights_proj.weight",
60
- "model.layers.22.self_attn.indexer.weights_proj.weight",
61
- "model.layers.23.self_attn.indexer.weights_proj.weight",
62
- "model.layers.24.self_attn.indexer.weights_proj.weight",
63
- "model.layers.25.self_attn.indexer.weights_proj.weight",
64
- "model.layers.26.self_attn.indexer.weights_proj.weight",
65
- "model.layers.27.self_attn.indexer.weights_proj.weight",
66
- "model.layers.28.self_attn.indexer.weights_proj.weight",
67
- "model.layers.29.self_attn.indexer.weights_proj.weight",
68
- "model.layers.30.self_attn.indexer.weights_proj.weight",
69
- "model.layers.31.self_attn.indexer.weights_proj.weight",
70
- "model.layers.32.self_attn.indexer.weights_proj.weight",
71
- "model.layers.33.self_attn.indexer.weights_proj.weight",
72
- "model.layers.34.self_attn.indexer.weights_proj.weight",
73
- "model.layers.35.self_attn.indexer.weights_proj.weight",
74
- "model.layers.36.self_attn.indexer.weights_proj.weight",
75
- "model.layers.37.self_attn.indexer.weights_proj.weight",
76
- "model.layers.38.self_attn.indexer.weights_proj.weight",
77
- "model.layers.39.self_attn.indexer.weights_proj.weight",
78
- "model.layers.40.self_attn.indexer.weights_proj.weight",
79
- "model.layers.41.self_attn.indexer.weights_proj.weight",
80
- "model.layers.42.self_attn.indexer.weights_proj.weight",
81
- "model.layers.43.self_attn.indexer.weights_proj.weight",
82
- "model.layers.44.self_attn.indexer.weights_proj.weight",
83
- "model.layers.45.self_attn.indexer.weights_proj.weight",
84
- "model.layers.46.self_attn.indexer.weights_proj.weight",
85
- "model.layers.47.self_attn.indexer.weights_proj.weight",
86
- "model.layers.48.self_attn.indexer.weights_proj.weight",
87
- "model.layers.49.self_attn.indexer.weights_proj.weight",
88
- "model.layers.50.self_attn.indexer.weights_proj.weight",
89
- "model.layers.51.self_attn.indexer.weights_proj.weight",
90
- "model.layers.52.self_attn.indexer.weights_proj.weight",
91
- "model.layers.53.self_attn.indexer.weights_proj.weight",
92
- "model.layers.54.self_attn.indexer.weights_proj.weight",
93
- "model.layers.55.self_attn.indexer.weights_proj.weight",
94
- "model.layers.56.self_attn.indexer.weights_proj.weight",
95
- "model.layers.57.self_attn.indexer.weights_proj.weight",
96
- "model.layers.58.self_attn.indexer.weights_proj.weight",
97
- "model.layers.59.self_attn.indexer.weights_proj.weight",
98
- "model.layers.60.self_attn.indexer.weights_proj.weight",
99
- "model.layers.61.self_attn.indexer.weights_proj.weight",
100
- "model.layers.3.mlp.gate.weight",
101
- "model.layers.4.mlp.gate.weight",
102
- "model.layers.5.mlp.gate.weight",
103
- "model.layers.6.mlp.gate.weight",
104
- "model.layers.7.mlp.gate.weight",
105
- "model.layers.8.mlp.gate.weight",
106
- "model.layers.9.mlp.gate.weight",
107
- "model.layers.10.mlp.gate.weight",
108
- "model.layers.11.mlp.gate.weight",
109
- "model.layers.12.mlp.gate.weight",
110
- "model.layers.13.mlp.gate.weight",
111
- "model.layers.14.mlp.gate.weight",
112
- "model.layers.15.mlp.gate.weight",
113
- "model.layers.16.mlp.gate.weight",
114
- "model.layers.17.mlp.gate.weight",
115
- "model.layers.18.mlp.gate.weight",
116
- "model.layers.19.mlp.gate.weight",
117
- "model.layers.20.mlp.gate.weight",
118
- "model.layers.21.mlp.gate.weight",
119
- "model.layers.22.mlp.gate.weight",
120
- "model.layers.23.mlp.gate.weight",
121
- "model.layers.24.mlp.gate.weight",
122
- "model.layers.25.mlp.gate.weight",
123
- "model.layers.26.mlp.gate.weight",
124
- "model.layers.27.mlp.gate.weight",
125
- "model.layers.28.mlp.gate.weight",
126
- "model.layers.29.mlp.gate.weight",
127
- "model.layers.30.mlp.gate.weight",
128
- "model.layers.31.mlp.gate.weight",
129
- "model.layers.32.mlp.gate.weight",
130
- "model.layers.33.mlp.gate.weight",
131
- "model.layers.34.mlp.gate.weight",
132
- "model.layers.35.mlp.gate.weight",
133
- "model.layers.36.mlp.gate.weight",
134
- "model.layers.37.mlp.gate.weight",
135
- "model.layers.38.mlp.gate.weight",
136
- "model.layers.39.mlp.gate.weight",
137
- "model.layers.40.mlp.gate.weight",
138
- "model.layers.41.mlp.gate.weight",
139
- "model.layers.42.mlp.gate.weight",
140
- "model.layers.43.mlp.gate.weight",
141
- "model.layers.44.mlp.gate.weight",
142
- "model.layers.45.mlp.gate.weight",
143
- "model.layers.46.mlp.gate.weight",
144
- "model.layers.47.mlp.gate.weight",
145
- "model.layers.48.mlp.gate.weight",
146
- "model.layers.49.mlp.gate.weight",
147
- "model.layers.50.mlp.gate.weight",
148
- "model.layers.51.mlp.gate.weight",
149
- "model.layers.52.mlp.gate.weight",
150
- "model.layers.53.mlp.gate.weight",
151
- "model.layers.54.mlp.gate.weight",
152
- "model.layers.55.mlp.gate.weight",
153
- "model.layers.56.mlp.gate.weight",
154
- "model.layers.57.mlp.gate.weight",
155
- "model.layers.58.mlp.gate.weight",
156
- "model.layers.59.mlp.gate.weight",
157
- "model.layers.60.mlp.gate.weight",
158
- "model.layers.61.mlp.gate.weight",
159
- "lm_head",
160
- "model.layers.61.eh_proj.weight",
161
- "model.layers.61.shared_head.head"
162
  ],
163
  "export": {
164
  "kv_cache_group": [],
 
35
  "quantization_config": {
36
  "algo_config": null,
37
  "exclude": [
38
+ "model.layers.61.eh_proj",
39
+ "model.layers.61.shared_head.head",
40
+ "lm_head"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
41
  ],
42
  "export": {
43
  "kv_cache_group": [],