Add MTP layers to quantization_config.ignore list
Browse files
- config.json +10 -2
config.json
CHANGED
|
@@ -320,7 +320,15 @@
|
|
| 320 |
"model.language_model.layers.62.linear_attn.in_proj_b",
|
| 321 |
"model.language_model.layers.62.linear_attn.in_proj_a",
|
| 322 |
"model.language_model.layers.63.self_attn.o_proj",
|
| 323 |
-
"lm_head"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 324 |
],
|
| 325 |
"kv_cache_scheme": null,
|
| 326 |
"quant_method": "compressed-tensors",
|
|
@@ -464,4 +472,4 @@
|
|
| 464 |
},
|
| 465 |
"vision_end_token_id": 248054,
|
| 466 |
"vision_start_token_id": 248053
|
| 467 |
-
}
|
|
|
|
| 320 |
"model.language_model.layers.62.linear_attn.in_proj_b",
|
| 321 |
"model.language_model.layers.62.linear_attn.in_proj_a",
|
| 322 |
"model.language_model.layers.63.self_attn.o_proj",
|
| 323 |
+
"lm_head",
|
| 324 |
+
"mtp.fc",
|
| 325 |
+
"mtp.layers.0.self_attn.q_proj",
|
| 326 |
+
"mtp.layers.0.self_attn.k_proj",
|
| 327 |
+
"mtp.layers.0.self_attn.v_proj",
|
| 328 |
+
"mtp.layers.0.self_attn.o_proj",
|
| 329 |
+
"mtp.layers.0.mlp.gate_proj",
|
| 330 |
+
"mtp.layers.0.mlp.up_proj",
|
| 331 |
+
"mtp.layers.0.mlp.down_proj"
|
| 332 |
],
|
| 333 |
"kv_cache_scheme": null,
|
| 334 |
"quant_method": "compressed-tensors",
|
|
|
|
| 472 |
},
|
| 473 |
"vision_end_token_id": 248054,
|
| 474 |
"vision_start_token_id": 248053
|
| 475 |
+
}
|