mconcat committed on
Commit
a385d58
·
verified ·
1 Parent(s): cb8f050

Add MTP layers to quantization_config.ignore list

Browse files
Files changed (1) hide show
  1. config.json +10 -2
config.json CHANGED
@@ -320,7 +320,15 @@
320
  "model.language_model.layers.62.linear_attn.in_proj_b",
321
  "model.language_model.layers.62.linear_attn.in_proj_a",
322
  "model.language_model.layers.63.self_attn.o_proj",
323
- "lm_head"
 
 
 
 
 
 
 
 
324
  ],
325
  "kv_cache_scheme": null,
326
  "quant_method": "compressed-tensors",
@@ -464,4 +472,4 @@
464
  },
465
  "vision_end_token_id": 248054,
466
  "vision_start_token_id": 248053
467
- }
 
320
  "model.language_model.layers.62.linear_attn.in_proj_b",
321
  "model.language_model.layers.62.linear_attn.in_proj_a",
322
  "model.language_model.layers.63.self_attn.o_proj",
323
+ "lm_head",
324
+ "mtp.fc",
325
+ "mtp.layers.0.self_attn.q_proj",
326
+ "mtp.layers.0.self_attn.k_proj",
327
+ "mtp.layers.0.self_attn.v_proj",
328
+ "mtp.layers.0.self_attn.o_proj",
329
+ "mtp.layers.0.mlp.gate_proj",
330
+ "mtp.layers.0.mlp.up_proj",
331
+ "mtp.layers.0.mlp.down_proj"
332
  ],
333
  "kv_cache_scheme": null,
334
  "quant_method": "compressed-tensors",
 
472
  },
473
  "vision_end_token_id": 248054,
474
  "vision_start_token_id": 248053
475
+ }