{ "format": "TQ4_1S", "version": 1, "model_info": {}, "quantization": {}, "tensors": [ { "name": "model_layers_15_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_15_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_8_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_8_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_15_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_15_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_21_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_21_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_3_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_3_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_16_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_16_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_11_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_11_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_23_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_23_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_2_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_2_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_12_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_12_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_23_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_23_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_11_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_11_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_3_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_3_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_4_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_4_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_19_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_19_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_21_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_21_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_1_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_1_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_11_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_11_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_17_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_17_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_20_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_20_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_19_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_19_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_12_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_12_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_6_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_6_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_2_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_2_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_8_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_8_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_6_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_6_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_18_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_18_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_20_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_20_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_6_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_6_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_2_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_2_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_19_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_19_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_22_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_22_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_17_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_17_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_21_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_21_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_15_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_15_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_15_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_15_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_10_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_10_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_14_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_14_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_21_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_21_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_11_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_11_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_16_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_16_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_11_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_11_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_13_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_13_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_14_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_14_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_16_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_16_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_5_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_5_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_10_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_10_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_5_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_5_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_20_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_20_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_2_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_2_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_1_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_1_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_20_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_20_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_6_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_6_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_14_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_14_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_1_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_1_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_7_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_7_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_10_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_10_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_10_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_10_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_15_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_15_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_23_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_23_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_15_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_15_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_17_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_17_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_21_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_21_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_0_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_0_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_19_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_19_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_17_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_17_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_3_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_3_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_4_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_4_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_21_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_21_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_2_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_2_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_22_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_22_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_7_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_7_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_15_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_15_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_20_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_20_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_18_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_18_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_22_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_22_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_22_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_22_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_3_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_3_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_2_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_2_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_17_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_17_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_1_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_1_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_4_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_4_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_14_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_14_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_16_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_16_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_8_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_8_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_18_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_18_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_9_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_9_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_6_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_6_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_13_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_13_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_15_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_15_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_22_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_22_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_23_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_23_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_3_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_3_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_0_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_0_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_20_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_20_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_20_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_20_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_14_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_14_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_22_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_22_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_19_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_19_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_10_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_10_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_23_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_23_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_21_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_21_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_15_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_15_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_12_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_12_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_1_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_1_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_0_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_0_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_16_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_16_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_5_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_5_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_23_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_23_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_16_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_16_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_1_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_1_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_7_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_7_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_14_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_14_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_14_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_14_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_18_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_18_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_23_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_23_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_0_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_0_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_10_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_10_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_9_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_9_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_3_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_3_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_9_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_9_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_22_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_22_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_0_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_0_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_14_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_14_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_11_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_11_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_7_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_7_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_5_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_5_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_5_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_5_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_19_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_19_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_5_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_5_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_11_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_11_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_5_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_5_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_17_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_17_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_3_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_3_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_0_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_0_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_13_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_13_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_11_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_11_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_4_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_4_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_17_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_17_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_10_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_10_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_12_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_12_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_17_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_17_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_9_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_9_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_2_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_2_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_4_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_4_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_6_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_6_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_23_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_23_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_16_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_16_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_5_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_5_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_18_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_18_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_1_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_1_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_0_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_0_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_8_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_8_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_23_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_23_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_18_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_18_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_13_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_13_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_9_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_9_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_22_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_22_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_4_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_4_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_8_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_8_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_0_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_0_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_8_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_8_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_6_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_6_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_13_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_13_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_1_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_1_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_12_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_12_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_10_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_10_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_15_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_15_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_9_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_9_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_8_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_8_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_13_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_13_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_2_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_2_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_7_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_7_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_3_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_3_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_23_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_23_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_22_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_22_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_9_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_9_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_19_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_19_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_16_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_16_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_9_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_9_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_13_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_13_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_1_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_1_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_16_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_16_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_6_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_6_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_6_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_6_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_2_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_2_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_6_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_6_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_10_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_10_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_10_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_10_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_8_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_8_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_6_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_6_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_17_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_17_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_14_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_14_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_11_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_11_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_4_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_4_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_5_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_5_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_23_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_23_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_18_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_18_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_4_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_4_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_2_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_2_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_18_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_18_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_10_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_10_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_9_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_9_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_19_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_19_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_7_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_7_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_18_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_18_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_20_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_20_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_3_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_3_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_21_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_21_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_17_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_17_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_14_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_14_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_21_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_21_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_9_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_9_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_14_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_14_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_8_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_8_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_1_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_1_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_0_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_0_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_4_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_4_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_3_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_3_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_13_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_13_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_1_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_1_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_3_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_3_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_22_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_22_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_norm_weight", "shape": [ 896 ], "file": "model_norm_weight.quant", "original_size": 0 }, { "name": "model_embed_tokens_weight", "shape": [ 151936, 896 ], "file": "model_embed_tokens_weight.quant", "original_size": 0 }, { "name": "model_layers_11_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_11_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_17_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_17_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_12_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_12_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_11_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_11_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_12_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_12_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_16_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_16_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_23_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_23_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_7_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_7_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_15_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_15_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_13_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_13_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_12_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_12_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_18_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_18_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_13_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_13_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_20_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_20_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_13_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_13_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_3_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_3_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_8_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_8_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_19_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_19_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_16_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_16_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_6_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_6_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_7_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_7_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_21_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_21_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_22_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_22_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_19_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_19_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_21_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_21_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_8_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_8_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_12_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_12_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_11_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_11_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_19_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_19_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_7_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_7_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_5_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_5_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_9_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_9_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_18_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_18_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_19_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_19_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_13_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_13_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_7_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_7_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_0_post_attention_layernorm_weight", "shape": [ 896 ], "file": "model_layers_0_post_attention_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_12_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_12_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_7_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_7_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_10_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_10_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_21_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_21_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_22_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_22_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_8_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_8_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_20_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_20_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_20_self_attn_q_proj_bias", "shape": [ 896 ], "file": "model_layers_20_self_attn_q_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_18_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_18_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_4_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_4_mlp_down_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_4_self_attn_o_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_4_self_attn_o_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_20_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_20_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_14_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_14_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_17_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_17_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_2_input_layernorm_weight", "shape": [ 896 ], "file": "model_layers_2_input_layernorm_weight.quant", "original_size": 0 }, { "name": "model_layers_5_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_5_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_2_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_2_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_0_mlp_up_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_0_mlp_up_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_0_mlp_gate_proj_weight", "shape": [ 4864, 896 ], "file": "model_layers_0_mlp_gate_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_9_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_9_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_5_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_5_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_15_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_15_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_4_self_attn_k_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_4_self_attn_k_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_1_self_attn_q_proj_weight", "shape": [ 896, 896 ], "file": "model_layers_1_self_attn_q_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_16_self_attn_k_proj_bias", "shape": [ 128 ], "file": "model_layers_16_self_attn_k_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_7_self_attn_v_proj_weight", "shape": [ 128, 896 ], "file": "model_layers_7_self_attn_v_proj_weight.quant", "original_size": 0 }, { "name": "model_layers_12_self_attn_v_proj_bias", "shape": [ 128 ], "file": "model_layers_12_self_attn_v_proj_bias.quant", "original_size": 0 }, { "name": "model_layers_12_mlp_down_proj_weight", "shape": [ 896, 4864 ], "file": "model_layers_12_mlp_down_proj_weight.quant", "original_size": 0 } ] }