diff --git a/.gitattributes b/.gitattributes index fdbd3454376055504bbe24352679924242364f1d..634afd037d358cf3ab28bca1d3f5babc9367e5de 100644 --- a/.gitattributes +++ b/.gitattributes @@ -2517,3 +2517,251 @@ qwen3-4b-thinking-unary/model_layers_27_self_attn_v_proj_weight.planes filter=lf qwen3-4b-thinking-unary/model_layers_16_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text qwen3-4b-thinking-unary/model_layers_27_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text qwen3-4b-thinking-hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_embed_tokens_weight.fp16 filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/tokenizer.json filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-unary4/lm_head_weight.fp16 filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_17_self_attn_q_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_6_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_14_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_0_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_24_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_20_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_25_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_27_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_8_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_26_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_6_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_24_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_0_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_13_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_11_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_0_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_7_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_9_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_19_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_5_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_22_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_13_mlp_gate_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_15_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_0_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_21_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_7_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_2_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_16_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_13_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_6_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_15_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_17_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_25_self_attn_q_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_15_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_11_self_attn_q_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_19_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_17_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_0_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_10_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_0_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_1_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_20_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_4_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_8_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_2_mlp_gate_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_11_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_9_mlp_gate_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_2_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_27_mlp_gate_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_13_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_8_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_18_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_8_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_20_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_8_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_27_self_attn_q_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_24_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_2_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_13_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_5_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_5_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_8_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_12_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_5_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_27_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_22_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_27_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_19_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_24_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_16_self_attn_q_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_2_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_19_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_9_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_16_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text diff --git a/deepseek-r1-1.5b-gunary/model_layers_0_self_attn_v_proj_bias.fp16 b/deepseek-r1-1.5b-gunary/model_layers_0_self_attn_v_proj_bias.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..5837e3fe1a534632322c5961f2b75f7c554f88c3 Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_layers_0_self_attn_v_proj_bias.fp16 differ diff --git a/deepseek-r1-1.5b-gunary/model_layers_5_self_attn_v_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_5_self_attn_v_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..0f58abe71703255d03b9b1473027996c0c5a505e Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_layers_5_self_attn_v_proj_weight.gscales differ diff --git a/deepseek-r1-1.5b-ternary/model_layers_0_mlp_down_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_0_mlp_down_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..cddddbeb72cb7e5015bde4d5b7250ebb9cc24de6 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_0_mlp_down_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62b5378fb65b0e6d38e4c3a2fd3cd08a64569b3da596e2234978d0ec3a77167c +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_0_mlp_up_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_0_mlp_up_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..38a862dd77d5222b37a02984056ba2b96215df0a --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_0_mlp_up_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e94b58948e74314e1d27ac9d61975b860653f61b2d8eff06f86fd37227a4aa1 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_0_mlp_up_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_0_mlp_up_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..888bf53d0746ff4d0fba610731941023f6573f62 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_0_mlp_up_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:619e625042427c3932cd491fa909817245c376ba32044a6f2e0808905357bb1b +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_0_self_attn_o_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_0_self_attn_o_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..809cfcbda3a544424583001f9a4a49f9ce47d6a2 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_0_self_attn_o_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccc575264a29da098da3b78559db3a84a2129c3e9bb8ea31786b466b88a3b1a3 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_0_self_attn_o_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_0_self_attn_o_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..3d54fd368a911b9378f94133a8a0f64daca8e7bc --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_0_self_attn_o_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bba743450b99b08d9845f481c95f41edfbff94952d32dbf80805f9d550ceb2a +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_0_self_attn_q_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_0_self_attn_q_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..77b4fe60b7204b12f1612ce54a407137aa3c3fa6 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_0_self_attn_q_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff97d6db7c10a4cd5f316c5c2957a33ff5a57b2eec02e1078c37c99fbc8d4c25 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_10_mlp_up_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_10_mlp_up_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..2b93534364fbcfb048dba3e6e378653d8bdb6395 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_10_mlp_up_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24bf7cc352024d1f603d250a201bd571a006a93bcd1bc8e439bd58682c6f4492 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_11_mlp_down_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_11_mlp_down_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..7f9f2b830dad949d5620f64e52cdce0ddee6971f --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_11_mlp_down_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef669b8b552a13a80c39cb2b8f1a363b8aa2988535ccddd56775dbf7166bc528 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_11_mlp_up_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_11_mlp_up_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..c6ff29dd3bb94286a1d4aa5c8de7f49e8c68dd74 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_11_mlp_up_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cf1fdca9ce2aa0911aee4f80032b508a4116142562b27f0e0e0a0fc3282b3e0 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_11_self_attn_q_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_11_self_attn_q_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..0c22a099d6cd66123370944dbfa292b93a1dc885 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_11_self_attn_q_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48b6cd43aee887243f539411a83873aa00711d030227035d3aed7ababb087f38 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_12_mlp_down_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_12_mlp_down_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..65d44bc7f357b44f0e3947c9958295b777eca4ae --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_12_mlp_down_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bf86395ecb72d04d8a2617afc0ee6c8e3e72b7c0e2fad8204661ba3256c41c2 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_13_mlp_gate_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_13_mlp_gate_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..ce4efd7ad70c942d77ef528e20a2a101902a57c5 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_13_mlp_gate_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cd16801e5491bd2372fea8435e0bdeda3d7d7d08e420e0a28d09fd98c850227 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_13_mlp_up_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_13_mlp_up_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..e64f42f11cfaf8dce427a36d1b9002400f00e6ed --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_13_mlp_up_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:587a574229e63174f4bdf31a07eb21997e85d7da551bedb6a6ac2be6d18dcbb6 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_13_self_attn_o_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_13_self_attn_o_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..8bd3ee3e9cc34d5301757ddde961d9d472794c84 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_13_self_attn_o_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:571fbb793c19c519e2d9c484d9b7aad9a22818e028a3f4441d89f608e338fd3a +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_13_self_attn_o_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_13_self_attn_o_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..382e46689aeb807b2e5a8f895a8fbfe8b43182d6 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_13_self_attn_o_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f592d4ef97653f3812b5ca724a90a6b9c10fe31974e5ff71389418f8920f3e6e +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_13_self_attn_q_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_13_self_attn_q_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..596cddc9fdaa579a3090e1d06fff0a9a2ec9d4ae --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_13_self_attn_q_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fff537c8f38887b82083aecbed92b2b8dc5a4a375829b2760bfce08719b7d69 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_14_mlp_gate_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_14_mlp_gate_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..6b65e9dddfc1cc192f2a852444c14f210206cc25 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_14_mlp_gate_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:372be321f22dc5de9163ba84cf3ac48ba63d8e609c420506cad54496b5ec6657 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_15_mlp_down_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_15_mlp_down_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..25a42274ab90e363513b4b6118f6709d29cc1282 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_15_mlp_down_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f3c3d41f6d48e751e948114a1a007b9276233eccb276431bf4c7fe6038eca45 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_15_mlp_gate_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_15_mlp_gate_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..0dfc2adeef7aa3d0b5599d28e7dc662a960902e2 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_15_mlp_gate_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6641a6a35a20d1af81b9d867ddfb4c00818a5cd48f31b8a1c5d32a0209ece15 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_15_self_attn_o_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_15_self_attn_o_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..8b020b3cb24bbdbc76f812406d4ce0b8a619d409 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_15_self_attn_o_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4078bb99a0aa1df7f10e5ce704b0ac390c1b4b50c3ee3e879aa9086d665161ba +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_16_mlp_gate_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_16_mlp_gate_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..6d1a83f387b15a5e597873076dc8c0646466b027 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_16_mlp_gate_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a201cdbaddcabd2c3fae11ed6ffb1494148b1d3767376b0b09e9ba77744e152 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_16_self_attn_o_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_16_self_attn_o_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..bd3f3fdd115881ddff47307c49505aecb8dab30b --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_16_self_attn_o_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8866573a7730031f6727f2032b14d5aa529409ac0c6cba986e5af22d0535efbe +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_16_self_attn_q_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_16_self_attn_q_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..2d9a3dd75c7f59226fdf02493d166da42d9a364d --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_16_self_attn_q_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcc5882cf2984a217980345db159e3ea819570f1bb32d6433d0cdcf65a179b1a +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_17_mlp_up_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_17_mlp_up_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..3a410b65bce3bed7b48771249efcf353f1203525 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_17_mlp_up_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e324e2d9752680c667336f4839fb14945ce040822ecda3ac04f027e9460a633 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_17_self_attn_q_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_17_self_attn_q_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..ded83ca223dc328cdbc95afb8a8e03fe0de2975b --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_17_self_attn_q_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65cd692f72c985a5ed909fb22f3c7ed8fd58e7d988bfbe6310412bd98e15dc0d +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_17_self_attn_q_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_17_self_attn_q_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..7f2d226c0934c0d2c83577eff5d920919984838e --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_17_self_attn_q_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ca656ff67f1fc3b77de0fc890f1a6894986fc636d3e463db71174dd7a81a35 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_18_mlp_gate_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_18_mlp_gate_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..808e3b3fcb33ea322bc29454b31e23b535a4c1de --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_18_mlp_gate_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79eff64b79119e79b984b5c24266b1dbbe38d0a0b6b2b48a46fb07baf880a852 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_19_mlp_gate_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_19_mlp_gate_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..bf1061527a9955884695eea2c77c302f4e30a09c --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_19_mlp_gate_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d0f0c308526d3c68c4a3efa7bbf0522de8b386f5be88eed57639603a9d1aa34 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_19_mlp_up_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_19_mlp_up_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..361ca774406a34364bd0ba52edd7e9fb0e5604ef --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_19_mlp_up_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b64e1a4e3ed8cd45f20658f5cd9f18868d597c95a53fe539aca9ce59ab313b +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_19_mlp_up_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_19_mlp_up_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..751d1177faff2d0b7332ae71668398fd053a822c --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_19_mlp_up_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62b0665c7bfb81ddf41f3ad80e246fdf911545661dfbc6f29ed777cf2b7f0670 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_19_self_attn_o_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_19_self_attn_o_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..72e3dcab01b1b37937f5e004867e0f6457ff5839 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_19_self_attn_o_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a37b742d18df0955e555127edc50b6e73070876803dca865adac46281c022170 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_1_mlp_up_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_1_mlp_up_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..15e6f88a74dc23466e7124d85e114a114524c06e --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_1_mlp_up_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53c65dc2de71d3f2559859f7acb5e114d1ca7f979823f440367a4ea51a46c09a +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_20_mlp_down_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_20_mlp_down_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..508d0067639e7850eab6794443b71bedf94b5542 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_20_mlp_down_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ff6e71a912d5918547f7c4cdeb3a8d26f7f80b7609cc22a9d5d8bf0499c8578 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_20_self_attn_o_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_20_self_attn_o_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..bc76f9cf30197eb9c2f5e79fceb4f25f73c8587c --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_20_self_attn_o_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:588a0380cbabf1fcdc291a40380213d8c5cb9cc5329768d80718983903622362 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_20_self_attn_q_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_20_self_attn_q_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..76e5775452b99d12c1adfdd748da597b3de3087d --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_20_self_attn_q_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99ff6b610d0d4058d83bb7280ad98c420f57f7c3f02828710fb3720f24394b5b +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_21_mlp_down_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_21_mlp_down_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..e832261e624e75fcf2200f71e059b65c81c6b764 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_21_mlp_down_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ae898f8a79728c4e184db10d9338ea1ba4f61c2d38736bb8c563839d914e65c +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_22_mlp_up_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_22_mlp_up_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..0abc3da7c8ccb38946da6e545f262b31ecb51dcd --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_22_mlp_up_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6055ae0ae1b27830e11982c2c86d637ffa72044b675dd9671c06d9ea60fb7e25 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_22_self_attn_o_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_22_self_attn_o_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..7baccea9e2d8785ac58762c8b1be21060886dd9b --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_22_self_attn_o_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c5b45ca1dfc8383125f0fffc08b7e0d6fb3198c74325bf872483c7405f8f0bf +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_24_mlp_down_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_24_mlp_down_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..ee51e316abb4d15282677f8aceffb498ecb4bca3 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_24_mlp_down_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2afa608693bb6606d2beb3ba03bf8c5847e0ba9b2cce90316450a73d6e386626 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_24_mlp_down_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_24_mlp_down_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..4bd45c3ce8b1426f120ebb536a94f251a7292ac7 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_24_mlp_down_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b52069b7f6101270114ef09f329bf22e4827afba6bc354921db023662981af3f +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_24_mlp_gate_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_24_mlp_gate_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..af291915b4212171cee9d6ff06872c27a7860431 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_24_mlp_gate_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4743b0b02dd129335accb1f0c236190ad3fa2014df56af9e97e9f3fffe44081 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_24_self_attn_q_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_24_self_attn_q_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..ca358bd8c3f865eca97595cfc3ff8e6bc3ad48b9 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_24_self_attn_q_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:110dd02e26377c4773b01cca3d118bc63200084be4b2ae5b9dd71e21a2919816 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_25_self_attn_o_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_25_self_attn_o_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..08298d9a3ad9e2eb8feff28b16c105a3b423cf55 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_25_self_attn_o_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:599bd331611b831ceb3aa6c9dcf9191506a48ccb77b1744c0f3c1133b844e127 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_25_self_attn_q_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_25_self_attn_q_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..07cbc56b2875bbadc1b896aabcb69959b17cdb1d --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_25_self_attn_q_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:322de7134737d165c2473ceb53801c4dfb187438b13cc8435a4799590fbfce34 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_26_mlp_down_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_26_mlp_down_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..8a893d69c5f92adb96be0897ccc9499ef6d2c0dc --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_26_mlp_down_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:381e3160da1b4b26877352cef55404dac99bea72065699cb6b5090c5359dfbb4 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_27_mlp_down_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_27_mlp_down_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..49f21f2c9c31cd9021e36a0884922b1f6d6aadc1 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_27_mlp_down_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3213ab2260679a335f28d6d365faaa41b6afad8e07ac3e43505f7f8a2f948f10 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_27_mlp_gate_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_27_mlp_gate_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..412d4218efbeaf32dd6a4adb2aaae1e4d693ac0e --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_27_mlp_gate_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b43198a8b2d1d79ac1d3b5745cc36c0007b8b6503daf6807a4609a0f3e74ed5 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_27_mlp_up_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_27_mlp_up_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..dea03ea60eb1ef7ce37e594f0e7ed77fd1ff1284 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_27_mlp_up_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa3d705c63bb6fe2d60c7ab2e26ca35aa04232c64c3da30245ece7861d01e8a1 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_27_self_attn_o_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_27_self_attn_o_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..044a6507e6ebb67f2c6bb470d56b0affdcaf9adb --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_27_self_attn_o_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02628f2c1064ee2d979dea3791d83c3f90cc28fe560901c226ccbcd11272b899 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_27_self_attn_q_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_27_self_attn_q_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..f0ba8940f40f18cd0f28a2471e0e38f7f311ec76 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_27_self_attn_q_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0de84f800e95204c00918c1f1effaa315300a9ffbff428bb9af3cdb2706d9252 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_2_mlp_down_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_2_mlp_down_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..ad232e26d178eaf50f3bc347c992a4d95e92393a --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_2_mlp_down_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a384c8faa506cbf738a4a7158a2d423a5119c89e86ceba74b6774134646b040 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_2_mlp_gate_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_2_mlp_gate_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..5ccbcec9698941e24c8cd3e60a6e1de7d16c85b4 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_2_mlp_gate_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae7b726aa18f6a208eef79b3bfa7c8b921f0607cef64789fc043028818b44cf1 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_2_mlp_up_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_2_mlp_up_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..c5945a60fc579fd998e80f00c9607fe4680228a0 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_2_mlp_up_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bd024debb8cb894651b6096cc3a1c69b4a72123b50560cda9d7a409bbc4b6aa +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_2_self_attn_o_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_2_self_attn_o_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..955424fcf99a0fc40c6de4cce5c28e9b7bc106b0 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_2_self_attn_o_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2e6747ea7ea791086cb1828f537c7f7100f7263a0009aae4844cfea87497cd2 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_2_self_attn_o_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_2_self_attn_o_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..122b7d1b1e7cf35c6918aea504c74dfe960d8150 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_2_self_attn_o_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35a6a78fa7a03e0cdde477e4ac6792a7110a678c6579488c59734eac4b655667 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_4_self_attn_q_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_4_self_attn_q_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..37c981d83782e209427bac6ec7107b93a5ac50f4 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_4_self_attn_q_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:921a4d23526c48463c1cafa85010bfb9cddec23070e465fd24a6ecf9e8a3c33a +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_5_mlp_down_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_5_mlp_down_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..70b9e45f1badbcf0f4cb5655a2a06b130b4b134c --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_5_mlp_down_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc690a5944e7374d9c31f722325a1850659429fe187f3a48cd64dba292d4d2a9 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_5_mlp_down_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_5_mlp_down_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..1c744145797bcd7460cfa59705c9713a837a95ea --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_5_mlp_down_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e7e404998a57ab8aa524d24c0e5f7cdb65787c06fb95f2a1335583ebc5f4cb1 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_5_mlp_up_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_5_mlp_up_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..1a3ea2b912295add1dd904c5acde9a42dd9c5736 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_5_mlp_up_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e9c061491cf36514adb4157635df0d4dd964bb35b7774c4c6be788335458549 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_5_self_attn_o_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_5_self_attn_o_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..b12320973608c0fe6a32d4bacdb14ec677a4ad3f --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_5_self_attn_o_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37a2ad5dde00c418ecb985c95fd6465e04972f34c0d72243131875aeff79f80a +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_6_mlp_down_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_6_mlp_down_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..389af1cbd1ccf3f295916e415c4944847062f08d --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_6_mlp_down_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c29a59dddae6e50a0ddb95250ec374e97c1820385d72d15e1ab3fc80289504 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_6_mlp_up_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_6_mlp_up_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..b6ef9739448c5a25b5f23eb97ce60d13c0fa7bda --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_6_mlp_up_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:867bf8e2a69d635cab5342205dcd57c4afa742590bc4e047224033757c1a8492 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_6_self_attn_q_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_6_self_attn_q_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..b104826763d9618e807cd8f8cdea22c257360bef --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_6_self_attn_q_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af78c21f21a0ba37734944081e62dbdfb5cbcc58d44ce8db81beac8891acafac +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_7_self_attn_o_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_7_self_attn_o_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..03eb2390b3832c7c18cb7ffa56043f2929961861 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_7_self_attn_o_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7b76f3e5ca9bf5be2faad36097591ad8ec490c8594c3c07326bbabf20474607 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_7_self_attn_q_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_7_self_attn_q_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..366edeeb18ce164e1cd63026e4ee0fc2bb6fc112 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_7_self_attn_q_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f20b20c2c4cc52d1e4eef19b6cb8e9eaee63592d519e761d6cd63d198de59e +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_8_mlp_down_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_8_mlp_down_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..1a55017fa75b8630d86e03ca7825d523e199ac15 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_8_mlp_down_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d56be012c855c3ba35292222d8d841f3344df2710360229a5f94d84d20f6de61 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_8_mlp_gate_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_8_mlp_gate_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..a12330cd3cbe5454582b5187d7e9daa19aec3fbc --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_8_mlp_gate_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d368b8c44697f2dda8f2811d9a9b16a6c5902581feb8726024156d166bc9ad72 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_8_mlp_up_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_8_mlp_up_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..d4c42cbc4ee3781267eb0e18479a2f6b43664b0b --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_8_mlp_up_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f868a0d5c95adb5663fe348cc0ee334bed979ff7263188f02ffed60eff2ced +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_8_mlp_up_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_8_mlp_up_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..4b73191e529d3b6aefdf9e1d50c67b6515f4d9ac --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_8_mlp_up_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03d71ae34c30352e913cafa3885e830f46376559d3ae9e652ee845545b33862f +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_8_self_attn_o_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_8_self_attn_o_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..9eb79c93a323f9382b0fa1056d336f22397a10ca --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_8_self_attn_o_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4749eede0c102518476424a7452bad998208c5eacb12a7ef17812d38cb58de4a +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_8_self_attn_o_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_8_self_attn_o_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..a10d12b4ebf75b2c041783b6cd15aa6098d28a9b --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_8_self_attn_o_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b1c0460adf31f90eb322e76f27c19fb38482b95686781602e1679fba56deb5a +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_9_mlp_gate_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_9_mlp_gate_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..5f945f8faf35e6307b9785055c1c753ad0565960 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_9_mlp_gate_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb25fd3f9510a4c48ab4b0e8cd4dc165cc42cd03ffc3b753fe5d164fc26b3bba +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_9_mlp_up_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_9_mlp_up_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..c740e1c7cf43075d868b1dae206f87ce024f1200 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_9_mlp_up_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ceb08b9e97995202266a3645c01a118592979d16c75426a32be00d8ada7edd9 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_9_self_attn_o_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_9_self_attn_o_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..57750f456ce61d40057b3daf8703b271985f54f7 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_9_self_attn_o_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9823adde2e47d781bec85cb726ed47f888477daaf3b2b4bc3714ba58db63ed65 +size 294912 diff --git a/deepseek-r1-1.5b-unary4/lm_head_weight.fp16 b/deepseek-r1-1.5b-unary4/lm_head_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..fb4af3ef304753b9796153f2bd5b599471fbca35 --- /dev/null +++ b/deepseek-r1-1.5b-unary4/lm_head_weight.fp16 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cca68befcc8201afc0eb54623dd20bd2af92acfe3cff767e6f8e6c0ddad2a397 +size 466747392 diff --git a/qwen3-4b-log-unary/model_embed_tokens_weight.fp16 b/qwen3-4b-log-unary/model_embed_tokens_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..0e8e116074a78063e54fe3e480d8e73dab1bede3 --- /dev/null +++ b/qwen3-4b-log-unary/model_embed_tokens_weight.fp16 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:306877428a6e2a0b343ec77faa07dc7ea85c83af3ee0c23ecfb5a9796b3f0464 +size 777912320 diff --git a/qwen3-4b-log5-unary/model_layers_0_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_0_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..aac9f03c9b19ff851718d7c5306f17a4cb6f5ce0 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:403df2b65fa9eeec754dc52ce0456be49613cf837d146d4e6bcf3bb6b75cf7f0 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_0_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_0_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..5c59163b99f81a9ef1e7d9de94638613dff153d8 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d77c70269351a96a32fe894b9212ea78511095b804e5bce1996ffd66d5d92a +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_0_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_0_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..833c61e809bc5013f593fd998ba1ff672f640919 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb74eb45a5b89f7139d01eb702cb9075d87169a0f71ee0d5c7a83d2f92c20781 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_0_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_0_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c1fa4f882ff946c650a47997ac312c2a8cd40c21 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8698eb4f920c89ca959864ed35d6d7158f295831d64d51ff090ee244720979 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_0_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_0_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..492efb824003ef035f7aa73853043b289c3925e2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c58415e66a04cf9a787d171b55f1c3dc746e1fc02b5551b491e610b22720e033 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_10_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_10_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..62bb36c3f39bd1695a98e5937746eee5c8d0f003 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f22f95ee858a2af79e717fd1df44caf7c62114966070c0fcb4ec492c27ad950 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_10_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_10_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..574077dbb6c79124816905a5e132e4765fefffcd --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72c4744abaff7a5ccd59fc5c500a12b7ea75f4dcee911d051a933014e0c74c85 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_10_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_10_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..51295465b5beb45b86e17d1f97bc3b0ad43dde57 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f0b786f7662b24fd99173cfd9145e10e62114c4472dbe379a3ef9449821943e +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_10_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_10_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..e78e673dba45e9a0a6000e14182d9c7dc8476887 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df12cf1f11a698e90ad44ac92c9d629fcc16c47dbbd0b7bd120f9d9bc534dfe0 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_10_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_10_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..8c24ce54e09ca1a0f48bd7b5b1c103a616455f49 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4325873cebc12fdc247d42e108e261330402087197f7a01f7676348bcfcf5a4b +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_10_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_10_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..74c3b790b01bed46fb384378817dd5d72253ed2f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34871242f8e43c193979a3b4a5372dd467733febe180c226bc6379aa937431f0 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_11_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_11_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d45cc3ede3e626373655f87732ee0eac60ebd345 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce550ecfca0f2baf1059eb68ec41e0847d1807f7154903c670318281bc6a6c6d +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_11_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_11_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..693b001af196a81c93506f18b8157951a566a54d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99ba6d4ec8148bc2751e0e184d0bd78c0d24fec712fb45bbdec0ba9252ab63e5 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_11_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_11_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8431735b5ce921829a261cbe75edc7eb4361f348 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa9f02ddafa47b671ffa1b17629bf5fbde4cf3df1a0b81caf33117754ee3d6cf +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_11_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_11_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..9c1df0eb797fb64a9fd10ad82bf72cc499e2ebae --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a14bd047cb1aa48c665813aa944ef1e8fce3f515228ce99a932f0bcfb587c1 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_12_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_12_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9738dbc9d4a057e388e1dbff3f18b31ffa1d0d02 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4fe9b2b90f1af8f11fd70794f1e947f8745b57fcda031db549bdc13799cbfe +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_12_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_12_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..dda3df56a691c5e182e31eb655eec6c9d1211a4e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4961b3b6c570480169fe06e33ca8eb06dc11709f3d934d05ac5bb96459a58fa5 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_12_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_12_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b50e7c985b99b9881443fc2c9b9bb93b01dba15c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e72f211bbd7d79cceb467e23d82c2c392590cb65ff8a486a151bc71bd8b4f9a +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_12_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_12_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c23d1c2bc2077954fcc049bfdde2037cefc10fb6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a41bc971443f5677d5151d14355ffbe4e7fe5b81b62e6c906370c40a6a51c5 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_13_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_13_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..548cb02fb76e1f89027954d104956ef9ec8caa2e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16b8505ddcfb119d57bac898abb35d7293092dcb0e1d841f073e1e3c2de2082 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_13_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_13_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..6a70a3de1a2462e5c39d3551ad6af6aa7089e055 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5f96f6273f080bfdaebd70218ac15733697fd0b8dfa4fcd7f6f4380585ddc23 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_13_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_13_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d633cceef482a5d55f8564799e75f6150b4d4eec --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d9bd1649c6fd2e8b33c6b17f376d3c045ed8284199bc152cd5b2fc6a5f64c8 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_13_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_13_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..6b637376e46ce6c8ddf2048e3359e47da815ff01 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ecace98f05eee6fee606fdb4647bcc309fb3db113272f5fbfcceeb17e23a289 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_14_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_14_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9512f1db84ebc55ff2d419cf4e1a86c3c0800a88 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:582f4840a3a10d137c2c31955ac86329df413ccdaf8b7e3979cd49ac770b31f4 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_14_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_14_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..3c3bea704965b6186cfbf7e9e53ca81f9243dd7a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e13aedc2295d09d5fb0fc54f1957b19d7750aa8c62a60a9613765c8e0a5b4f22 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_14_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_14_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..73e2cfd2ac111b1700901247d365ff7f049a13c2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce8c6edaa862f0f7f25a9134d8880261baf92a76c9763c5007fec8f54e763a8b +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_14_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_14_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..21c861470c744e36f559a0b75a199101105b610d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:500f948878a92e4ef39dcb8b922030a039ed0f4935ee156e9981814cad5bad5e +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_14_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_14_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..64e1b53eec6f9c89646a46eb628ecbd4130b64a3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a141b68744889da31f511d558c03dda64a218a88c257960de089e6b3e40efb +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_14_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_14_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..ebc7429c6de0d547a3c582a9a3a3d4e7474de889 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:222ac74c1c141ad805950c12e3e69ec209bf68a1514e73e96b0233a504747e3a +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_15_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_15_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..8dd60fe972de5489b629df12269659ab313c4a1c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fe333004ef0e48c2cb7f8c2acebadc83a04eaf97965cb3c53cb4753dfe16b3 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_15_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_15_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..2f68d0a2740154fc68c596ecc880363fc7c97628 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d13df2c99a36b205bc24b5b0355170ce39c03e735affa2c9461a149057a4375c +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_16_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_16_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..5888ce59102c0aab22bf01826b7a28b7147714ff --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9225a860d5b0ac0c6a856882e27ee6da36bc68b9b16c6aab2bb03c71b9a38830 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_16_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_16_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a5a4bd31c02ef682930039680d82707c4755c070 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06b349f43e2236d6d8bb557963d8ef4946ae3884306d7418d26783bff8038316 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_16_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_16_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..10c47943eee5475ebfc207b550fe0684f2aee995 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00afecb135e7d9642dec0e4689a191ccd94d6c27596f31365e7314146a19f492 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_16_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_16_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f2b8e31b81c64591709cc5f32f52c1d5a6ae94f0 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d3be5da5b58a14a8fd2647dda80caa80f60585aee431010a27f17007a7f08e +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_16_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_16_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..cf101505b3f896d26031256963d3415638efad67 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77120e48651afe0c281b6dc397f0ca7a8681124e9d5c4bfb52051c180ec01d0d +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_17_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_17_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..71acee2be8420ff7f6e095a879fb81e991b19052 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33440a70e322cad1af346f10177e7d378f3515555d2f9d6648ccbf6c6d222aba +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_17_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_17_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f6875e9d1fb0d48e1559afdb9edc021946b65076 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df9eba97d895f11662cfc94115deda24c09e85aa9a6533d6e37dd524bcf3e6e9 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_17_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_17_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..727e9b5d99f6db34110290180dfdf3c10ab92f64 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b950c6d00697373b0377e3c1c745a7c715bd48a733ef05d6458bbea6d2ccba5 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_18_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_18_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..32854bef6f94b4383decfd85ec4fb37eb8294bf3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59fa864ceb61f9a669e8eb87f7bb7e540c5859266f9e1a2f18ab5733d70fc21c +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_18_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_18_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a7bf9bbefa32e8f9075757d94b92f76bc4e3062d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1df1d2c4480e18b76e43c1553831b8f11a3476595a4ef0f8443fff03aebb9a1 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_18_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_18_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2428e96ae452bd7f40d077472423ae69c935a841 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee1df0d9c428e5765105b99eda1c120ac34dd53a40eded870f987050b48607a6 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_18_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_18_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..081d0c423c7b254e2db3ffeac5fc2fca82bb5578 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d10c9d2ce54f687e353a2c2817f085da56ac40cb8fa7b6b2579c9124d3275f00 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_18_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_18_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..024669d535b5d70e5915a109f18425eacf37fa67 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d132ecadb65b6ffda97aa59dfa9979794b650d99512fa9cae9fc609492c1648e +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_18_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_18_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..debe4d8dcb4184ba66d7d72e37f4edc8fecc2fc2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ffc719189d09bce4bbd9725e2e884de02dfd159ea53737b1975b602dc59213e +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_19_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_19_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..7e6a2507aaebcaf6dec21de57c5c4bbd0d230b71 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3316c3163c2dfdfb3798f2c40dedf5fc132447fe6728d4c06507b29c0474001 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_19_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_19_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9c5098cbdc426219acbbf56a05867648253e7a74 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:945d35fae11871dbdd75db2bf836c3bbda3db8903eb38bc057e9f2a4c6eac919 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_19_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_19_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..1a4085da6bd4d2d39e21463ba1c6b5c6b18b7f2d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acc402d8f5ac3c9e0e1bf6edfa18bb0765c6306e62867f979cb71810a9ef76a4 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_19_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_19_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..db6f5e113f3a692a51a5d4f65a72735bd29d9d62 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbebc2c12e4cddcd132a57bd33929afc80f185d195020cc6ba12958a8b2ee44c +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_19_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_19_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..1a5ad77ceef1ff284c2aed01ea6ab621d91c0571 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:975babf3db3833910fbee35579de3db1d09d3d7aaeedb3c70e8c9bcd2ea568a5 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_1_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_1_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..84bc2eb3b3dfc74f52fb2a721430fe057d86253b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c3339b20a3eb8b03e655eccd4c71e6ba8f1d5aa0eb9b32ccb67ea2682e7b8d +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_1_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_1_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..94966a0a0a17c6eaf89cbe2fe2116aecc59a82aa --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d716da8caff37ffa01f4e434dfbc22034129d0f49a997c1bc6f6c69adb5997b3 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_1_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_1_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..5aa96131c67f10e7224a60bcfa59816ab35a12ed --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9217444214b75c8802afdc56bf03fc4ce8bb9d13172881015bd44519fa280ab +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_1_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_1_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8f86d83bccc5f7450f75bdd1ee7a04c7ee1d7482 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39f42b44e2a48339ba94554030796eb9dfdb055cae74eacd966ed5f756f6d098 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_1_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_1_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2aadf8cfc74fdd59976f28992f34f58b8178803e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b840211542dfb321e43f17b079a5f4bc6802da409122e22a5b4af7e1574f9f1 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_1_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_1_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..de421b2c4c0c3d13a4cf8743f3d755b1c78a766c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:956d99d35b4c963dcee65cec0a975bde1c23edfee009e9e3c066de60cc412cb9 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_20_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_20_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8135d858a3f013e243dd65b5f9e62af2cc764666 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af7363c800f6a177a98fa25073948e9d479143be58c356dce3daceae442c4545 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_20_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_20_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..50536d265a7014fd86c44367dc5045ba31f64b5c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458bd2c8eb721ae10943044e454166fd811500e716f3256d9f6fae55e4a5f08c +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_20_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_20_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f5203a2318a5249194a350b1a8bd713f33f41b08 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcf6611eab27b99149297500f9dee64c9343617d95ad3a6a7f843cc3ce562f3d +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_20_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_20_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..1765fc749afea5037e466b7ab19fa4dd0f362803 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bdfe38145bf018a0b79df426844804d31d9b3a3aea58d7e920885ff3be04f0d +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_20_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_20_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..7e543c013be58200bfa3e17f4ecda4c33751114c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:094eb7a287161b67e7318fa328067f60a88b7bbc5066e77bb99b3c98208e5933 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_21_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_21_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b517621a67e9151cef597b5353b1f608f0f8f408 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67f9db4a8be96bfc20aeb4979a52502676d315b972a64fe44eae45f9acef78ee +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_21_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_21_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..cf58cf9d7112139878bdf21d99a1e389d5cb8ae7 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b17abbb306974e5c22c043fe331150bb49fa7d6c7ba28684474cc7381e1916c9 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_21_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_21_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0bdebd96722465956c5844dce5acbfadac38fbdb --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0cfea9a015f80f2018779b1f02906abcf198292712dd5196192cd915307c5ea +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_21_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_21_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..82a4b6fed529fed2d3371fa825fdccac4f9407b5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ed10387b2b34000e10688968b61dc8b86035631be642e154d37bf79b59612cd +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_22_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_22_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..5072104cb8c8af04c47b2e2aeb16dce9d11815f5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6f64ea2e7f1ef4145e95797e5c8c5b5bee0cb3accf287aef2e1b5bfc6d274e0 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_22_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_22_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..4204ff55db586bd37297e111eecd467a12ef611a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e32560eaa59093738da1575a1ab1a203d2b838ae97cc512a36295e5285d1cec +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_22_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_22_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..ce2e8ea857e30e33124eab066f6c7321b5e60f49 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1dca1ba0a5cb36cd0bb2ea9b88565670fdac53e6f30ca3c875fea8e80855672 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_22_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_22_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..7a9cb1ee6b1f5073d3f7c7130f6479a169cee63f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f12f23d8d6d0c2c44f0170ca34641b1bb1a784e8e8d699cfaf749b828c8a75f +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_22_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_22_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b8598f0cedf3a46ca7cb506aeb2f18d04c08124d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2083b5c30e6c3c035497b7cfeb39714094f667129090b141d8084e6e62373164 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_23_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_23_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a8447a9b76b7f5bdefd0f39b1b6f653577770cc6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b70f5bf8fac60b640b2187c52a3cc65377b60213f2ded71f7850dc10cb8833b5 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_23_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_23_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..59955295f8d19e7792d6e49929bf0c752db430a2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0c8e2c052642dafb74006d3da57a94d9c9306028092145c986bcdf6e65c0541 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_23_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_23_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f755176f14afa24649fb76da2ea117fe615e6b67 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6cb569e20f1555b53eb4f53cf178913a51059973af6308e88e80d7fbc73d669 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_23_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_23_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..af01bd1b7129e4301da091fb32eb94fce20dd003 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41c10380b5de0093221d08675e259c28cad81266bbbcbb736b89a8284519938e +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_23_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_23_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..63a0fdb8c37d0945ad9a23d8d46f65833d132000 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9e3eb0b3ef5dc861104355108845c92a28a0253ed0ed5ded043fe629532c0e2 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_23_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_23_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..7ebe3dfdce8f75e248455db2189605de4c9d7896 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8354d32606026400a258bf43dbfdf82ee2ac7f9c0d5a8cd0b6e0efd49f0bf4 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_23_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_23_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..5e508698117a45273b8a1f8ddcfd62269b5dbc1f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079b48477093e8d42ce59fdda76b74e942872651405aeb40543003fb13394367 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_24_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_24_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..bc73128592a188c15f4800708f69e6ae5b4f6d36 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf43c44b7c6a93ebdf06025d6e2fc92baf4f02de05678319d71bb4c8261c9e5f +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_24_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_24_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a7923c4a6ec06e88ebce4f46affa32659db34353 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:917ad69fe591df0d61ab6a3c3c9c91b1c16509bf193221231f2bfd5f9ba83b0c +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_24_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_24_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ffaa28dc9ab803b20e66d7102cedc75f43942153 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1033fd6f19f25c974c1edc3094999f5a68bcaef38eb10288e7b52fded6ac555 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_24_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_24_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..8c668dc785bd1613643c1fe059f0b215f5231342 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df3f5fb5f18626d9e31c194e849a315a5466984f5e38001d7999298b05bfcd98 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_24_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_24_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..fa57406dc931bc2ecdf8c290430392e9d83dcb31 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49d2a2b29f9a4ff50445a9d8a2328151034e572c79b4cdf7ddc3391efa2fd629 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_25_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_25_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d3a0d5fc2bd4f4626b4d91b20a2d091c904aedd0 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b1248f7ae916e465e6f7b614c96457dde91ed3a9849eaf408441ffa786020d9 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_25_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_25_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..e6eaaae60ee6e97e940e76f611518a83a9c030fd --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ab252185f13d07836a91840e485a5148681672bbda4f52eca83690ff5840870 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_25_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_25_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3944c7e60afde5a182901b1032f7cb144ec2307f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f40d9c3a820036b2e30e283cc66f0bb9d88455470f090be75fe62ac32b81eb3 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_25_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_25_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..6cd8bd5ca4cb294f398555128b1151891c9c2b8f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f80a9658a6bb679459062a149b5a3dfa8e1a9bca3455251acf204080f5e194 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_25_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_25_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..519355e79a3a719a611ef3e56bf202a63bf74ab8 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83e2707f68c209c2988fa2575a2cce0a1b1f9dd244befff2cd27614facc5861a +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_26_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_26_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..64f0267c413f0c28a7bb5190de6e2acac73c7a34 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d7c69beaabf963accf416811ac15fd7ab02c12ee30d0ec617e6ff43ea18d1a1 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_26_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_26_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d542e5d996fd3f7b64ad99ae988befde3a34d9d5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa4445b537b927b1f206ca34ae5e51dfaf6eb2ae1c580114c7e2da40376d26ae +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_26_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_26_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9b55a4914f4d8071df9f3220ffd98f8cf08b2d4b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9b82faf6ffa49a954c8bf6379d67191815f78e2eea92d8a62323ed399d7da8f +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_26_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_26_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d9beaef21805639473dd974762c10dc0f8476c17 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55b9f571110465a12717ab2f82ed12f69bf0c5b53867ba5a6d083f0d3be8f437 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_26_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_26_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..e4cbe305734384b3865e8edef92a2cb131aeb3fe --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0307b4c459f47f2573f766b26383b094975634fc64d00a697c1db727c75e4827 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_26_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_26_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..10579c617f4ea396165772e435940ef23d87d134 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e60724223092b76de922de5ca1a4e2034d53930fc777a7e95d828dc5b907520c +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_28_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_28_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..54f06e2532210ef9857a5041996cfd2fcc339485 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f05f4260920980a6f22639b100d67efd2194b6498d61672bccf4f743c158a236 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_28_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_28_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..4890e90586b27a1a417d290a5865d82ff0c856ea --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:890b9044dfd4262862b7c0fe60e3e46cf5735696edc3ca33803702810f2667f1 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_28_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_28_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c2fff349d4ff296fe865181a94c9c6d26d01ba4a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97503f2f66bb4e4be9b62d64708c8b96c4236bc563b481a60085ab0c5002d680 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_28_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_28_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a4bd96df0df8c35dae34844cb07fe2c1edd62de2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d420894af04098d2be57bfabd1bbb9bcc9c546165b667dfe859714c6c4b42925 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_28_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_28_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ff6490764d57c7e087a16409f223bff6c7810d78 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b702cedf49a84f6603fd9624253f6c8687bd61408631d3f2d1af5040aedbdc +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_28_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_28_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..233fc05c95eba9661853bc9c176269f2726ecd26 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d249642f5bcfd53ca811bf2238214e62a7794d708db2d56d53efcfb8293e044 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_29_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_29_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..dc04b02e96920e535ac6f7c228e4a3037e0676ef --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa1a0ba11c7bcd1d0861c78f323e46b9df7d2e73bcc43a36d391f1daff88200b +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_29_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_29_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..41790dfc027949e638815b2e752aabcbe4ea2d43 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c7ac4a3647d44475507e3f912003c947e2808a107a44be3effb5b8560c64a1 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_29_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_29_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..46268a4fcd65c0788ccbaea942b6276e294d2d70 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e411d1928563e2774c29d7b1f029cf7b561826b825e91d7fc4f1afc99e7247a +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_29_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_29_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..75458b4ce69786b9c9eae0dbc05de52bac26ccc1 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c80439f16f37e1c124678a3a5f0cb11e5036ad56c6d213a8c701a3bbe27f49 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_29_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_29_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..1f40542c847be12e1f0a4120b515b1585074016c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5afc839754db98d53b1be93aa397b9eb273c8d8fcba70d30fcf097b39251f34 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_2_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_2_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d0ada83df03e3b6108e9e45e13c8b69a80320a2e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5853fa880c54845d4d3ccbcc260aef00085c33c893a061b4d6280fa323ebc0a +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_2_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_2_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9aae9b033cb671f5819b3d5aeb18be59274a6f82 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1d699490cc2cb945494748136197f83a2f82e28d55b47b92bdd1d93452accba +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_30_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_30_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f5597d2dd957634cf3c042cb0d7b189cbf6b8891 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f0f51acdbbaa7a6d30a0a9e48a7a0ae63b568e823b34a6a1ee2bc370e0122ae +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_30_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_30_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..6f83807de40aba8700e70c3bf6c419e041539e19 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:859e3ab0eb056167f305519509bcec3e9e6d160f8dbbfde895d49303d92fd355 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_30_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_30_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9d43a43332ddae2928566ce41b33fa7f15f3fdff --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:488c7f5a1ce2f47575d9018bfed3702402d14d1d61d8627c29cf4dc7e9e162f3 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_30_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_30_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..339fd0627af34e01fa0e987b39361fc96ea6fce7 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ce9724323c3e5d2e78843e6140fa94eadd6f9cbe27b72df2d82285233611060 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_30_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_30_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9db0116478bdb2af71a1adfdd81aa6398394aa55 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:722157872892c3e48193567351a00eb8c5d76cc86f7a28649d68044361396bf2 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_30_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_30_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..4c0a440de5841ade928bba83b442a5f3d6521412 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb4e291104cc20b43f441f8527d51cbc643596d3df8c0ef3a5efb106de5d615 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_31_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_31_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..11a04f49c00e85fcdbc091d85451bdd8d11c5ba3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c24dcc57b359dcc28d27ce9c1b95342c0f757572251aaf39e659182a0aed41 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_31_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_31_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..e2745788d50a8a2e858e5cf897cf3f507f6e0187 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2515b861ce5b0184bcd36255ece5e671dc1fba100a0291ae318516d595d6b098 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_31_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_31_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c6fdc05657af286eee9c25f06a7b0b9eb478143c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93821dbed63e8a76f9506d60720fa25784ad20762531ac10d0689badebf3e191 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_32_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_32_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3f66827710efca3fb39c75cb8c8be5b523df38d6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4dde2339e08a3ba830d4b04589cb1e33c23961660a8541300617be38e6e6c2 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_32_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_32_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..5dffae7ee2f7d55895ff439f49096205622e83be --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134cb22bd1d93d64b4f1b10a6851ffc04b8b48d02428804eec7e22da28d92241 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_32_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_32_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..7decc12611f8e6431db3599eb86dfe46dec77b56 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c9a7452028847e74349942e22f9d220d13968319f936be57290d9404cb2693d +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_32_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_32_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..eee6cd1da4449bee7ed9e40ee498832d6dc4570b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:053b39a8d4241be654a56a5af1cd0504907ca6f08846e29d456954963dec99ae +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_32_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_32_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..91535110b4827114aa9229b071ed8b1b5f809166 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a059a9bb26ae1b503912ae7288147c04b5b3dd12b64e102d12260e1b91c093d +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_32_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_32_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a23f84fd0768762f2f834763da6d4fa365071288 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c318f1779ee56851f520e02784b85b77ba1d2d0097d95410f59038a00be12b6 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_32_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_32_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..65dd34b0a6c355917fc1cf16e538361005d50cef --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8152e9ac3ba4567ca568435501ae9168e9b545255d99ea83ac6a422b8ff17a4 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_33_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_33_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..58bbe7b344648f935f23a2b53d66aa0cec4aae40 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7adf83d34b507768708da874a413c9f090da546cb434b9d2723a9db79150b47a +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_33_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_33_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0f04a4da42ee87f10823cd708116a8b16bc8153f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beef13ee4a201bec404d3047a8a6de0b537b9cecaab29bbf6e410cb0b23587a0 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_33_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_33_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..3713637886d86a6383b04ffbc0dba1394a92d6fa --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:421f4e6644414c78a39d156d0f3b65115ec9fe5cdbec0cc54652bee4a346add2 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_34_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_34_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..118b22ca14d0af957eb85b9d369223ab184aecc7 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf96c704189cad4f9e15fab998c55f103be9f986e58975f0b4a818ac5acec585 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_34_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_34_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..9fc660731bd34e0abeb562e1b7bac153224426b0 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e19e501dfa9a925a8e1f8b0def4c898f588db4bc6db6d608628d1d86e67f0437 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_34_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_34_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..bdb61e375145f3dd13e027d790fa4e0af24c991b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edb49daf0f1f93d5e36a845d9475497bf5261e787d83779c3872ab61e5125887 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_34_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_34_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..6ca0509387c2ab965b1c4578207cfad8dc29e9d2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c69ceafdacea70e5406659108ca34bf4c3ad0ef4856d9a7783f9bb952d53930 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_35_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_35_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b5bc332fe07e3d4f3ba864a852ad8bce0c074515 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17185a36603c84fcafd11d308b634ad39dbf5123f9b2770cf21fe9e7d818e564 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_35_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_35_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f85ab5fa44e7f2e17749e72a71f7ec55963b201f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05c694f7e913d5d4d02b19b98d6135a51a0c7bd9182aa9a5e386a9694a37eb94 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_35_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_35_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2191a943d8f5b263e397e62f6f08b15f6bd35946 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b124f3fd0b79e003865f193a6f4539d8cde1a6d815d61e1a0a08c4ce6911e6 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_35_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_35_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..5a3c21e305b58b898302929c19793cdabb421f90 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95b6526a4aa9450c08656d8969c57ec6f85c2171caa915304f9877eb7888529c +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_35_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_35_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..59d5260d2400ee7a6d391a1fc5fb38a56c98d695 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71c7d90439a3a4bd590b6f5443143b0a5c0d6accd628a257afa2cfb65decc706 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_3_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_3_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..35ced123c5ca0e7b318430451a86941d5a7f9801 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d05be2845aa8b454821c0eae7fbfaf18a4c898923ab6984e0ced8bcc36b7b8 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_3_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_3_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c4d19aab20cadffe0c9c65ae24725c2626bc82ae --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d287b6b2cc2cd8c72c71c362f6751b617b7b734cee4ec226ddfe96653fe0397e +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_3_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_3_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..fcd5c407f2b2575789fda2c983d206575812e736 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:845fc00d92ca43e1ba1fb2c1dd6ab931751750fe00ab400ac0ab33b57317b0ff +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_3_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_3_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8aeffd8b00b24dc8fef1c26f9714904a1c74bab5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b947bf535bedeb1b4f307edd3fef02a39fccc430ea749683006f9996f0e9da18 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_3_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_3_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a41981944fd2b4d455c6115d0966e323f3ab1281 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df791cfff1b02b86e887ec69699855b39b6995fd5735462ec901fe014fa5107b +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_4_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_4_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..babb8bfa31b98d64d6782a5be82d0356498c155e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eeec926887dcdcbbf005a89d8e68ab791eb263a46718cd7ef78fe411c4ff081 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_4_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_4_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..397970f6f61875adc95b048fcbd45078d2082d74 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c60ddb06c1d19cf2f9784e98612855987c767a9d453aa41e23d077ddcc600564 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_4_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_4_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..289d350e4f6fd516b829b5df61c2edc3c27e7a1e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:665d9904f097430342f88309ab63bbdf9c485fb2e6890b246a941235a61ce75d +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_5_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_5_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..79d1a087383607c12b41d3c08c115c615ff8e273 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6cf091a2eaeb78b3fd6d7c00362daa7a45eb710f056d4cd7387c06c3ddb8dda +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_5_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_5_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ca2313f387a1749e4780b4082c2e5267b146833a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd1290eca049ef78bad9357bfe461df4817c606db786bec4f16cb3846c49d00 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_6_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_6_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..0e113cfaf2d63821cf5d8e518abde356fffa4228 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7bb4901143c10c4d97dcf3c2535c40d8beca62657b56d955528f5552393fdec +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_6_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_6_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..cfa5f9cabde07da580e00dc81874aadde74bf460 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:270aaf42cabcd617461d25b87c8957431181cb0fda7d2e194a95e54dbe8f5332 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_6_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_6_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..9f8f4b93f28aafe34e9266650e77c95b731a826b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2b2297fc6f52060ffb599127e643e96f694cbdc98d0d70edbe876c7a92197df +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_6_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_6_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d998b332f6b13d0aa3378b3321f873f63814b961 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9daf5982ad731539a0232d787050606c7042d09d6a6f30c47dcc3a3fa8fcf84 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_6_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_6_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..3c78743c2eeceec58d2aed29079264058f7feb75 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf5e680a98127fe2c3a318e7c1b3019644b15e6ad6c6a580bf4cbe6984cf0003 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_7_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_7_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..dd1dcea27b352ddb95fcbb595b1ef8ffe05c6f37 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fa5cc13ba884641f8108a1c1be9833247d0390a8b8dd44e29434923fb1c123d +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_7_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_7_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d74e6422166174f3e01eaeacff18fefaabe6469a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb69255f06c83cf59330a2e54b926cb8329d3ba4e9a2bef59fecb42e38ccffdc +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_7_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_7_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f02923cf2351713ffad3cca1134fb6ff839b764e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b2e63f629f94633594f298db2247b64ebdbf6e1e48109b3b7324339fbd38b14 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_7_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_7_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..65468d9193c75617a437dbe7c6bf92e46ba163c4 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66fc280da57ebff409d9fbc33be4afaccd3c17612aee885dca2f5a8bcd8ef8ee +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_7_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_7_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..cd43bb2df1330f21744e6bb6c3c4b4532529912e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca6add92a9eec2086075bbff9c7e5765b537772f2422036fb8c640e288896e4 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_7_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_7_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..65dce34c981bbf5458f38de5f0e73f6c8468d3fc --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c7bbbe6337617f82ec00dede81dc6c3764f433837c973375b0d0664192a1f65 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_7_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_7_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..fde2f2fbd226d2eee277060cd80adba85ec57d48 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19df0b025c10a62a31689c569e121b09344805c1bbac63355d7a5fae81c27c3e +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_7_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_7_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..53699d0a45d9c01a0cbccac96ab3c843cd187a0c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36ecd6642feb15b7f7b403d3bf7716b68fdb2052db2072d85730bfd2d5c99200 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_8_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_8_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..e72fabbd12d617cf569fe74f75482262d39c7f9f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7070733c978bbe6dbb00331e74c084eed5cd1a74212c8db07e10377ec644246e +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_8_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_8_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..62442ed40a14d6b294e5a5c039a8df3aa09d30ce --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51c3fc49740f309fdff293e9dd157443d39fe8c50af264048d978c6dd2b56ac4 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_8_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_8_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..678b5846bff0b9bfd5e5932a04104fb473947540 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f8ffeadd1ca88733bb7ff428f1b72345fdf169383c07e26d48a3813d095e3d +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_8_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_8_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0688a68a29379d1960ce2cf64357736816a14868 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9691d58bf61e2a3a9c5cfa2668650ece166f941ea2365fa3fc08cd93b0958bbc +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_8_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_8_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..71ac7025f6199d4f16a8ee47b6d0c5c1bad8eb8a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:313c85ee28363e9a56c3c1a7e600c1cd7660e77fab83a7537acd00d726aa4c97 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_8_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_8_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..218bd734eabe4bac49226bc5d7c7c3c14f472c54 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c052257035ddfd6236197bc41ccf55219d72297890c526f48dc98eaabd79df1 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_8_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_8_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d17e3922907f7ea6bb1c48fa87697fca742856c3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca4555ea85035d4cfe76ce3b5e83ae9458c12c3f6ddec3a11295c9d2574e46fd +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_9_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_9_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..127cd74636c5bbcb4743371bdea6ffa7ab1428e0 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08807c7088cf4be9516ad590d1f6e960101281660acc04a6b2298a14ffcff9b9 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_9_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_9_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..e77011c59df476e65b44825f83b7bbb0755fcf5f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cefa8319ba9756fbccdd79a316f255e46f2fabcd8a4fd060d31e46196dea0e4f +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_9_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_9_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0a18acfdb73302c32510b9bd32595e270d50cd5c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e26270677ce57df024821faadbd6f24ace96fc46b10946ef8cd3881c23ec7db3 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_9_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_9_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..73e8336a778be40274bf24d03d808149d1d93cda --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dd941b744b1ebac8e08618628f969053d32172206c504d9ff507c8e16a4c16c +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_9_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_9_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..8fdde23646a6d358674e21076093be957052e705 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d7d15dc467cac43a4bc0cba83048aa08595b7523b5fbbf26c94e8c9c48dd3b4 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_9_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_9_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..35ce785c20d6595612253c94712df4205f1235dc --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:574733d0ac96ef042a2ac3d7a369aed26ab9ee1722641b0d8bb6b89da26e3fdb +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_9_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_9_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..61302332dce26da955e1cb7007d7decaed2d2b57 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d4867fd1cfdb8855653e3a655408453d001e6ea33e9d23695b4c198bc87cd7 +size 1310720 diff --git a/qwen3-4b-log5-unary/tokenizer.json b/qwen3-4b-log5-unary/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/qwen3-4b-log5-unary/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654