diff --git a/.gitattributes b/.gitattributes index 154dc814f1d76d215cd8f1e23a48dad24d323e4b..5c4afd7258970e0d19244a833a39029e96acc76a 100644 --- a/.gitattributes +++ b/.gitattributes @@ -797,3 +797,403 @@ deepseek-r1-1.5b-unary4/model_layers_4_self_attn_k_proj_weight.planes filter=lfs deepseek-r1-1.5b-unary4/model_layers_9_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text deepseek-r1-1.5b-unary4/model_layers_13_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text deepseek-r1-1.5b-unary4/model_layers_10_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-unary4/model_embed_tokens_weight.fp16 filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_35_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_15_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_9_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_13_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_10_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_4_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_26_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_28_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_6_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_18_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_31_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_8_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_22_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_17_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_32_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_29_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_11_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_24_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_14_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_33_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_12_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_1_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_20_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_23_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_21_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_34_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_2_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_25_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_5_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_0_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_7_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_30_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_3_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_16_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_19_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_10_self_attn_q_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log5-unary/model_layers_27_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_18_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_11_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_5_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_25_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_17_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_5_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_18_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_11_mlp_gate_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_17_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_17_mlp_up_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_25_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_21_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_6_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_2_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_6_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_0_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_23_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_20_mlp_up_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_4_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_0_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_13_self_attn_q_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_10_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_24_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_21_mlp_gate_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_9_mlp_up_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_0_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_9_self_attn_o_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_20_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_22_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_14_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_15_mlp_gate_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_8_self_attn_o_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_4_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_26_mlp_up_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_6_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_15_self_attn_o_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_11_self_attn_q_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_3_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_11_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_9_self_attn_q_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_16_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_7_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_21_self_attn_o_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_20_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_8_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_18_self_attn_q_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_18_mlp_up_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_14_mlp_gate_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_11_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_7_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_7_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_19_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_7_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_17_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_21_mlp_down_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_0_mlp_gate_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_21_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_26_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_10_self_attn_o_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_19_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_19_mlp_up_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_18_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_0_mlp_down_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_9_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_4_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_25_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_9_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_8_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_21_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_7_mlp_gate_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_1_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_23_mlp_down_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_13_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_13_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_6_self_attn_o_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_10_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_10_mlp_gate_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_24_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_9_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-gunary/model_layers_20_self_attn_o_proj_weight.gscales filter=lfs diff=lfs merge=lfs -text diff --git a/deepseek-r1-1.5b-gunary/model_layers_0_mlp_down_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_0_mlp_down_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..87453d6073dd140c9cb1fe7be413b4035a9817c6 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_0_mlp_down_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54f62786480e272b2ed469c552ac304aabbb598108c825d9c9665c7e86777a47 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_0_mlp_down_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_0_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c75e9f7883463882c7fed4e8c9b3f7d130cfe90e --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_0_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b49338069c9db0f188c0b6e9b2a9bbb1c3ee94d02d186706f7d297872e2711a7 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_0_mlp_gate_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_0_mlp_gate_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..80900e8f104c2f71522508a35b545314a0e0ea2a --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_0_mlp_gate_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a83d28ebe8f492a9158ad1a8a133f5d0e1017c690263f563f08bde04eee9c5db +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_0_mlp_up_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_0_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..de391abdcf44e3c13042a96ec501f829aaa3e1e3 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_0_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d9bdf4d1234bacc928a5c169b655f1e1164b25526040091ab94f650804ea66 +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_0_self_attn_q_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_0_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..e773326e4ea0d075505e655752ac141a0cbf12b5 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_0_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556096531abd03fc5e5f04c6d35b923f99fa220b279f136aea4b8d2af372d579 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_10_mlp_gate_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_10_mlp_gate_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..f7c74df4fbb4f7c9fec48ad9b4f1f64d0969e161 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_10_mlp_gate_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e19a35ef06acc8f5d6566c9af77f3dc578890077dd464f46252b7e812f3217c +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_10_mlp_gate_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_10_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..9a8f223f9fe8fc9869aed75a9dfd41594096bf16 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_10_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16a44f8cc78acaecf3ce04f9c82ae74c8b981ec9c16ab2fc83b53d970cd02d12 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_10_self_attn_k_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_10_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..19c6d7af6824fda4ed8fa35343d47ec0d92ab2de --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_10_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd02eeb3ca3e5e87712fc9a0ab22f0776fc4725b77740493499225d54b5cfb20 +size 344064 diff --git a/deepseek-r1-1.5b-gunary/model_layers_10_self_attn_o_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_10_self_attn_o_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..3a58b4e6aeab7bbf001662b87e0e720504e343d4 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_10_self_attn_o_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10efc6f355c61758546a025d5224854654a26a7dc025d2b3223619b5fd6d9437 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_10_self_attn_q_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_10_self_attn_q_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..c1ba2a266093baf14284e1900185bf4d0431bb12 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_10_self_attn_q_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c07a7242f454596ef980d3a493b09e0256f3be1b1eeac073ab967d339067ff0 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_11_mlp_down_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_11_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a65480de952c184e7a9a22de583530907a8908ae --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_11_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4847d5317087ec5fb48fcbdeed53f33406317164757b57579921c853d4952e9 +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_11_mlp_gate_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_11_mlp_gate_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..dbeb26407843a6d3bf541463241d952837f6b001 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_11_mlp_gate_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89dcf3fc7b962c525fae4ef008d366bc49a3e047009ba22d3dc43c9a6b84d2fb +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_11_mlp_gate_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_11_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..6628c1f67883634eb114bd647c6a0c8e7aa39b50 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_11_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e806a7cf129ba583e070b3b130586dc8817867227eddc8244a38a4c322dea96 +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_11_self_attn_o_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_11_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..94d06d71fc7ac345e79209a753def677bf0753b8 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_11_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5fa0b967ed7ef8ab6e68611ceff0a2509fb8bf9844ea315d628572265e3ba4c +size 2064384 diff --git a/deepseek-r1-1.5b-gunary/model_layers_11_self_attn_q_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_11_self_attn_q_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..6bc7118ed1f518d76aba90eceeff85ca4b7b16e7 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_11_self_attn_q_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b78534d997cae0ee012f47a780c4ec9731aa9e9967f59d53292b783ece5fa8 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_13_self_attn_o_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_13_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9dfa0a259861dbfeb4b7d70a89660771a18b84e5 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_13_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e9369d1267c574eb177b974c5234e1036cb2cf6a6192440c5c9e91da45d08a4 +size 2064384 diff --git a/deepseek-r1-1.5b-gunary/model_layers_13_self_attn_q_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_13_self_attn_q_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..596a1958f2725536b44c3c35b00a65e94c39f7c3 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_13_self_attn_q_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9183bd87e537d7e24397454092cb24f0ca9f0380d67a80781b46e8fe64b8bf6e +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_13_self_attn_q_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_13_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..68521e8c93bf651fd7a829721cbb52c9e02530d2 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_13_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f77567267cb678b75a75436084cd6345d32a1fefcadc4ae5a11f4b7908598bec +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_14_mlp_down_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_14_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..725ecc2605289a94d5b8c783454aca5d6c2d49a3 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_14_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb5c8ca87dbd7b70c965623a171e81db5514b89442c6ae3028faf3677ce51ce +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_14_mlp_gate_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_14_mlp_gate_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..df4f7e6ec026d879eb2f6b6bcab7869c3be8053b --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_14_mlp_gate_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea2f382a9a3eb87a5a14022d6247e27552a29c02f980844bad68847a20347ad6 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..f430f5063526895b05885a5824816cc3450a1bb4 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3636d54b40e62d0ae2d034aa949568ce9b86c7ad14daa17a771f65bf37d76093 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..fbad38bba12783704a7250f383f9306c3384a072 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f24fab77596535c98d31e186283ab317b45b4f01121b254bea3ce96c420cf9 +size 2064384 diff --git a/deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..fd6f2e7c532aa5f7ef590882bf23f97b9e76e091 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_14_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1d71717a33bae43b6cc287107fa866ebf2d3a053742a709381035b2c234a66 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_15_mlp_gate_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_15_mlp_gate_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..878f92470c29625133841d0af6fa1424bd2b773e --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_15_mlp_gate_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3d299280e2d994f2ccbc488be50f2c21ce6eb92acec7dcc45fcb9bf1d3614a2 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_15_self_attn_o_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_15_self_attn_o_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..13e85ef324237669a716053c37ccf3d79b11ce57 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_15_self_attn_o_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:664e41309d4c02a6256a3195cee51f805bbd8e0cd402a128a56f1f4e889d1ed8 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_16_mlp_down_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_16_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..e9c6856c4dcac742c0d31a6003b89b355c3f9f6f --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_16_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd675b7630cc6905107d8978b6875c50f17c3adaa2d32eaa0df8506d25d1a297 +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_17_mlp_down_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_17_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..cfbac62157520b0d2dc1cd7890d4af078574d9b0 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_17_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e91a1d6f385ad3d88d5e5c53ecf35b89889bf5c3ec372d052f9c744ff2df5150 +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_17_mlp_down_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_17_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..445b38859aa91dfee64aa73b4e2e49cba18fef7f --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_17_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65b662b9a71e1c30f54e9781190dc2c4847527cdecdb022b85b3909d2b4c11cb +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_17_mlp_up_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_17_mlp_up_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..c6fbed06c38ddaee1e7fc163c99e1dd208224c5e --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_17_mlp_up_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c60b2568946e4917be427453919b81ab9eb10d065e3c629a2fe71512fedaf0c +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_17_self_attn_o_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_17_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c8412571cdf7c7d7a235d8e4e1e77ac4c5277398 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_17_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7057ab1398767efb88fd1695756e64064a78d4fb909c74dde10113e98ea3961 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_18_mlp_gate_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_18_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3a7e4174524872129dd9b1f87493b0021bec5ccf --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_18_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8da4270e466c8d0be4527cc144f503fb296a5a5707d1049a1f5ebba2fa5cdb10 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_18_mlp_up_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_18_mlp_up_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..c910895c83eab424dcfc294ce7f439513cc36d2b --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_18_mlp_up_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f6e603eba0d028243475143858f84f483936b40edb059f7591965180d43bf1 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_18_mlp_up_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_18_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b0f9725b406834a08492d7d164664fa27841b26a --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_18_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:043ea7daa9281049fa820608b120e4c985a3577629f4e72f6054edc745347496 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_18_self_attn_q_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_18_self_attn_q_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..dd3a65770aefe40c31505e2ab9a7993e0ed4ab9d --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_18_self_attn_q_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:734ce6777ce6133dcba5fbf6b3ac05bf3ff10d3a7c8abc153de7e1a0584c82e8 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_18_self_attn_v_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_18_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9845ac73274d3930a4f2e07b20b1a76e0b0bb8ce --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_18_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f655d7cdcf1060a1d2ae7f4ea253af59d082f45041a2bbd8071c384bbd18aec +size 344064 diff --git a/deepseek-r1-1.5b-gunary/model_layers_19_mlp_gate_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_19_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2c8f146dd4134ca79ede122829cfec78a5b8830a --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_19_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1571370b85679b6c52d3d6f2ef1b76f2dd7f801b28d65dc1e85b755243c36e6d +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_19_mlp_up_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_19_mlp_up_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..3981a0cf71e02c18e5c9ead08f62df4dd11eee17 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_19_mlp_up_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dc18786161e2b0c95165c34e2acbf2f29eba79e8e9168bcf6e9ce7b89113763 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_19_self_attn_o_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_19_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c234ac3cb907c459ee49cd19c9ed12b392cb4159 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_19_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1067f067d104241cc94d0b8e7bceb2cbdffb74c4d41fe6eb40a9bfb6f5267df5 +size 2064384 diff --git a/deepseek-r1-1.5b-gunary/model_layers_1_mlp_down_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_1_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..77d17809a9aecad59cb80b3a0a7a31da771b2d6a --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_1_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ff9bd22f2dd85190a685a281007fd84a676f2110e201f70c117f6c2a9fb750 +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_20_mlp_gate_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_20_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..cef86ab64aa7b196763c85cd8118cb6a6bdf2546 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_20_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12da43a0806d2e61f9672bcad20a1646733789929ee8c1f5cec83f638dd6cd36 +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_20_mlp_up_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_20_mlp_up_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..7fb1d533e88810329df8c7ed1242878f165c38d3 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_20_mlp_up_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a141b1fe1ce3804b212901c841b08c3ee808dd961b68ae62d0f76a20445476 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_20_self_attn_o_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_20_self_attn_o_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..04c9d5279d4849e22fe28d38f2e1f9881a9d6995 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_20_self_attn_o_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:995ee1315098be36de0cc245f5085ecab79c813b8966d152955b480c288f4d1d +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_20_self_attn_q_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_20_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..e224bf35fd7094304bae2f2701d7461fdf9d5e57 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_20_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6b42ce46e2be8289a439a9d67d24600d151efcc389e85a9a5c17f822130b4b8 +size 2064384 diff --git a/deepseek-r1-1.5b-gunary/model_layers_21_mlp_down_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_21_mlp_down_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..4b52fb38df20a2e37eb372cedc2b4889e0085313 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_21_mlp_down_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14201e8f76cba5255cd5b956e5eb8747f1ac83c323bdc1b4f0322ac3fae9e585 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_21_mlp_gate_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_21_mlp_gate_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..f0ffe94bccfafb4be6330cf984dd1324460fa3e0 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_21_mlp_gate_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4116492b8ccbf686d2709b6685c8317b39beb150ce05af974a1e8fea983a739f +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_k_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..cf53b108e3c7e5bf5d1df71c31992718f3659d42 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9ea82664a312ba18c7166b1ade4bb403ffc8b252f524cd4094c95a2185f5c68 +size 344064 diff --git a/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_o_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_o_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..e0d3e3b32fd26a430edc68c53c8677c5c5bd7cf5 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_o_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5fc7eda51e80d3d3939b986ade5fb1f06929284b02f2f92604c9669e5e63c3f +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_q_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..76a6dffe65dd11314ec5764d82aecad61358cf41 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2de5f2a6748bfae662d5f29cc9974111ade6445151f4ccf652d60c179f5d44f7 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_v_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..67a2aad129118039aa6108dce1bf55293744acd4 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_21_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9406e8c7ecd1697faf5397d877ecf33709c03ccdace67ec727695b389eff1534 +size 344064 diff --git a/deepseek-r1-1.5b-gunary/model_layers_22_self_attn_k_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_22_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..12054474ed3e36f94acc0ea12aacc54cbb8eea12 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_22_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abb931cde603a1c88e863eddbcfb16be978925184c7667f0a353d499616ce69d +size 344064 diff --git a/deepseek-r1-1.5b-gunary/model_layers_23_mlp_down_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_23_mlp_down_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..1094874bf0905fb4e1db2e11d4a44d9bad3e58a1 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_23_mlp_down_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e01aa28cdb162a3d9b8d0ad40928d044af22fd338c449cc8f781c5fc3deb140 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_23_self_attn_o_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_23_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..55a527bb3c1ecbbd996713b8b7b663867ebe5474 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_23_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b77a2daacf3897a92ae31cf0ce42214a146ac3839e2a21aa0ebcd531ca44d0a5 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_24_mlp_down_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_24_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ff17124f9d467c54aa4ed5a4ef9b19ac812661c4 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_24_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86cca1f83a0b656b5b9e895a32797309e95088fbac4b80be1b53df380e4c1b66 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_24_self_attn_q_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_24_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..518f97084ba09f73711e30ade60a688b71abf13c --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_24_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd1ac82464c0a75edcc0ce8d723d836f8cbbe2fb81e560f9474d53fd1e40309c +size 2064384 diff --git a/deepseek-r1-1.5b-gunary/model_layers_25_mlp_up_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_25_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d5df6541a4059cd7da98bea06897e6122409184a --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_25_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f7231670f203b05238c18395c088e64226d933b3456940936b9104e3aac63b0 +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_25_self_attn_k_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_25_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9139e9f02cec2cf7af2a81bf3657c138c1d3aee4 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_25_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad26bc1ae9f3077986b970497328e2537bfc2f9a06290dd310c5123423725a7e +size 344064 diff --git a/deepseek-r1-1.5b-gunary/model_layers_25_self_attn_o_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_25_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f3350f293dd64fa6cbdf4dcbfa94046d071ae82b --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_25_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:359c872bcc7db32a9cfdf8bf0ca87bbf1736638d5e2e5d9082070e81d799c895 +size 2064384 diff --git a/deepseek-r1-1.5b-gunary/model_layers_26_mlp_up_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_26_mlp_up_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..9a74396d3afa89bc30c97d276e22a204833dd9b0 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_26_mlp_up_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d2108af41e4058a7ed998a4b4e5a08fafae9a8781006d1f298fffb37dde583 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_26_self_attn_q_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_26_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..efa6edd3a260dfde31f724e0b24f794570a0edcf --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_26_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64cd45387e12da3c6e36de138ee43d14b376ff1d9e29a5c578423ced5d588610 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_2_self_attn_o_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_2_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..dedc1ef084d019c2871fabc2d811b83990c74081 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_2_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b68e9039d9c4eac2bc530a3c6f30ec6b4bef42514ad763d6426927b5ef6245d +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_3_mlp_gate_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_3_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a8a4a34f4627de28681a7ef6baf444341add0356 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_3_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f770399800a7dd1df24cc413f67013848e44dd3c181d48d80aaa11dc45202a +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_4_mlp_up_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_4_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a8bc0f269ddef0422a3f525f4b5e2d5abed07ec9 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_4_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b418a31387b4199af39531cf39431d134b925dfec9085f195feb9bfcabca215e +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_4_self_attn_o_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_4_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..53d40d08f72ebf332c483a3503645e19b1881f60 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_4_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c9536e031168e8705f706b0ec2d553e9096613648ca8c324b3123192b9058b7 +size 2064384 diff --git a/deepseek-r1-1.5b-gunary/model_layers_4_self_attn_v_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_4_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..88293f8724db207f87e65fa02322f4f83cf4a899 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_4_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8c2df493173edfe638dcb0a731a8cd9f5e46811ece8066200e62177ddd289f3 +size 344064 diff --git a/deepseek-r1-1.5b-gunary/model_layers_5_self_attn_k_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_5_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d0e487e200211ab2048b056e6d523ec5ac2c0eb7 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_5_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:361ec6bf5ba2ca5034457b7b5ed917a82d2188c05936faa33f18417ecfbb2ae4 +size 344064 diff --git a/deepseek-r1-1.5b-gunary/model_layers_5_self_attn_o_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_5_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..4713697103e199d6d1764fedd842080e3feecd59 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_5_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c011f8749c3f0375bfdeacd01cc0543cc143243520ad81a832540af962e82e5 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_6_mlp_up_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_6_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9bc0ee27d9beea997f7bee185bd1f1be441b24d2 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_6_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92cf632baf0054d1818120a76eff0e053874d3a1731a0b4707928288fdda8dae +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_6_mlp_up_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_6_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..4efa1ba0a0818418d8100943433e79f8532e40ea --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_6_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d33709c502641f073aa35f245dbf6d0cf1476003e40b205adf392cc2850e22 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_6_self_attn_k_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_6_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..37b44be713e249cba5b8077816ad96d2417ccee7 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_6_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a22d5a8f2e90b90c1aa441c76a117877f7fd68b5dc838b0460099aa65e669130 +size 344064 diff --git a/deepseek-r1-1.5b-gunary/model_layers_6_self_attn_o_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_6_self_attn_o_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..5e5bc53d7fff1c2ef77db080b7ba6848c53acfd0 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_6_self_attn_o_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6894fc15b596ac313b3d4e207f5c03d14c912406607a8402bcdd401888b13e26 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_7_mlp_down_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_7_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f2bc88d3ecc168172d9815944b90a249f1f3a15c --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_7_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087599244f33e6fd7a31116288b6b30df58d20c8976398a921c514a79c77a640 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_7_mlp_gate_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_7_mlp_gate_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..d792e8347367b0dd267f80740272825bd8832190 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_7_mlp_gate_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49d4aa2850779cbc7e6609a8f36793e7ffd914455cfedeaa6079d5fe35ff7093 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_7_mlp_gate_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_7_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d18791cd1d7deff3a55b2a6f070d468dd27e44f9 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_7_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8902346d42372d9522a6c4ae40a380c6efaec66e66c02d1e4b435d07b97a0358 +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_7_self_attn_q_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_7_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..e4317211761b1e83b5112d19e59467e8a51bd1c3 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_7_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f0f5174ef1e027e26b7f72c9decec1e1cd168ee0abdcede355593c9aa2d0955 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_7_self_attn_v_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_7_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..20af5bcf41f34d83911fb43595d298b4954a4285 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_7_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5194a42843ce15b8e8b150452858e2e409b1238c2ddfd8a0323fc563ad4ab541 +size 344064 diff --git a/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_k_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..0e54ec2f9bcf8a1b2d850d29a2bc47385e16627b --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c489bcd89b186ec072671d8f669c6527243b8e479d59677aa7879b7b456e459 +size 344064 diff --git a/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_o_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_o_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..01ef0ffe01818056d84b219f5ad9fdc1ff53c852 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_o_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ebe48f0589cf5ac68b70644c4dfc595b8c487ebffcf30d718223b51d22a29c6 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_o_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..23166f78fc7398891dc4b7a225fb238bf2c1a4c1 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a8181b7d57154cadb33048e837aac7f6e569635e65c142365c909cb3675662d +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_9_mlp_down_proj_weight.planes b/deepseek-r1-1.5b-gunary/model_layers_9_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8cee4c250c1da35f00d1b3b881e08cb611892a94 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_9_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d3116650c6f3eb1bd55e39fb9107702ff5f09623059e98b187ce20f43dbd7ff +size 12042240 diff --git a/deepseek-r1-1.5b-gunary/model_layers_9_mlp_up_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_9_mlp_up_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..dbee9d83848433213ed68b46190833df4db282f2 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_9_mlp_up_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53426d4814c82790c5b5e3d77d06d4cbfbae5f0eb0f9107c5a9712f0cb59368b +size 1720320 diff --git a/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_o_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_o_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..5f616be50cc52397840d6c171339b67716e67373 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_o_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b78ff53ef1785c8ef630ade597c5fe6b976b38201b284fb4666df16e40b0d318 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_o_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..7779f95a229a2f7df437f13048d611beca13a501 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:086eb2f7afe654b0dc8994b401a412e911b5a95214c23afcb78fca520086e017 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_q_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_q_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..1d664feb5bdd3e9e76498511a703c303da181709 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_q_proj_weight.gscales @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f62191e551d819a65176c350b2de012d257e5fa31da3ac84973707b595171fa2 +size 294912 diff --git a/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_q_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..df93509d64067043b6f37b652ff5aae9ef8f6ca9 --- /dev/null +++ b/deepseek-r1-1.5b-gunary/model_layers_9_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46b073e52123219e49d4c0d15a9a4f5f075c5d9d8d6171ef8e0bb462e030f00a +size 294912 diff --git a/deepseek-r1-1.5b-unary4/model_embed_tokens_weight.fp16 b/deepseek-r1-1.5b-unary4/model_embed_tokens_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..41dc9c1ab0695b778c586bb83ebd9fd020f49ed2 --- /dev/null +++ b/deepseek-r1-1.5b-unary4/model_embed_tokens_weight.fp16 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e55610c68685326d482c594ff3bb16141e71a0d219fe729211562ab630953c6e +size 466747392 diff --git a/qwen3-4b-log5-unary/model_layers_0_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_0_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..269cb2476c7f3478f7419923b6c3f65c6b394f55 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2554f18159cef1187bbe2fe022050558e2a8e8375a1b7f35b1e10a39378138ab +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_0_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_0_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..038e93bd4898bcddfa8d29b193cb8a39c52e5be5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac29455ece6f6e8f5659cd8ef957eba5c86fa5915d55dc0e9d7e173732823eaf +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_0_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_0_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..0df5f11dd7b3d429109cc118e0f3f445560c35c9 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b04d509621af722d7a8fc705a15c728edb394b65450cba87ccaf0cfa7e45b2 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_0_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_0_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f0b697457b7e8ec09de9984953e3a26b6aab2d25 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:687f80e55fca949b5c451e07165ffe36d62ef6385c90adf44cde4de1b7c0e470 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_0_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_0_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..36a358d7ae4eb9f00b017b0e6d79ffe9729aac34 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1321cbf3fbb8334b1c60a3877edf92c14f8ebfde787e6e26a60fd44933e57c26 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_0_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_0_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..6f93fa75f6c20e21b42eeccb7d06dfea375b2c04 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bf856ed09cf64d2a50fd2b6f0d2498c8b59fbdb9ecf3bb0ae431053cf7e2d6a +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_0_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_0_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..02c7b33d4710c7095a3a67da0e1a6cd5fd1337d4 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7efc0e04b370e0278615edc65a5238b98add2d3aad780beaf56c3443071bef4c +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_0_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_0_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ed5f7c618875d03a30ee721c50a96828df064df7 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_0_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfab32708f5ccea890bc44ccb4a7097db91a2fd30ad7a5d9012b9fe79027f883 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_10_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_10_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..1012c0ae149695220859f4367b99a4d52aaae16f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4d14b515de6180766f85a4416c653dbf7a027621d0cf1997c6aa49564b4bbbf +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_10_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_10_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..e85a724b838a3918b3ad9de95175c7719addb8a4 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c64822bbfe37a97d2ce01d3808700b2c350a4669e7197ed8ac28fc9ea28aadb5 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_10_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_10_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..1dfd33e3c3681fa6992aa9b41ec87badc2f9fc34 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77164340b96881d131543dbd939e9750ebe7beaac692923dde2b369cad1b09a1 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_10_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_10_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d587caab897c6b5fef977691dc91d963af4a5fe1 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d55a13692d1344289e08fc66f62b49b7dad43902b624508c405fd7f77f8989a +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_10_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_10_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..deb038c3dd425ced306048f956a80d56eb39dd9d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fba70f2055d86b7238f5cd783ca64900da53c51e91116319465aed1a4ae1e1c +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_10_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_10_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..09d59056672eec1fd0058461061ae4bfc65f8bde --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25980a86f6836e55897174db69c7f721c9f1ea41400e7752400c32a14c59e565 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_10_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_10_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d4c96aa36dec1eff8f042a5f6ee53bf05045d615 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1ce803f5edf15fb50eb88df4c832ba87c3d157fbe371546227230b1a28ac460 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_10_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_10_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f780e016af3986051aee8273bfdc52d8d9d6d5ca --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_10_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51f3df5227343258d0af2bb485cbcc30133d934ab1edfa318260a2597731406e +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_11_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_11_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f6da6f6f1ea7eec3e612a74c315e757a8a5fd1f1 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66bbb326a2002af82d837fd9a9590a15784eb28920bfb03231f535659fd181aa +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_11_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_11_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..2e8c0e4099632793a9d55795a1f229198f0f2568 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6992b29a5a305cd3397229e3d8f927020a252bff856671b9f2508a9110c1448 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_11_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_11_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c4f8ad252335f5e016a03aeb0bd099380a84d34d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dc1475c2641d67b4d82f01fcb4574684c1ccdc23b5a9ccafd461a3f6bde4749 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_11_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_11_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..28b1db6ced30b1aa8ade17f81e187c84bc58f3f6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a45301c2614cb91de5d11318b1f0010738dae04e707d4a4156ac2b93346c1240 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_11_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_11_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..e13ed30217b6d4ffb133162d96a8ce92b3ed92ef --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92eea875cbcf13abb36d71da48fc32b8cf4fc90f84894856f4ed4253e11262f4 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_11_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_11_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..5a315c77cb8ae0d5839bbff3e43207a8176d756b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e76257198444ce4c853d982fff54d441d43ba9e8e75602cad9fcd71988edb406 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_11_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_11_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..8d3e51277feb0dd1e4212751e4a526a60ec89031 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7406f269189bde15cc5353126d0f14aeb72a712b000fb869599edbc6f1438b0c +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_11_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_11_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..7d2c45c7600f6ce29dfb99e71ac9bb5fb09e0611 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78fcc9e879c040d700d1b7f26a5c26d60ea9e62b9ee576d4fe67c10c392b0531 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_11_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_11_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0d941e74dc5d2e1a10348b0df22673a6a637108a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_11_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95c162a4ab74a568670d8899d8f071a2f788f437f8ecb2810e7bb3936b8b313 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_12_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_12_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..95dabfd7ac7dd2ba1eff98218a32c4075239bbbb --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa80df0b680cf6aed0ddbb89d9c8c63f6febac41041efeb2ad2077506632faaf +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_12_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_12_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..3796e7a376485fd8a519970548e5e56f0617a1e3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a911ce088f7e59bee68aa55e6908cc46749cbc7396bbfed40d10a5bb1b9930f1 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_12_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_12_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..84fd88a57611b12bdbde649b6d428866e6f237f6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7a670ae074a22ea19e771c5a0117007bdc20b33fd1d5ebac8915c96e043180f +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_12_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_12_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..45f15e50e5be0ab73a2da4e22a22dfb058cc8ff3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65af173193a6a24a2a020cbd4a17fd191415cda4757f64271cc389651902aa8b +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_12_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_12_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..aa5eaa1482397205c1d18b8a48f9467e89b714c5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92064250427f9ae3545e5f6cde3b9def2e59030244de9330b1ce79827d124962 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_12_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_12_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..7df60c2ad618ca2a89ec21aee77aedd3a77f7664 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3372e68e7a451b8370321e363f0c08192ca2493938a7c228733b7b11c12986db +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_12_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_12_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8b978f5f16a3fd711daabc386d39acd48f5f2ba6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c1f7c0b2d8ba7e67dcba589e7a0a4d8b6607a9792bc8020422745c9590ccfff +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_12_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_12_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..bc9a0ce6e52367731597ba6d730c073f9464cfc2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e323ab51c8f7977af7058955b883323589e35977de48c9b235ad0bbce32ff73c +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_12_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_12_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..61fc0d4072afd62f8712c4333fd549d2dc2281a9 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7c25dbb6e1e411d7dde4bcd12de492e382d4cd7dd8482df8163b8429080d60 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_12_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_12_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..5164c2066cdadbffc553302ef4946752779b1405 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_12_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526080272d6c2ebff8efc3caafce586fbb0c0c1b925566af8ecad7729fef3e48 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_13_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_13_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..5c265ab2495ad832ece508765f6450017e7d5361 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e715f1314eb7b2d92e058d169859a4d0db742c70e29153970d5594ec9e03d90b +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_13_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_13_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..130bd2fa6dfa2b80d3b1d3fe651c3f936dce593d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f09738f7737999f126e0704df5aeddf1d565b0c285196ca5252453c1deff0f18 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_13_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_13_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..65f8aa0f090777728a92ac66cba95af83b2ba468 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c809801baa0e4851980e4d4db2a92e7b68c9e752b62e80f96605db8ae1cee3c +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_13_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_13_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c8cf41bb533f6c58dfeaa2c0920eec22f3246598 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42cbb341007e33214c0b3f6b2172b198689bbfb145c8c5412a38ee685946cbc1 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_13_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_13_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ad1b06ccd6adddbe7ef3164ecf71b24dedfec998 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:741bc10bc00fec70372a4aa171613bbbc278dd1e15f7150b53d115302a6afdd3 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_13_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_13_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a68e67e314945e0a0ebbe5dacf01210bfccb291f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31de36541546aff07797b092a4b2177d1543eb2aca0b3802eb12b4f0ea26e146 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_13_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_13_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f92416172104f4a509b3a41fb60543f60f57e89d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1b96455218d4df0dc16754f7f8b7c27b4ad364b8e1f4feadbcacd52ef8b8494 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_13_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_13_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..10e1c669a4c86abadca46ef59a5ace3dba1fb1f3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbea06e4a803a9db517fbd62f9e4dac61d48c13a4e356fc61d451b53c8789a39 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_13_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_13_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9b09a5b824b96f68787aa5a7c630b88011deac6e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9ab15cab51765a2158eb0133673e5a868f784eea26d3456b336d23212752b3 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_13_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_13_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..6f9c69a7d0d822f8db776283f1ba0f99bbf7528b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_13_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17b47e13c185757c11559d6cac4f32da5443946455f52a65b16970fd90b53c8a +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_14_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_14_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ce4f632d4edd2bc62c9ca441cc79b2c34760169c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3194d6275ef7bd50f88653b451b22f99a512b9e40401de8c36c15da28240819 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_14_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_14_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ac71cc0cea8e884e2ada8aed2c376cfd0e31da08 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa219ec8fd54a3735f44f34be9bcd38d54ccb3751b16355ad557c01dcaf4f4a +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_14_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_14_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..4820de4e826f553a9294f3a1138241d5d805355b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e87ad4900ca80f006caea88a9466cc6964eaedb8f608582ce3bb4abc2a7d9f6 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_14_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_14_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0eb88b0b42704609493e110372cf0978d4b92900 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed51b404c79df4e504af5d8360a7d621f1354428a1b67d329be88f1e460b16bb +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_14_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_14_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c2b2b414ca3f1c58497942973fce3a87d3c4920b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5a54b5c350241019fc649cc6024f49e0eb9834b9a9f4d8e4e3e2d9f7b686c86 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_14_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_14_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..733ead33ab2db3300cc17e024d7e6ea4b646fc21 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edb96f6e577a1973ab4932366278fca0846be24b2c52eee86bc448d177eb0844 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_14_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_14_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a611f1a40dbb855d2712b0ffdfefabc316f58968 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84b0ffcc993e507520dc5b701d174d35d0ee91fb5a7a543d42000b9130912e8 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_14_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_14_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..6eb16b0b76b73e8653afa496bd40af19e30d6b48 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_14_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86b5b69f3b2224fcc56f88dd54f19de1872aad505c7e61ab313df099fd613d17 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_15_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_15_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..4da8cb80db993c3f4ba73d897da21cd23a718541 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0634ce8dbb4d184ff0fb3bebb31975f0679f099408cd7a940c6137dbf5302d8 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_15_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_15_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..fbcb242fbdbd5f8b7fd2cb5c4ef7af4375796e7d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dcc98d36f8bfbb6f1dc7ca6454edcf035793940a3d54b0083f0b41bd8d849ae +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_15_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_15_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8c75c1876eef7178aafe7eacb837e1c7a063e125 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b643fc24e406b08b608035f17b5c4662305202d47d8c6faefbd8e0c7d5224f66 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_15_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_15_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..58b0c9fe34a0671135784f601d96ef74b84eddfe --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9cbee029b292e71877252acc85ed0244e80d44e05f22185b6efb0283af463f6 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_15_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_15_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..29749c70b835aeef071093aabcdb01ea4320cb9e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f80435b5bdbe8cb312e02c361a2ce021aaad582e1fb6af86f4f18158d30e441 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_15_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_15_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d1b9cf415e908d7d299cb3eedfd6bc051e7609cc --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca0ebc409271f19cb654c2b6312a9a08bc7046cbd21e7648b1d2249db095b3b9 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_15_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_15_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..4bbbec0e8e4db1cb680e9150a4d0348cf04a94b1 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:279f0026af18677fbd0588a9d91d022ada1b8a73194670f43690845752d59b16 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_15_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_15_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..6931a22df1d8cbcba6968e8073152450caa356b6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a91d78088321d6f6143c064e4366af1903d262c87e57ce0265ebe554ccc2995 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_15_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_15_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8514786eb8a3869f1e7dc21b23303080a1aa391a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fc646b63fcff5be02db74dcf37f7309fe13792a5166ee029ab824b5b329408b +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_15_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_15_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..65446b14a63a008044fe9a90479471dacef04ec5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6107e812208cf7da9428fef1ee23a5571501248db958428655a0dd6775b3d490 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_15_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_15_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d9c180e8225b4907f2fcebf9ebddca0307df3946 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92b36b599c8aa60aa9ed85cf4b590089b62959d468424fee56434e0f1694909b +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_15_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_15_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b6145eace6b0592350a8d2ceadb7208ceb75f71e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_15_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20682ba918d8277daca5665693bba1e5009f4547848e38c261c2ea168bc9c5c6 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_16_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_16_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c768eaf07f461cbc4e13739cf863bb6d3914d2f4 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5de99abb11e3adc7f8192d6729eabb887973aea97ff26c1f4d2e2cdb8e89f469 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_16_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_16_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2b12a8ad924104c214f03b40c7edec7a989b19a3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f1e80b01100f802ba545b038c139016d542e5b6d68bc619416d5c0e1421fdd2 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_16_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_16_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..354398a957217765ef895756d422237eb8667506 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b97a3b4ed0d588b48c1e1638312d93ea9f9cd447079decba48410b3ed3e5311 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_16_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_16_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..7d76862ce1628ef55c75a74c806122ddf6f92d67 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f256dfb2eceed5b4d5a40180f15c6a02c53eac7db03704790019737a0a16ff12 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_16_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_16_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..fd39546b226546588c0f39ff653f8043a3225d56 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b80bf9a676449f61b9e6fde739d63d255c696b7351a06ca4c11d8aba79679e3 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_16_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_16_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f002c40bead001ec42d1b37c337b6a7ffa6a5919 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:882c9635040995a9028f1bf3173b39f4cdfabb1d9508b25e151495b0997f83f8 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_16_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_16_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..42233365e02f5840f937e0dac24aeab6a3b6e96d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88fb62c381191014141c3856f8e0e13eeede63afd286e4696f578ec4a9b2d387 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_16_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_16_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..de6003b2a65cfb27cba9519fa49b5466a59746aa --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ff668fa5137542f9226643409158850d53778cb696fb248a05b6d166ef4082 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_16_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_16_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b9d46b00d65772313da99eb10ba3ae96b36bbda5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_16_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05078efb3fcd351a403f043e052f9fb6a62d22d9906dcfd87164102945a923f1 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_17_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_17_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c6ee950c912f5d3fa355dfbd1f2891ef1800cc66 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e833d65c0571c5b9056d89af01e1cbbf78cab4e71d16e6ecdf745f52cce8973 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_17_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_17_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..fb04b7b20b0af8cc77ca16b621ce6a165d51ebf3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0efdab92914ef6b03353a8348952ce115c33f70d11c9ec58d59681716c65f048 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_17_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_17_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..fcd51ce119d6b7dfcf5545ba9470b2ea45eb88f2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2715be4f79b8933e974fdace4f4a43545c4aedc2401e93b71ee57999060dd087 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_17_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_17_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..727893d225f52a693530be65667c1621445c86f9 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:988b679c3f46782259c70543b605468c5202fcd402baf0147a6b62257a5f3b5c +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_17_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_17_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f372d1e136add083ecdf5b96031383da240a06bc --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ade7448c512c4bffb84f72135060930214810f6e68c301b045107e1f555e9ae +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_17_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_17_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..4fe215a79c52c5efd3070e4a826aafa72d5281a8 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed0c628fc4a7bcaf39c48c4130e0ff8b9831e5cc87abb90f5b5cb02ade5ebc4f +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_17_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_17_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9077ada5caabf891e7af2c9e921dfa4d0e46cebc --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c06c8fbb9da5ed31d0e110ee452273b7b0ad365d752f72a1bf1e7e7fe8353cc0 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_17_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_17_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..56ac267a51a7022c128da95054020e27415653a1 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c9a51583cec369821ab9bd5cf06d537aa5167c864d31d9103dd152810bca59 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_17_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_17_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..3615c1e1d75fff7c90d3f1f16c0bbdd566e26e99 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_17_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba08947ac70d82fe57afc3bb8623fd51e435c030d440096b285dbe8c508f4e4a +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_18_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_18_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..0c06d8c7687c59205326bd3931932a5cf2588785 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b456655e9894138d8ecb10d7a137913771866b6675881fca9776ef4f498bae7d +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_18_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_18_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..6a91fe2b26bdcc5018c6023805a788a061fab629 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c5e5a4069093f890e1a69be2539e50db267688ba000b36cec0706ebf008aad7 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_18_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_18_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..30dcaa2fd6f921775f9510fdcd4cba089a2081a5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:373739fb4a8e4091469dea057c5269b432d7c9c21397ebccdd7ee6fcd661266c +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_18_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_18_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..87051db1df3bd1f8a8fef26a64b94b759875522f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:619763175518f0cb1937723276ab1b31fa3436bbc2be02487939ee4518604ddf +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_18_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_18_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..1db9f24270c96d7a1e72f655deab334776102627 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4bb45a7cec557e21df52dc923e9dd62f41d0514015150daac2fad43421a77d4 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_18_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_18_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..8ad77430240697ca2f4ec4adc13673fa9099eb45 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_18_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:129403a0a9383f182786820d2cb0a6606950540ee4d5f26299ce6082a929a3af +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_19_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_19_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8bb7741672ee7ea8e204877248bbe8d507ab97b3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e923c67927056514ee0a7f0f759a8563ceba221f2e2a279760440e9ec1d9ca60 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_19_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_19_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c57603806a36c657f94381f21726c94cb772a029 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1838c3af0979d08052ffd72c3952e110f29613276b3d64af7cce10bb85f08ca0 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_19_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_19_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..9e793a653df2583550e53dd752543b6c4178f51d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df0623352bb9e5ba1e7b0fd01f8a31eeca2e938cb6d86dcdd4a5bfe2f09611c9 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_19_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_19_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..3139954076f0b6e374c9071f64fff7f9d3007a19 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89f5af47c2a355907b077a99a37f8ddbb437755f7e03102fc651d6be36005f83 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_19_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_19_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3cb4b4999a638260045a4cc1f2d332afdd434c92 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4703f6d3e99e160fa6d9a4c1d81abc12f18dc12ec670316467205f135325aa +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_19_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_19_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c24b64e95d030595a8c6371e896053c82b7b7ade --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:979894c3d196804708ebe71714f5c138b1e9612c0cf0efa968f8ee26367781c9 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_19_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_19_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..3c265e8a6c00783ca00c363c7ade6f7964056195 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c2b37d83bf49ee9a41f29750ece79f6c53f88981c31a40ae7bb387456d7ae4c +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_19_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_19_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2a87c50751cb7240b4cc48de2ececfe3bce7ed6a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe124a4fa70820ac2dba476225a4daafd6322484c353cdd26e78c89360591f29 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_19_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_19_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..33a6be82c9429d8b6a914f5e45303a0b0d7d234e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_19_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2e0db7daa42ae7fb667feee8f99ff14400a04899dabf8df2fafa6c31aa008ef +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_1_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_1_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3f67ad6e9437626beb37e8969fe7973a8c3346db --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:589e41ede01587c2c49e02fd584c2cef67dfc31b4e5f6d3c8e9a78b5b4d2529e +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_1_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_1_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..9683880d7278b7a8ba1698b7f36068a56609f19b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bff39fc0031941e0762cd0fdd948a0f790acbd4a9098eb82cc4a85a9116f2ad +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_1_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_1_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..0b8e0db45b2fd14f2bcea33faded070d58d76455 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1cbab5080ab62fd1652a7d5955a437f21afc2f4e3494de92236fcb62b125e5d +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_1_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_1_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..5c017358a2fa34eee09a0c843309e49fc28dcf81 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:989a8c09e5207378df9e0e0bb3188b2568b99a2785745346084c5a90ab42a352 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_1_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_1_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..53c40434fe4acf22d7c0ca89ddd76b2eb6d86e9b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7e37a61e343f154c091fb9c57adddefd68735b4a711af30bfa8aafa0c940d9a +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_1_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_1_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d0a04769e786ce2d4bbe3658c4a3fc3455a1858d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53c790cdb6695e9812fd57fa22859b4814fbecbef0ccab46f7378a2ae3de049b +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_1_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_1_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..cddd551484c2245a08e809ab83456bf5e5450479 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c7a4036b92f70ec87787c30deb1f5bae413307e5f506dc04ca18aa1cbaee49d +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_1_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_1_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..9a831c3de8c3dfa662a7c8163f989be2c28d31bf --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_1_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1823c9abee6adeb46a90c7d8f03437d4f51ee47549b4b336ea7093484e45ed50 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_20_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_20_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..83812e85f11340d2612d48a2cb392a0e4878e9c6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d171ac693d3cd678a2a68e05d3ee6fce75d2d64f5be9b040d7e2e9296b01181 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_20_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_20_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..7f4b893574c3f2f811e19158b6e2ef2a6ad3206f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0d861cec390731c20157a3397032b8098a292c45f9b8fed8f092c5e08b1b31 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_20_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_20_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f3bb73da9eb5e6ff022764d4f138613b188cfb88 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcda2358dcb7811c75bcc3a138197c25e82c474c28ac078d2e16a5edd9c14621 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_20_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_20_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..1b9652421f78951766db92b87de7bea951157461 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d4bb2afcb2e0c7ed2d6d47480b3d15a5c0779747a10a7700dfa6f746d016931 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_20_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_20_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c8dd1f8b406dabf5e25203e5b6412f24b2ff9bde --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:067ec6855550cc5b2b58692babf4dd3838ce04523c60c7f7d13ebf5d6333c164 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_20_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_20_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..aee7c82e31cd1199fe1016aa5d20919d44052884 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6c955e760acdca99ff492123e3bd91a2b6de38c726d40ddcfccd1c14914a1c9 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_20_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_20_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..5a117f93bf8344d26c3b9eb8f4ae82bc0639d97e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cf56169562bcd5a48fc686d65f71a071b6dbfbe3f974acb32ab62e5ab20146a +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_20_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_20_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..74c63eddf2375d71db84c6097d713c39add8d7c9 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea0e6a9d72f25762e356444fe6aff1430a7cc0472c582936627749cb2e669d8 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_20_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_20_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d225e49b413084d2916be846769fa8e8685d59a3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_20_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bdc60d35b674f8ecefc1f7ddcb12f8811176356d80c006f045bb8de6e48d25f +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_21_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_21_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..1edb2371128dbbd406afeb90e637b5d7d78ed76d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54812d9494767a3ca9e96f315bd9edc3a534127c711d0a9c8afc9885bf616bb +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_21_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_21_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..11b348282f98562f129eeac84f6ece7dde93be97 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12372a2885edac32c7423bf9d747af08e5a2bf72cfa24ca47566d374c27a1576 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_21_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_21_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..5b7f17298561dd363aaefbff56a057b694b96d2d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41bdf06ffe91985321b0e80b3279b735d6aa47e5e4c8b8972e3d170be7f85120 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_21_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_21_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..40d7b06c8a99edc0af177e71b98efb251de143e7 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d3bb53647bfcc7fc118657b11dc5406f462faa814c71fbbe76e1490644dbea9 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_21_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_21_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..47314cf8dd8a297ee41e57de6c462a04335dbb3e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d6809ae588393036438acdf67afc1b5649d4398e8398157742cd3464fb25eb7 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_21_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_21_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..1f337c0efee94c1a455277e792b85a2ad1c93b58 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:525a64c706e9bd76e3c861bdaa79498db35a5e7e78234c55832f6c1d68bdbdcb +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_21_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_21_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..62e6fec787ad2da258b23a835e9499bb7d995842 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:390f36910baf1e23f044fcad25bd18f2d538b8cb0c4aa0827824ec618aeeae8d +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_21_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_21_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..fbfb17dae124fdf4b3a8d0b1a874e27587a52d73 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8073e43738530b8cb81fa29b65cc1f69102b2a7fd6c021e2461297204a6b54c2 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_21_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_21_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..9f9aaeb322c8f93406a291d0a53b5b15c75744cf --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_21_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f59a94504664e1f1fa20d3ce95cfc88a09d1f0c1c5f4c5468e2813399ab2b70 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_22_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_22_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..5de80011dee67b16e3fb30e424bdc3216919e634 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e0ce0d7ca9a2c2cb378a7a5b3a1a59c445a6860e6a5eef62034b4b68eed516c +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_22_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_22_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..df93156ae98518af92abf47489878fb4ac5a2192 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9862e4002298697a0c30b495e99977cb9e45c127835f9e242b790e6814d018a +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_22_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_22_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f20c49a4dca6f15989157ae3031f293d0b9a67e1 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c47543abd51ca8be93ab21b2f7690bc99e524f3d32815cd216f15023e81ce22e +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_22_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_22_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..5cec4af4d26428375c10266861f60e088673cde7 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd8cbfaaf694e1dba975537f0c1f4a51acdad54a469d01237bd208d4e331834 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_22_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_22_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..de4cc58ab746a2c81d89c6a3839045eca852eb2f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31559e7101ac3f59b3e451c8123a0850f649f815f0dca4fd27922e73c3f0eca5 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_22_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_22_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..fc728dd4a2d31b2c33e5455f8ce2372b675f7bae --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc1614e4b194bf05e450596664a29ec9e8f56e8e72c7590b899f1ef56501679b +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_22_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_22_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..7f916371ad76e36102de363b975794ff8e28e05e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e00a1d94287019c45daa574f8df121d574e7aaf06e75bfb27d0d717b0e6764e +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_22_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_22_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0e33ab4b5ca2b0065a9240ea23ea28d99a393e85 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:665486123554f880dddb9468a9c7a0c29e6cdabdb8c098d75cefdfddc79252b0 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_22_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_22_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c9b7fa30151daa773d8a0dbbe75031b98f396854 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_22_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9650a1e242293c3080d560ee0183d95777936972d8d5388196f2510c81d2e4f +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_23_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_23_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a9be645658861ef3e9438dbf3b938aac3d472748 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78cf2e7f4e0f899c5f06acaf032f26dbb457a867734d3968427c2c0a5aab1259 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_23_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_23_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..79882119b283d9f7b97334282d690e6c2fb7ad59 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f24fd9db33c2d6123261909db8b9614ec46ef34f29b37813c716cf662f5def2 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_23_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_23_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ccb3b4c642c14a10c23cb7adb219ab8d388f169c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3169bfe04884fec37f30d9bfefd3b521d3aa726204de070831da5167bd52f31d +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_23_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_23_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b5c03e70ab4a53e7cb8585aa0d6dfdd9098fe3d1 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:315791a13ea0ccde17203966e9d60fd91bbc80d8375c19288f83421249d1b1af +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_23_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_23_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..078e2e0930b34b36a72165c6971588368d74139f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d20503672ea40c520cc4f8684135cf8dc6fa868036578730ae7b9ce4b35cf130 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_23_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_23_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..9417ed12f4f2c944821f256cca41d8832def7dc6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa1268ad7f268ce90d0844f76683336fc1c36e7cd22383b3595bfa08356de116 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_23_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_23_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b035f267e062659136291e05e4bc5b86b83a93d6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_23_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:663659a48137f2b96911849c3889ebf53c838eea1ece25eb583ab6c4f989f2b6 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_24_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_24_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f0973a5293c5c8c35df7a951e7ac741aca1c1349 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f24643ffb1649f623eda188f50d3dbf1f526a0cc283a46c5ee31937b0cd41b4 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_24_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_24_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f2e9e9b4614eb821e513bef3b5dc9f28cfb4027f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d7eee673a2e359aa434585e9b12be3500b077190bc19f9fe24ef7cf4c003677 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_24_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_24_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..7dc3ca75d5f8ea824f7cf24788413619a09e22f0 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16da6268ca5923ffe4e20dcfe24b119bbcfef54a6415612e8222e74232255c1d +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_24_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_24_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..651b1fd6d207e75330c2c6ac69d1d33b6c394056 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31df0c8785ac62394d43bac9bafcaecce345e53ba0eee23502aa94d1a8a40ff4 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_24_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_24_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..75a3af2bd2631c1f95c7dc767399de17389eb66d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ea3e637faf43a21509f6ea2b24179dc07c43c6e2c0a51e168fdd5748ff2d0a9 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_24_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_24_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..10755819fd9f88e48eaa0dafe04f330bf06d3d0c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:515697dcb23e037bd876635755373a15a68e8133a91dc98fcaef80e23f811a83 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_24_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_24_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..06190beb293637bf388f49b1e39fb278b1a8de41 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2d67b39b75ee935c0bfd97333db65c673ef84dae1565c4b813df9e4beefa6c2 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_24_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_24_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d22edd390525720902315cabbfdecfee80093502 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c79e540f2605a86c50cdfd8c3792abcdf9d89b765ce272cd12e048037af610df +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_24_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_24_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c65c464587f8504d8c2c4336df9af37b2956723c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_24_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830f437a0622173ce3bb2b7999c386ccffc87993d26608984a08498090ff5e14 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_25_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_25_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..37c7af5fd1588ece6be40aa78b5758848f6d3a4a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b14c9ca72e03c15804832cc3316445ed513cc3c397ed96bc0e44615d5b389b4 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_25_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_25_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..aa7b5d0f4acb492470d12e61cf9462323445b74d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c992b8874ca61a58fe4f20c889bff0e26c1a0741cf6d30c4ae1c029af1f76f14 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_25_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_25_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..ac12b0441f09295e496d3b7f617c08dae195c6d5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66522d6932be32d15be4e5b150184ec9e15e8e355d23167ef184021a5bba87d9 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_25_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_25_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0b2749654a7b6e68b3c5ceaf62a22a437fee961b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf639f5d45bf4d7bc603324688f7f7c5ec39edb25bd08b6c9daf137d9aa3e410 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_25_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_25_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..deece1dc8d1d2b1f885b1f4a94ed1458c8b9cb24 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4d6cadaa0692281b14456fe9dd63f980eef9a8576c0e0e167d9e73b91819033 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_25_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_25_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..37a8d3ce2500b9f38e6e8bedbf555b62c278a363 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d9ee5ad2c4e3aa2e1f52c4134ef026fbe73e9f835e09b688a585c8a5a1991ae +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_25_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_25_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ea157e31f0c7561e50cff2b65889a40fe805428b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_25_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f9ef4b57a2f1a87bf41817489f057660bd95a6cb6ff76a49abedae5ffc76111 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_26_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_26_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..695aa79a718ffbe187f75cb1518593a10fb3b3a5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:786acec89f677e26934b97a0b459502163256b5262783cfe4d1df7887d205e03 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_26_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_26_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f3d616da3aadb5b913ebfd5718c3c0d101cb5d02 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a504d4186d62af43335cb420111cf7f7d667b2f3f195bb1dfc1e6253417e3890 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_26_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_26_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b57709bc60c237b1ed28cc749acd55164981c575 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31ed570b04c7bc81ffc1c0d9a884242a4875bbbfe789f8a20a1a14ae345b3a5c +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_26_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_26_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..0409bd00633bab2f10ee42a670b0aaa928d1d462 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d935082f2e41a6e73e683738d5605eff4ab539a66e2f32b35e5246a65a134ea +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_26_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_26_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..af286a4b8edce1b3733e5c66ab0c886e7cee1c7b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be878ee8554f66403eef4cfe28cfae3e4670a525d857bbcfd025f00c23d47899 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_26_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_26_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2f264adcff2c238e1964b44dff0793b963a032a8 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:706a2c2c86304e920fc02026cda6b12ff60854f00bf633b22e41dd6a56fb7e94 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_26_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_26_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..8213fccb4f230a8e8be76b52cf8b70c67f9be8d2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8e3a64062df61c7c8a313ec36e32d36ba5b8971de09f6c676305bde6ecfbfd0 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_26_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_26_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2f1941f5fe72924d8cdde0cc814da3eaeaf198e3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_26_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b648135fb406dfbd4e8235c558a70f808b66f94d7be02b70efdcd2aea86a5ed9 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_27_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_27_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..5a3fdf93f2f0721185534bdc7088ec37cd94895b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c88a81f2f4902848b403a894986e7cc95db5a0b6dd62a1f46442c48614ddb5fa +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_27_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_27_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..89bd288ab7d3125057ae9e42265416e1001f89be --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4c55a8278095071d55349ae521ce955aca37f48be5b9e7e47ea371a8ef31903 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_27_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_27_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d2aa884db3af4baed1cc6adc843e2c8188ce5f94 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:372ac41ef8245b6204e6366b5616baae3bc50ac77a596c1aa5480bdc9ef6b17d +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_27_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_27_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..8e4dafb1349ad592231d59f342711af2eb717295 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:060550a592e6468274ccb858dfc3bec980ead17cc737af9f493de995347e38df +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_27_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_27_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..91308d3fbbc3d5952d49dc065a700e9f57d03d85 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20bc29338a183f75dd118751ba6fe85355433e366e3833a53020836cdd0a5ef3 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_27_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_27_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..e3407f7a850c5ea586dc748bcee7c81be3427894 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d68e3d15322a6d65fa580b54fcf597d2143f34c37c823dae7cbe839b4595438 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_27_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_27_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a9f974278983a9195f0f124844c9c9cc301a0b5e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71dd1e6d6675f8c3e3cb48ec0d1c8d73598421379e12cdef0f3216ab1748a7e0 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_27_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_27_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..acd95b233d312228369768255691d0bc5aa1764d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d4a987203267f607a231b9eaa9ee4ddb0890754408d745deebe3c5b0d0ff1cc +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_27_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_27_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..18c80574517f2d7786a633703a7d2c52056ccd2f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:648dc6393349bff2776d35f414eea6857d667991e5b1c1fef4d83308c60539e7 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_27_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_27_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..80e3e7216ba430070bbae456b0d0ba7cb0805405 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0980a3450a28685e684c187c08b576c0ab8000b34465443b16cb2977f284904 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_27_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_27_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..76a11f184c7c2305d7dd1319867325d12a14db37 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e7447f8f65564f0d5b112e7d2ce5581d928f5f121ffb4445c7fe60e0056bf2 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_27_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_27_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a7c32ee36637e5f1e4ae87b208952364de8b76ae --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74fc43272a7efb1517c68af00f67651283e0a2ff078fa6f8f7f5353341a7b206 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_27_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_27_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..aa0bd2db0d3cdae4a9a34cde764991f42de67203 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bd2fd83b17ee154e98d9768fd4e80aef7975692ca3fde592e26448be0d4d617 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_27_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_27_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c10e9ee5733e2e838625575548dc574ea7ec883b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_27_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dffcb89614564073e42a8d2793c2a8e06007d21f14570e8c14ab7239bed7313 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_28_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_28_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..68a806a64a40a8121c051452d97ead40c01fcd4c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f5390bebd3269b5c257b711fa86fc265f9ba730fd16cd186bef0517a5dc667 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_28_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_28_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..cbfdddebe20f451510987a1124ef6199dea66dad --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc6777962fd7fbb34db9dd9f105c49f18af55197dc46294c4911716d6e9d6215 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_28_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_28_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..820a38c6748dae76b97dfd60d06b10ee08e49593 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81893bf1697453898cbc6ac76fe83757a65744214bad05b9151cc7b3269a1eca +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_28_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_28_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..fe3d153857fbefd16c286c155d5edc7867d1a22f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a6aade11f2099b087950297ea339c8c02e1e5b9967b1b2d55144832da24369 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_28_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_28_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..e2ee9b08343cf498592afafc4d25c4c73636d7ce --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6e028235863d1698ba0e1d210fd24694500ab208fb4558e1822b2a8e45698b3 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_28_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_28_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..2b27401d196a6b789284f28b65f81795141aa2e2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0831f6a74bf8899c8648bcfc4a6f2df158f5088e70ae647a806aab4baa81bdc2 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_28_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_28_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..dbfe1f3c253c87cb941682a27fc706c92480fdb9 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ca0d71126590a15a7edeee3e034b7d27a2047de7ce41dda56dd4ff4ca524443 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_28_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_28_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d4e09dc7315e75e24d88652859436cad8bcc08ba --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_28_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a8f71b61212ecdaaa10fc2600a463da976ba3a7a2636b6ec3022577ca2158f7 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_29_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_29_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..566245eee872df94fb9d9a5929e818964f34a228 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98e7854834a3226570673a325d57d6b88dffbb3deb9c746cd75e3ba115d5a331 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_29_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_29_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a8a3b68fa1ff8d6a5443f48927ecb6f7cb11148f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d3d1f123726d0ed8e3c15650e8b52af859ffc52c44bd10727cd574835badefa +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_29_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_29_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..94ff127144e9bb79942e86691b2b6540dc79128d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16df2012a399408118175bcccf9e4a16179fe57142bbc8b8a8d43c2cdacced5 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_29_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_29_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..6c0b9e5c4fdb99afc3e50a5edcd7015cfe5679ab --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7f4247f497d94fbf09ad3cde7952bd6d976a251e20e13479b3a4cae535fbc98 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_29_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_29_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..fd643f717e6f69d69f43e2d3209563f2a2d1a6b4 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12610e13dc86241eff2f757966f715cd091ce44a78510be236b6b8f77cd059b +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_29_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_29_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f28e027ce65b40ecf69ea558800780a101c4aba3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ef1f85f8ef8c9bf798b8777894cb22b5dad5e71d74f2adef36f76422c0f9191 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_29_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_29_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..75bc368a206a099acbdc6989e2881c0521265885 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6935944e23084695e8bb973071bcb21e648c9adf967e2a63d63da1100f3f5c83 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_29_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_29_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..fa1a0ad99dfa5bce5fb9e136b51355af40415671 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_29_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34bacdbf0e5c74c8584f05abb9567ce9147cbf9088fd7452033b9429094aae23 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_2_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_2_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0b172da6546b272021c84c3065bc0d096167915d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b0833531cb0bd648a3060c993338c629b17be1abde5baa88693faa977689e87 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_2_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_2_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..faee9dc7e55078a4a6be27102de69e15d6da3ff9 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac734fad77c8e2d98e18beeb745648e0c1a4c2cc25a1ccb394cc99041025a15f +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_2_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_2_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c22301d2e8f785002834efde25b9395732c51b76 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308a54d494d8ca3ee241b6b40f3301e1cabf79b9b64c24bf4e5deadcd6670a6a +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_2_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_2_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..169938f282aa93475dcf33e15d2a27f9510ea43c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1023bf75feda17693043bb9801e140cc82f140a31a78ce98d7cc30aa2e16369c +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_2_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_2_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..276f3437c403b2160a024ab714f4b7c3b745b507 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:258a16ad5b204199a4d6c299452121d79bcb3d4415c81c44000eb52c5ada818b +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_2_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_2_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..b976a36d6123c72f753b845bd75abf9ea83be0df --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38dde940c599779c53fff6a5ee9267e75cdf98b5d97889a193568f262fe722e7 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_2_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_2_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..fc2060d683cbc457c425299ef7435156463d826e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4305386ea6638aeb2d92176abc236aa5e9356e16882de893346dcc0a1c3f225 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_2_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_2_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..468475d4b14e4a4914fdb5f38948ce84fbc59ca0 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bfae7dcad1121ac38df28cbc9a49d60956ac23e9078cfee0d19cfe08b247ec4 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_2_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_2_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d370bcd2316bc775313979a5f189a8b768ff656e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77660c2da43a7a95c96dbbbad5eec1b7d8908da6ae69ae04483c9de591f659cd +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_2_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_2_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..866f7f484ae28eb9f30c21d2f65facfc501df1ba --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04ae2c7c310c4fffce551fe7c7070956f3dac715f87b4ddfa1d2fa9e6be51243 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_2_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_2_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c9124c14d5371305e62d6c45323eaae95f0e2bcd --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_2_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99ca6fae784312e20683def021d9855a22e363e1ed1cfb048a9ec96deed1b41d +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_30_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_30_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..10b5ed847f920fcf4c0be81aa01d2a95a98e20be --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b470d018d63eb312395266777b46b8b3423c929246ea3c0f8f9c031cf02c658b +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_30_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_30_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..df8e1cd50d38739e6430902bb9841a8330a045d4 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:756db6e79b9f2099bad623cf45fbc42446ca8e9ab517e6e5b89570f49b69a10a +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_30_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_30_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3d7dd1aa7663b78158932371a8856303cbd41f30 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e2d6eb60687b5b4b12902522f6cfea76b3eddeb10096fa079923643be3cc6b +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_30_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_30_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3300b381ff3fcc890ebea26d8ec42eecfaa20286 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76ece1e2e6e2a225fd0cdbfbf7e8cfba7f6e367a12e0ae1b45d0b9f1a654af98 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_30_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_30_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..0f3ae547ff4b3064aefd5350216f77736912c425 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dc9409f208dade7f3b32669b6b928a94bd0beebbaac3b6585fb04225d2cfc68 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_30_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_30_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a0aaa28a1f04045f59321d7f4ce43877bc0aecb6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adb169de7035330cd157e8c7f9ca14ec1e4cc125cf38e570df7408b663d9a5b0 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_30_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_30_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..19b53c67b348044d902bc5408717571b38e534a8 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0c7632ac00f3ac69e8d227e104f7c248572b162dfd9b54c598a01bd617280c8 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_30_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_30_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b1bd853ded2f12679fc6b59adca80f544b1d7339 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_30_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5420f773b56dc060076cba90c4b3e1b538b77581e7bf86e5ee8e847fce1293f6 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_31_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_31_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..9e2315fbaa168a0ea04af6a7d480bb2d8e159e59 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c65e80ad5289b4517b04619df3d963199f652192b49609616e9b3291df7abe07 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_31_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_31_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..cf748a925b91c3ea6eaac21ff1e6935424724894 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dabc472a3f2fc8d81ff5968cc5b52f24eceb6a8ce8dc5a064a11b1208f9b68a1 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_31_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_31_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f3a7bf5d670495c26dffe4d0ee9d5ce581e4b033 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c72d11572f780e5c2f485dc99f827f47fa145b1264044328d920a1bba1d8c25 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_31_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_31_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2da590723ce8c9adde99b0d58a69264e3fd1c33a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ba763bbd7c6a870ef7bc5b5500abef0ffc911ef123874655efdc45192a455bd +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_31_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_31_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..cc78020ba89d88ac6bab95126242559d55df023a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6279e1818d831fd0d6ff6887f10b9d5f59bd5caf808aeb6cee187ba24dd3cb47 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_31_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_31_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a507ec8bfb546052880b317ebe4db15e07674a6e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6023dc3481d4dbbfca9c26b1ff9d0371e6f94deaaac034925c46d66ccec137c6 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_31_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_31_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..edbd2f196498c4ffae6b9562527d72a38ec86945 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3214269e4137c12f381d386456483c4449cf244e7000b47c1a6393c2b0b8d22 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_31_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_31_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..317e0b78be68602ddd798592d0586c3e1b38307e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:169544209699262ccc6827994ed4b69cd4681d3a453bae709d73ae76e839cf0d +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_31_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_31_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..b3c9cb778eac2fbd1f2ac9f67ab227f7dc23d7de --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b75a22a8739828b64b7eeeea9f83384a96a0f9b80bc93d8ed95d6237fecf485 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_31_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_31_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2ba272ac050d7afd32ec3db5c53a7822a894c8f2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_31_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef78fb68c907d3735359b1384ab9337f423bcf345904c1bc37a1f95c097df223 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_32_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_32_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..4ced4d49cc98e445cd0c5529cec8615f2f9bed1b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d22c885b44b1accab26e23e77281bf3c474e93741f9d1dedac47f29d0a419f +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_32_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_32_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a911f46652004cfa1e46cafd9b5bd6629206b3cc --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb664b7ef24653ec6cda17d490aa21a9679644780f043f41014de04e630d0fe +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_32_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_32_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..928ea8db4acbc2fbdc08fd1b737512e563c7c5ae --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e9c99e302bafc24de6a3263487d09123c852ca23745c8f40c27b82882b5a2ef +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_32_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_32_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..159dfed0adc8545297f2352e6105750fc06ee423 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed1f7d405939a3c7917665d6a0369e85b63fa3edab1c331cf6e615fcd15375b1 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_32_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_32_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..670359dd3f5dafecbfc0dffc0eb20affcfc848f5 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80b753472b124bf80d29ceeab637a3309bb73c5f54dfff450e402eabde497d1d +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_32_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_32_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ec7715bbd82e149357b4249692d52683b41f7aea --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a205581b18289ef29a2fe94274195f6bf0b1ecd9b9b93358af8db03b11c556 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_32_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_32_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..8d23421c09450b3f47208ed21335a2ef3cad6c2c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_32_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b668f41005a2c5d2aa53279cac2a343780bf22b52f31687682bf28aec6089f6c +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_33_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_33_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..0d384666fa57c6a8ffe6b6b1c33579ebef07b54d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb20085f24adefb58cf8133140c57488e3103d8484c09b830e6cdc05c12ee0ef +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_33_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_33_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..ea1b2453d4c85cdd131e7aa261dee8719b09c3ea --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c49293b340e36c1f3b7e1b4f8bca151732b5517a64507a0a88199b280af6f9f +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_33_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_33_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..7faf3067ef2dea3b6dc0cc4a78eef85b7d845f59 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d36c18a9ab7eb8eb721727b15c59fcae39338eb0d08c6d0121e637b0f4d157f9 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_33_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_33_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..5e9cf72289e8d6d07032f61c2af24b0fd213ca72 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd673cfcad7939c07267ea1efda1697f0dc78b1fc6972bd1d7f58f030fe9388 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_33_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_33_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..bba186efe49d4e93462f31fffa9ed55bb9a435a6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38006906b52f10c1d473faf4ecbc2413d9fc10821a240947a83f7d0f0a5b5720 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_33_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_33_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..b89bf2dce19c59b4c5b26c2047070a3f0faf1e56 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b57e502b4de0ee7c37935f14702dee51a315e898dbfa614d7d63aeb32b44ec56 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_33_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_33_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..23f4cef7e42ae3e04cf7fb8b645852ce4518501c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56aab2566b799d38e7d46028d157faebb31b3662d00e741c7517e3726ef3b48a +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_33_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_33_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..1d228b3694d5f701b261a83645292106c57a1e9a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e3f424c110690d83f2d272dd6300b39f9ace18e1231dfde1bd4c8fd7df7728 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_33_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_33_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..821c4b0775e9f78ce2cc876a58f9c3e407283940 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85948bcb99210e250163aa29f6ae6bff383172cb1dcabd1d58cc6eb9f2315635 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_33_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_33_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c3bc121eb1597f21e9b917885c08d07ba3b36069 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_33_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7343ca4175c2cba0efc05bbd56269ac4be77866d7fff4b542964e0586490f779 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_34_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_34_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..4f151bd91ef2f44469ab876e3847a05b4b3b644a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcc26b31ad4f4fb5bade895b58946f4e73b9e01e99ac90cdd9b3c7fef94d18ef +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_34_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_34_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..df4a8dc5d72934cce308f1c5b2421dbf522ff0a1 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517c5bab37c83c1ab5f9201f55f3c79b74bf9415946e8281428e722beb2b89d5 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_34_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_34_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8736e2fb160186b8af5f439b3636538483ef9417 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12d6623f6694d5275ee3c2ce59315beee6640e9652c9f74d552dded9f6e1d57 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_34_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_34_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..ef3ab52d9b1fbab10f0a822fcd2b4e866d010da8 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c9cdce9b6cb19d9767bf7055018cde55c39de82ec563d8003bdfbd2204a172 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_34_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_34_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d372d5b39048669a170aa9fe7bb31c95238438cd --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f69f223a70f0bc31700b9c07cfb0141c3bbc0aa349d1713cfaa43dd73f3cc97 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_34_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_34_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d6bc5b16ebfbc9c72992740dcf28d4010b6f7281 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11161f0da12250f93265eb3cee79cdf804a3d8768f088725280e3d70b9adbf58 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_34_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_34_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..8ff4c687086329911fb46fd8954e434551c9ca9e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e983e2a6932100f661593e9d5505d8ed328d2f4b336f9fb9226bc1fce080b5 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_34_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_34_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..95e8b3cd93eb330444a5847be4a8372ccfd975b2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b68e86af807a58d2c3f1ec4b4f0a3648dd4a6e9c41ef70c4137bd9ccd2c2c8d4 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_34_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_34_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..64a68bc7240f6346055d5bf9a843c800ad074c32 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_34_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c6af880024c0a554e29dde6e2d692ae2527d69f567178cbe27d53adb6ae4869 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_35_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_35_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..6ac8865902716a84c18cfcc49d4399f719e8d56c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d4fc5785a3e41241ea6b87fea9b9662aac0e4574694c7c9159c290de7c4b56f +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_35_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_35_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c37100fda703a645f3e0e07cddef0c73ba880470 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ad400e04378685192df05dc2396dc05ac97390296278cbc6ee4b83b82701fd5 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_35_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_35_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3d816516175675b283e7a04d074d4976d71da4d9 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa12960390869dc0cfe76a8c10dff17bb7c5af0fa62a086733dee14481034084 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_35_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_35_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0ee1fd1c11543d60292f85d08d3f585cb46149af --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01649ce33ee4e815bb247b5a4c09416b6cbf0f613b80394e874fd6e690208413 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_35_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_35_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..de1b18974120cd948d80118b13b599e69bae3378 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ed079fc03ed3b29ba80d7870686381441c09f92bd9c273a505a79793ef335e3 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_35_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_35_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..487289c12a4bef2b8b0a953c9b73e2e4f2d8e55d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b92ac28b434971eb197cbd945b6baef4b63dce776b9828a8c8014dff064a5446 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_35_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_35_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..655e0d6097afd20d657a1efe0d6f232b02ab76d4 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90beced3c5d28b047ed63fd95aebd9a84f97413899e9a020f9a50157b88c9cb2 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_35_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_35_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..6c8265c823fd58c7f518d02073381f54722ab362 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:644247d8d837989b4b4a155a5e10d2a6eb03bda111e0a66e27dce0005f82c04a +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_35_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_35_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..cb5f4b320a868ee6a6090a9e9437c8f99e4bc8f4 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_35_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:546ac4899bae84850c7511df88293bad6c1067bb50fb7edd50658662d9ff4a63 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_3_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_3_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..06b97f4879689ec7614213d7c2be08faaea7e2f6 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca3be10aa4dc5c029c8da05eff573c79f7de1d93c968729e894cb612b614617 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_3_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_3_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..16c9d842540afd4c645d6831ec5bd862d70feb69 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b5b99012ba413bb293bba3ec994bccffe6eb2a3727ada97d6799d6a32768d91 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_3_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_3_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c922c4ea7ac2dbf18e4731b5aaa54303867e1e86 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dcd7b7c7fa79ef01629930c0da52009b7d096cb6ee91006ce240c2bf2554687 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_3_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_3_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f1214154b76f7447b76c645d1591596918246cd4 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6606728a2eeaf372e835cb997a313a47b763392260d240119169ab571c9c137 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_3_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_3_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..6157b6717202e13a3ab821ed9e6c334c61890375 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb46403bb0a475da26b356b3085952412ee2272375cf4017d2ae8aa3d50b403 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_3_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_3_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..9cefecb04a31672784b82878e5c366657a57b139 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aab107dc7022ba7bac125043b90b246f0d6cf8c596b9ed2a49e913145bb289d +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_3_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_3_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3bd6f7ae4e10c250ce8ea4ea569c2dc98521fb7a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0784ae98c60f4369b8d8365cec311f2bdfdb921787d91ddff00f037f12700d62 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_3_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_3_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c6755164d49d6bba13fe4a825eb476d1b3f04cea --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5edd9b179d49208d47485e525f735a27e283464750be91e07fe0bb83766e42c8 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_3_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_3_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..596077ddcd558fa04cbfef1ada0c13806538467d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_3_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4861b263a0f61491e10da90b2c26368d5424bfece7ad7a7d3686351b9625fbe +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_4_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_4_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2d6771f71b4a72e56f4eee9efdc3aa863bbad2f0 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d5f28f63640eecae12d8d2891bf58386cac4bb0d5c266e580b35ae571fdc546 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_4_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_4_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3cb4c623bd27a76fe894dccfdf287975d26dfd88 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dbebb09d07a6549a2ed8416fb59c2b77ffe1f78c6af07cea663f648d0ed88ca +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_4_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_4_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..97976d80fbdaa0d55bbdbdd7576ac0491f23678c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de04ecbe48086fed982e1b3b7676bdbeeae8a96a2901e8aca4a5002dcec8025b +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_4_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_4_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..48b357a1073428a371ff895bf1501c4ca2bfd29f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d024dafd6c1d80d86ed57fc6faa44f8ebb4d6d820d6157dfc95aa2a28ae01ea +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_4_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_4_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ed0d6d44dd51c9e78f0475a231fbf755c1efe5a4 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1c614221d12d9d659827be725c1897924a0fbfb7b7bdf189c1b806bfbb314b +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_4_self_attn_k_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_4_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c09ed1c6b9ccfe58e6571c48021f9ed8d626bb2a --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83109eb8d6f2b9a86419923c23ab5b342f793a95f494fc6b71ac9e57d98f4c20 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_4_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_4_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..166b1aefebe4094fa3c6049339139d8dabea8f20 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d24eb0d8acd30205dc5dfd63fb6a3d40a54e5eab5ab74c2ebae84fea36f0d00f +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_4_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_4_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..69954bdea67bee0cdbfb0e3a837373525248e594 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2522758c13c07cf0194ed49ad6e3534f9e8e57f3d35403db19dc8470735eeca0 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_4_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_4_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..45c0687fc9cc3723d2c97b5162472ed4a5039586 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c0f070ccebd2c7397e747b9b6eeddd904562fd78df53cbf6746d419639e38da +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_4_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_4_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..423d3c3b3d3ad06d12cb044f0728fda791930ad1 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c85397215f585264a4e1d3bdb6bcc2a8b057046e049536088665cfb30bf2b1e0 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_4_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_4_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..5571cdfae08155c0c5f9fd1f92b5abbe4e8f9018 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_4_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a45f44ef7a665904431d9175a737a7c7a06093f2020bc8bd7bfeabaa9997c2c +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_5_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_5_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..7da9bb7b02c7271542105aefeb44d265c1de62f2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10773de6af8cb34442bce1cd1f92e21ff0955b8f18ae4317aa1b20def7da04cb +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_5_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_5_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..4b1cb5fed319aa45d6a2088a6cfd03679bda4c77 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa1a15df0eabd60fb3b01947a9aebd9cf61a10a4b66f3f1512dbfb00ea9c921c +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_5_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_5_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..de53987579398b28b545777ad98901d0ffba3043 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea4f74dc560e6a9f9e96913d8734a0260f03a3dd1f11b642474bc39c83aa82b +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_5_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_5_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..317242b8259682a6d13494091647bea60309786e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2bcd3d38b478e55e2a209036962756adff4299a4f91aef03bf75b7b35ba80fe +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_5_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_5_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..c3dcbb9772f999f4d823c2a4de9d48efaebff91d --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9221f95a3761f76eed631d3c638eda11edb980014f34b68f4dea76650794071f +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_5_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_5_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..ef7adbfd6eb7493dee5e26f53fd137639261ebc3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf62c708d0898fa9c088ed62739e2a81f1a707b84af52b9846850e7852858df2 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_5_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_5_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..0e2c4acc77cae90be02e947ceb8d5cc6657bd0b2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2a40eb60a87f7a3df7d69b02376c58b24030ad4999d08b62b73e6e3978f1bf3 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_5_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_5_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..7025825b3599fd3eb37521006a421c17101263d3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dbb3ad937881784b3f9b7f2457a7bd9306571f082641a5f10e0e9daf72d6dfe +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_5_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_5_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8f184a7eee73578144c5e738e4c3883f31d37517 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaf918be06f7e1389b30a9b0d3fe37f1f90c1c289888d9106f824452bf85f8c9 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_5_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_5_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0d35da8a7cf8ea9b9df402d9b0bbe5415e55a3c9 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_5_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6036c5b18d3626b2c9835d230cde01b5a8f54d6a02ae78d1e6c6dbc77ba9a686 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_6_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_6_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..1976700e81ee2bbede66a49aceeb661df5cb2382 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fca70c1c0c9fef71c695f285264357bace61c70b8487cde5e5816d92f3da18b +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_6_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_6_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f17c7ad1bfd19f8ad08eb49b76b31521f6664001 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b75955bf7cfcbd439d5b7a8d5f35e503a4a9a04637cb87b4489935295feef4bf +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_6_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_6_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a1e1f676be290c4a9e8b8ae2a4aa26b3de2f5eb4 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92eba03c5b704e1932b5aa0ece805104554332f51efc69f75f4c630ced340d24 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_6_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_6_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2ec00cc83d8cf95ce58f1abb7f6ab51f04ea4f5c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ef48763c64eed1ace9c8a7fc69c3b14c2ca5129d49acb983d5ea1efbac5e1d +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_6_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_6_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8565a1cd2aead8f9d7902ca29424984ba33caaa3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c05ad6a45ad17daa80235c549214f32eeaba9f69b402ac0c1c7109216f88a6cb +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_6_self_attn_q_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_6_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ddcc0e634c5858b8e67a2de2eee6ad4d373f5288 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3cddb0409fa1313c40e151d7a899de986aef92bb4c61bf2800418fe6bb5b3fd +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_6_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_6_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..40bdf5515f0f5d24dcc0f34fc7f64e4867e2c7f9 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_6_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8fe97ba20566e1b27aa6794c1f052d9f1efc58072e287d3cb493f10f02c9527 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_7_mlp_down_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_7_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..b454df196fb9737ecefc7d3b0c1919af605d09e3 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad6d689c8e0d069186f2fa1e9ba5ecdf3b8a2e64963a66d9d0eb2cba652e789e +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_7_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_7_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..fbc1d8c2b13f2c98ec05975b2d6281602556eb01 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a58dfd7dfb28b5e209e513f730182671cec5b96643448e9b6455225daa3083c9 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_7_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_7_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..9f12fa3c394660fc0e687162f4ff0c30f238e29e --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d35973bc3b452e23f3ac449aca1c06570b46b0b8f3d025886fb49ecd459eea7b +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_7_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_7_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..cac20a5579f548fbc27029d102e397e0b9cae510 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:821cabf4b6e8d89de307785aea1b7566cc776bf740e9a7cbeca7d9f09a0878a0 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_7_self_attn_o_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_7_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..e1adc0a3ffdd6bf0d6cf078fd0830428e26fb703 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af0ee7e011eb370382aea2b2d3df96a33594101db731b9783c905ceb386c2132 +size 1310720 diff --git a/qwen3-4b-log5-unary/model_layers_7_self_attn_q_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_7_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..3a07139490cb8a112db0e530e459751d851d560b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_7_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c9b2c60f7d11c507bd9f402b34ca360fedc08c54276081451b5021d7a70c310 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_8_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_8_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..30c2495c37bda160adf52bae7c94976d4b01d219 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b681de219e0e73a3c1cf48ebe18e2f5647f3b15d9068db4d535917668d50e80e +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_8_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_8_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..468427387c69b2cbfd0bbec4196beba8235aec0c --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82aeeb884f9fe91db5dd64edd859c2d9cbc38d3d91db1b98a256a1590efd04f0 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_8_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_8_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..27de1df877a9a48b9e090fab130a85e6c8e31264 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a13d7473c60730761bdd2be50eb4f1ad5dae18fecad864592cec2e81ae952a6 +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_8_mlp_up_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_8_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..b3c4a0a7c9082fcef297e908aeacc5af534af85f --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a17117ab613e15c28d76b2420ad3e9d8d6fa163d814090499692b38ed6290f4 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_8_mlp_up_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_8_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f8b7dd84c7d9bdcd0f6b7caa7136685f1abaea65 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84abf94ec63214f0fbcbe770abe9804ca09c8d31a1fd9509489fc33a800b260f +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_8_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_8_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a8ccffcd3ae937f8b8ac1d253bae32fe283ae611 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2f440cdb346a6eea41edcbcbd1ada3eb249ea47fb38beb0b921445e1ae422f6 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_8_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_8_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..6fb956520c88d1adb02e3a022ae2a1d9625575c7 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_8_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:438af986d45680a104d862cecf1f38268c0b54460ac4b0ce2f411d7fb21bfbb7 +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_9_mlp_down_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_9_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..af0db4952c8a387ab6e02763171aac313320429b --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8283fca7ec6ff7b9d9896dd04fecb79ad1d4d75768fe9f6ea91984027fc563fb +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_9_mlp_gate_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_9_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2280b68cb3e212b6333c204721d52cfff4f693c0 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4332ece0e6c91d37d2fb93b15c86cb5aab53d083c47dc670066e6765118ad4b3 +size 15564800 diff --git a/qwen3-4b-log5-unary/model_layers_9_mlp_gate_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_9_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..351a24f3c9c4cc257a53e82190307f77591ca4f2 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b2211fc02216c79a38ac4a438a34d6c5ddd4148d382e498827b5522baf6f98b +size 3112960 diff --git a/qwen3-4b-log5-unary/model_layers_9_self_attn_k_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_9_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..206cde6bd46c15f4fb6a817d16a1caee3b95cd64 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18c65551cfb652ff1441453c6d6b386001dae8935537e7a61b64b34a09df5c14 +size 327680 diff --git a/qwen3-4b-log5-unary/model_layers_9_self_attn_o_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_9_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c9eb3a96ed5b6e65d2b54f521f403d406dfda299 --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1af6feb7fdf7358dbecba630f941f9806fe53c0cee3f9796657279f80d65bb48 +size 6553600 diff --git a/qwen3-4b-log5-unary/model_layers_9_self_attn_v_proj_weight.planes b/qwen3-4b-log5-unary/model_layers_9_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..90d61ec9e848b3c9066d8cb49970eac8367011ed --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d17a5c3a51a6df7c80b68a829df0677f8a58ca29215f027065bce6dcdae933b +size 1638400 diff --git a/qwen3-4b-log5-unary/model_layers_9_self_attn_v_proj_weight.sign b/qwen3-4b-log5-unary/model_layers_9_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..7e10eb5ff053f342fec3bd5f964f5f3c20ccc3ef --- /dev/null +++ b/qwen3-4b-log5-unary/model_layers_9_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:242f1caa25789a5917bcaa649b32e03b3301712b51d476cca436be9ee69b59b4 +size 327680