diff --git a/.gitattributes b/.gitattributes index b848baeda59422018d85e80bf99f0394cb9ebfd0..9aeeaba43c2040cb78b3b4f2f8cc751dfba0df61 100644 --- a/.gitattributes +++ b/.gitattributes @@ -3263,3 +3263,7 @@ deepseek-r1-1.5b-ternary/model_layers_14_mlp_down_proj_weight.neg filter=lfs dif deepseek-r1-1.5b-ternary/model_layers_7_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text deepseek-r1-1.5b-ternary/model_layers_15_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text deepseek-r1-1.5b-ternary/model_layers_14_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_3_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_11_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_17_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text +deepseek-r1-1.5b-ternary/model_layers_17_mlp_gate_proj_weight.neg filter=lfs diff=lfs merge=lfs -text diff --git a/deepseek-r1-1.5b-gunary/model_layers_11_self_attn_v_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_11_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f802f66e6b93746d41e2fcc658629febf5d95166 Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_layers_11_self_attn_v_proj_weight.sign differ diff --git a/deepseek-r1-1.5b-gunary/model_layers_17_self_attn_v_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_17_self_attn_v_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..53d92270570fa0f72b452020f9e77ade7c87054c Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_layers_17_self_attn_v_proj_weight.gscales differ diff --git a/deepseek-r1-1.5b-gunary/model_layers_18_self_attn_v_proj_bias.fp16 b/deepseek-r1-1.5b-gunary/model_layers_18_self_attn_v_proj_bias.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..8aba38e12f9ca74ade5997916a7a3bb25535de37 Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_layers_18_self_attn_v_proj_bias.fp16 differ diff --git a/deepseek-r1-1.5b-gunary/model_layers_1_self_attn_k_proj_weight.sign b/deepseek-r1-1.5b-gunary/model_layers_1_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..03141edd00880f0b86b88c6636653c35cb13e52b Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_layers_1_self_attn_k_proj_weight.sign differ diff --git a/deepseek-r1-1.5b-gunary/model_layers_22_input_layernorm_weight.fp16 b/deepseek-r1-1.5b-gunary/model_layers_22_input_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..754f2a4d90debcf3aeb44f2778b04eecfb1374df Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_layers_22_input_layernorm_weight.fp16 differ diff --git a/deepseek-r1-1.5b-gunary/model_layers_23_post_attention_layernorm_weight.fp16 b/deepseek-r1-1.5b-gunary/model_layers_23_post_attention_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..82154a9c197746ddd042cfd153b56df23baa21a8 Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_layers_23_post_attention_layernorm_weight.fp16 differ diff --git a/deepseek-r1-1.5b-gunary/model_layers_27_self_attn_q_proj_bias.fp16 b/deepseek-r1-1.5b-gunary/model_layers_27_self_attn_q_proj_bias.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..aaef25656c40ebbfa5da1c1f6dfb9f3a7db0db08 Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_layers_27_self_attn_q_proj_bias.fp16 differ diff --git a/deepseek-r1-1.5b-gunary/model_layers_4_self_attn_k_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_4_self_attn_k_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..72b8ffa9f34da300805404f021ef56459c6ce9ae Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_layers_4_self_attn_k_proj_weight.gscales differ diff --git a/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_v_proj_weight.gscales b/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_v_proj_weight.gscales new file mode 100644 index 0000000000000000000000000000000000000000..5513d6a121d63a3e9ab37d0d0a69b38a2e533059 Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_layers_8_self_attn_v_proj_weight.gscales differ diff --git a/deepseek-r1-1.5b-gunary/model_norm_weight.fp16 b/deepseek-r1-1.5b-gunary/model_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..e028ca2722863bfa678baf3b160412fa384f30a8 Binary files /dev/null and b/deepseek-r1-1.5b-gunary/model_norm_weight.fp16 differ diff --git a/deepseek-r1-1.5b-ternary/model_layers_11_self_attn_o_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_11_self_attn_o_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..00eef752803b2cc0f617d73b874c220c9925ee91 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_11_self_attn_o_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f567c0cc701f6fc315e0434b53ae7b7ba8b19cad0f46406357ef2a3d5c44b46 +size 294912 diff --git a/deepseek-r1-1.5b-ternary/model_layers_17_mlp_down_proj_weight.pos b/deepseek-r1-1.5b-ternary/model_layers_17_mlp_down_proj_weight.pos new file mode 100644 index 0000000000000000000000000000000000000000..bbdb61e9f2c8cb2605f90d7c624f5f285c03903c --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_17_mlp_down_proj_weight.pos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0bb91223789024707b1f3c1b6ac92a9c54ea59284266a48e6960da71f54aac8 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_17_mlp_gate_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_17_mlp_gate_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..2132c18bdfd1b390baced30a0b902e334fc10875 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_17_mlp_gate_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e726100bb59e8d0c1cd9a136a25277faad2a79fe9df2a7f17f6572fd504454 +size 1720320 diff --git a/deepseek-r1-1.5b-ternary/model_layers_3_mlp_up_proj_weight.neg b/deepseek-r1-1.5b-ternary/model_layers_3_mlp_up_proj_weight.neg new file mode 100644 index 0000000000000000000000000000000000000000..7aad07cf67cc16338e96b2af2737e8bc1967e509 --- /dev/null +++ b/deepseek-r1-1.5b-ternary/model_layers_3_mlp_up_proj_weight.neg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b24be988627435effb7e84cf8b2a59d76f6ec0dfc27cb1f4e5761584434735d3 +size 1720320 diff --git a/deepseek-r1-1.5b-unary/config.json b/deepseek-r1-1.5b-unary/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ad7884f93b6b3e7410463413372da14f2cc6cb41 --- /dev/null +++ b/deepseek-r1-1.5b-unary/config.json @@ -0,0 +1,13 @@ +{ + "hidden_size": 1536, + "intermediate_size": 8960, + "num_attention_heads": 12, + "num_key_value_heads": 2, + "num_hidden_layers": 28, + "vocab_size": 151936, + "head_dim": 128, + "rope_theta": 1000000.0, + "rms_norm_eps": 1e-06, + "n_planes": 7, + "quant_type": "unary" +} \ No newline at end of file diff --git a/deepseek-r1-1.5b-unary/model_layers_0_self_attn_q_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_0_self_attn_q_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..b94d3a26056ae13e003511a9842a1f021895be27 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_0_self_attn_q_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_10_mlp_up_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_10_mlp_up_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..97e85772f291873729de4a628593c8146d4529ad Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_10_mlp_up_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_10_self_attn_q_proj_bias.fp16 b/deepseek-r1-1.5b-unary/model_layers_10_self_attn_q_proj_bias.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..37c91a27fa24debad38b68b4937718c96e4bfad4 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_10_self_attn_q_proj_bias.fp16 differ diff --git a/deepseek-r1-1.5b-unary/model_layers_12_self_attn_k_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_12_self_attn_k_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..3d5fb21e947304ce8698d78b41a7ad53225f45f1 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_12_self_attn_k_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_12_self_attn_o_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_12_self_attn_o_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..96918a7603808743e4e1c65c6e419b8a9660e535 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_12_self_attn_o_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_14_self_attn_v_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_14_self_attn_v_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..7a0b45d4580ae03c74559ab37da0d33c9a2546e6 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_14_self_attn_v_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_16_mlp_gate_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_16_mlp_gate_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..f56ece90071e0e2a193307b0a81483ad2454f358 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_16_mlp_gate_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_16_self_attn_q_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_16_self_attn_q_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..8d8ea604df8d924f9dd685f262fda6b5d06b53fa Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_16_self_attn_q_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_17_post_attention_layernorm_weight.fp16 b/deepseek-r1-1.5b-unary/model_layers_17_post_attention_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..00f889b99c2652a77daf31ccc53d9ced249c3ba3 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_17_post_attention_layernorm_weight.fp16 differ diff --git a/deepseek-r1-1.5b-unary/model_layers_17_self_attn_k_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_17_self_attn_k_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..3c9eaca0825c289cec36699ad686980f5de86a47 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_17_self_attn_k_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_17_self_attn_q_proj_bias.fp16 b/deepseek-r1-1.5b-unary/model_layers_17_self_attn_q_proj_bias.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..879dbcd56affcfbd20af9b3450a827e8ac23ac7d Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_17_self_attn_q_proj_bias.fp16 differ diff --git a/deepseek-r1-1.5b-unary/model_layers_18_self_attn_o_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_18_self_attn_o_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..b92a3d1aa059446f67f29273333c92a73000e9fb Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_18_self_attn_o_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_19_self_attn_k_proj_weight.sign b/deepseek-r1-1.5b-unary/model_layers_19_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..56f5b49ac5d1a30f808692813610c02ccef558b2 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_19_self_attn_k_proj_weight.sign differ diff --git a/deepseek-r1-1.5b-unary/model_layers_1_mlp_down_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_1_mlp_down_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..0efa47d2f3091f4cb7c90bdef7320406ad4f6723 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_1_mlp_down_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_1_self_attn_k_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_1_self_attn_k_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..5828613ee205b174dbfc1f4f632dd30a4aba5f85 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_1_self_attn_k_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_1_self_attn_v_proj_weight.sign b/deepseek-r1-1.5b-unary/model_layers_1_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f1e1175627aaadb9325d72b57300b82b25c3043f Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_1_self_attn_v_proj_weight.sign differ diff --git a/deepseek-r1-1.5b-unary/model_layers_20_input_layernorm_weight.fp16 b/deepseek-r1-1.5b-unary/model_layers_20_input_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..8a042895077821880f716b03d5f483d8669cad26 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_20_input_layernorm_weight.fp16 differ diff --git a/deepseek-r1-1.5b-unary/model_layers_21_self_attn_q_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_21_self_attn_q_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..7b24f3b68a4be50ecc2515725b7a46127de44851 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_21_self_attn_q_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_22_mlp_down_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_22_mlp_down_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..2d8bad17a13035c76a7c181d856e186dacfdd0c3 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_22_mlp_down_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_23_mlp_gate_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_23_mlp_gate_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..29791c352e74b53934fbfc242d29474b4c49db40 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_23_mlp_gate_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_23_self_attn_o_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_23_self_attn_o_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..72120be0ab4fa286df617efb1151549528705b6e Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_23_self_attn_o_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_25_self_attn_q_proj_bias.fp16 b/deepseek-r1-1.5b-unary/model_layers_25_self_attn_q_proj_bias.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..410431ac742d3ccc6fd4615eb565773e2aa1f755 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_25_self_attn_q_proj_bias.fp16 differ diff --git a/deepseek-r1-1.5b-unary/model_layers_26_self_attn_v_proj_bias.fp16 b/deepseek-r1-1.5b-unary/model_layers_26_self_attn_v_proj_bias.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..989a0bba49e703f8f30ef4a088a69eccd1f5872a Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_26_self_attn_v_proj_bias.fp16 differ diff --git a/deepseek-r1-1.5b-unary/model_layers_27_self_attn_v_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_27_self_attn_v_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..922e1c31b73aeda5ea1dd86e771cf724ac1df764 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_27_self_attn_v_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_3_self_attn_q_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_3_self_attn_q_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..b9ed0be039e4f2c1aab8ac5c8660d4394fb1d0a9 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_3_self_attn_q_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_5_self_attn_k_proj_bias.fp16 b/deepseek-r1-1.5b-unary/model_layers_5_self_attn_k_proj_bias.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..770c264cb5354136f1f8a94488d3d68584801d04 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_5_self_attn_k_proj_bias.fp16 differ diff --git a/deepseek-r1-1.5b-unary/model_layers_5_self_attn_k_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_5_self_attn_k_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..73f209462b595cae21608b0f7176940d808b6258 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_5_self_attn_k_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_7_self_attn_k_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_7_self_attn_k_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..f547eab26f3f5a68e9709a358460a4716a9581bf Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_7_self_attn_k_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_8_self_attn_k_proj_weight.sign b/deepseek-r1-1.5b-unary/model_layers_8_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ee7d9d76fb8cd89d756b6e6e59276f5a4c3f77b1 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_8_self_attn_k_proj_weight.sign differ diff --git a/deepseek-r1-1.5b-unary/model_layers_8_self_attn_v_proj_weight.sign b/deepseek-r1-1.5b-unary/model_layers_8_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..66d95813be7a1cc30ac2e2ea3bef606235a0a5c9 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_8_self_attn_v_proj_weight.sign differ diff --git a/deepseek-r1-1.5b-unary/model_layers_9_self_attn_q_proj_bias.fp16 b/deepseek-r1-1.5b-unary/model_layers_9_self_attn_q_proj_bias.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..481af2f5d19a52afd43711747fe2739a46864394 Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_9_self_attn_q_proj_bias.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_0_mlp_up_proj_weight.scales b/qwen3-4b-proper-unary/model_layers_0_mlp_up_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..5a40813b60d708a7b3ac1c0f2159fb11576411ef Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_0_mlp_up_proj_weight.scales differ diff --git a/qwen3-4b-proper-unary/model_layers_0_post_attention_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_0_post_attention_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..ddf2325d89c2a0c2969bef8d0733a097cd8ddd92 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_0_post_attention_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_0_self_attn_k_proj_weight.scales b/qwen3-4b-proper-unary/model_layers_0_self_attn_k_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..75d36c84086581def10646e734682fa962e458e7 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_0_self_attn_k_proj_weight.scales differ diff --git a/qwen3-4b-proper-unary/model_layers_10_self_attn_q_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_10_self_attn_q_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..5f85f4fb5160a0ee82d91d9ce572e2016da32f4c Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_10_self_attn_q_norm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_11_input_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_11_input_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..52499e93630e7921e0da2fe4b47f4d798fb1d83d Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_11_input_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_12_post_attention_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_12_post_attention_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..c72775782c008188e316cf30a6b6fdd14c1f5b5f Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_12_post_attention_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_13_post_attention_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_13_post_attention_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..a570d2e3c4bfa60d0a58d8fec2e2608a1983dae1 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_13_post_attention_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_13_self_attn_k_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_13_self_attn_k_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..a3a4309775e29f06791a78a779e13eac59d8ff86 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_13_self_attn_k_norm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_13_self_attn_q_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_13_self_attn_q_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..0357fa9511a40947398e985cb9b6ea2460abc227 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_13_self_attn_q_norm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_14_input_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_14_input_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..11da36bdf7e6d2f8df7ab1c9445f5190a41c11cf Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_14_input_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_14_post_attention_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_14_post_attention_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..b081241e31201fc433b5d2d1af7ceb760ded4ac1 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_14_post_attention_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_14_self_attn_k_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_14_self_attn_k_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..a236be9659b02635488cb8616abd215f61833a76 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_14_self_attn_k_norm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_14_self_attn_q_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_14_self_attn_q_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..e1d32eeb4ab1cf6b1cf0caa601e86a706d23b032 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_14_self_attn_q_norm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_15_self_attn_k_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_15_self_attn_k_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..766c14e53d76639c9ffb39ca01a9cd72364ea5c9 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_15_self_attn_k_norm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_1_input_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_1_input_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..6cd201175102c40b23a4ee170ebabb7e90a7671f Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_1_input_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_1_post_attention_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_1_post_attention_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..696f1e824dcade6562adf0da8bf4dca4bec97fe6 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_1_post_attention_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_1_self_attn_q_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_1_self_attn_q_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..ba78fb8ed7135d6aaf3af1d7f6387d4e910ce335 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_1_self_attn_q_norm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_2_input_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_2_input_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..52fba755b6dba7d9499687ce8c6ed48409dcc802 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_2_input_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_2_self_attn_q_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_2_self_attn_q_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..a2375f141a0dbb68bf7ac76f2464ca2375d7e11a Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_2_self_attn_q_norm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_3_post_attention_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_3_post_attention_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..3f9c8834a881d34023e4b744ca9d59995da81a15 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_3_post_attention_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_3_self_attn_q_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_3_self_attn_q_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..50ba44e8887376265cb4df8a761bd3c327395059 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_3_self_attn_q_norm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_4_input_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_4_input_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..e44ae9067c229054114f6d04946dc6981c4df6f8 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_4_input_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_4_self_attn_k_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_4_self_attn_k_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..6debe817ce6410c0d06405cdbfd9835a72fee41b Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_4_self_attn_k_norm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_5_post_attention_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_5_post_attention_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..b7a74aa61fad1efeb335d22d927ad2b260dfe694 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_5_post_attention_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_7_input_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_7_input_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..bc8320b03cb74164ca2b8fe4bd7c7ff83651dcb8 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_7_input_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_7_post_attention_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_7_post_attention_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..1bc37e264ee9dae20330eeaa0a9ec2572d0de576 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_7_post_attention_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_8_post_attention_layernorm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_8_post_attention_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..461f3d92a416feda72f3e42103975fada160278c Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_8_post_attention_layernorm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_8_self_attn_q_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_8_self_attn_q_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..569fc6ded356dfbd7222bbee713514d14d50b68f Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_8_self_attn_q_norm_weight.fp16 differ diff --git a/qwen3-4b-proper-unary/model_layers_9_self_attn_q_norm_weight.fp16 b/qwen3-4b-proper-unary/model_layers_9_self_attn_q_norm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..4cc2f8b46a2d4070a2bff470095454e6d52195d6 Binary files /dev/null and b/qwen3-4b-proper-unary/model_layers_9_self_attn_q_norm_weight.fp16 differ