Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +42 -0
- deepseek-r1-1.5b-unary4/model_layers_0_mlp_gate_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_0_mlp_gate_proj_weight.sign +3 -0
- deepseek-r1-1.5b-unary4/model_layers_0_self_attn_v_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_10_mlp_down_proj_weight.planes +3 -0
- deepseek-r1-1.5b-unary4/model_layers_10_post_attention_layernorm_weight.fp16 +0 -0
- deepseek-r1-1.5b-unary4/model_layers_10_self_attn_k_proj_weight.sign +0 -0
- deepseek-r1-1.5b-unary4/model_layers_10_self_attn_v_proj_weight.sign +0 -0
- deepseek-r1-1.5b-unary4/model_layers_11_mlp_down_proj_weight.sign +3 -0
- deepseek-r1-1.5b-unary4/model_layers_11_mlp_up_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_11_self_attn_k_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_11_self_attn_q_proj_weight.planes +3 -0
- deepseek-r1-1.5b-unary4/model_layers_11_self_attn_q_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_11_self_attn_v_proj_weight.planes +3 -0
- deepseek-r1-1.5b-unary4/model_layers_12_self_attn_k_proj_bias.fp16 +0 -0
- deepseek-r1-1.5b-unary4/model_layers_12_self_attn_o_proj_weight.sign +3 -0
- deepseek-r1-1.5b-unary4/model_layers_12_self_attn_v_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_13_mlp_gate_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_14_mlp_up_proj_weight.sign +3 -0
- deepseek-r1-1.5b-unary4/model_layers_15_self_attn_k_proj_bias.fp16 +0 -0
- deepseek-r1-1.5b-unary4/model_layers_15_self_attn_k_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_16_input_layernorm_weight.fp16 +0 -0
- deepseek-r1-1.5b-unary4/model_layers_16_mlp_up_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_16_post_attention_layernorm_weight.fp16 +0 -0
- deepseek-r1-1.5b-unary4/model_layers_16_self_attn_k_proj_bias.fp16 +0 -0
- deepseek-r1-1.5b-unary4/model_layers_16_self_attn_v_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_16_self_attn_v_proj_weight.sign +0 -0
- deepseek-r1-1.5b-unary4/model_layers_17_mlp_up_proj_weight.planes +3 -0
- deepseek-r1-1.5b-unary4/model_layers_17_self_attn_o_proj_weight.planes +3 -0
- deepseek-r1-1.5b-unary4/model_layers_17_self_attn_o_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_18_self_attn_k_proj_weight.planes +3 -0
- deepseek-r1-1.5b-unary4/model_layers_18_self_attn_o_proj_weight.sign +3 -0
- deepseek-r1-1.5b-unary4/model_layers_18_self_attn_q_proj_bias.fp16 +0 -0
- deepseek-r1-1.5b-unary4/model_layers_18_self_attn_q_proj_weight.sign +3 -0
- deepseek-r1-1.5b-unary4/model_layers_19_input_layernorm_weight.fp16 +0 -0
- deepseek-r1-1.5b-unary4/model_layers_19_self_attn_o_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_19_self_attn_v_proj_weight.planes +3 -0
- deepseek-r1-1.5b-unary4/model_layers_1_self_attn_o_proj_weight.planes +3 -0
- deepseek-r1-1.5b-unary4/model_layers_1_self_attn_o_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_1_self_attn_v_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_20_self_attn_q_proj_bias.fp16 +0 -0
- deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.planes +3 -0
- deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.sign +3 -0
- deepseek-r1-1.5b-unary4/model_layers_21_self_attn_k_proj_weight.sign +0 -0
- deepseek-r1-1.5b-unary4/model_layers_21_self_attn_v_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.planes +3 -0
- deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.sign +3 -0
- deepseek-r1-1.5b-unary4/model_layers_22_mlp_up_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_22_self_attn_o_proj_weight.scales +0 -0
- deepseek-r1-1.5b-unary4/model_layers_22_self_attn_v_proj_weight.scales +0 -0
.gitattributes
CHANGED
|
@@ -2890,3 +2890,45 @@ qwen3-4b-log-unary/model_layers_27_self_attn_k_proj_weight.sign filter=lfs diff=
|
|
| 2890 |
qwen3-4b-log-unary/model_layers_2_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2891 |
qwen3-4b-log-unary/model_layers_10_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2892 |
qwen3-4b-log-unary/model_layers_31_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2890 |
qwen3-4b-log-unary/model_layers_2_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2891 |
qwen3-4b-log-unary/model_layers_10_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2892 |
qwen3-4b-log-unary/model_layers_31_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2893 |
+
deepseek-r1-1.5b-unary4/model_layers_11_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2894 |
+
deepseek-r1-1.5b-unary4/model_layers_4_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2895 |
+
deepseek-r1-1.5b-unary4/model_layers_18_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2896 |
+
deepseek-r1-1.5b-unary4/model_layers_10_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2897 |
+
deepseek-r1-1.5b-unary4/model_layers_26_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2898 |
+
deepseek-r1-1.5b-unary4/model_layers_6_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2899 |
+
deepseek-r1-1.5b-unary4/model_layers_18_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2900 |
+
deepseek-r1-1.5b-unary4/model_layers_27_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2901 |
+
deepseek-r1-1.5b-unary4/model_layers_27_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2902 |
+
deepseek-r1-1.5b-unary4/model_layers_27_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2903 |
+
deepseek-r1-1.5b-unary4/model_layers_18_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2904 |
+
deepseek-r1-1.5b-unary4/model_layers_19_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2905 |
+
deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2906 |
+
deepseek-r1-1.5b-unary4/model_layers_17_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2907 |
+
deepseek-r1-1.5b-unary4/model_layers_11_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2908 |
+
deepseek-r1-1.5b-unary4/model_layers_7_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2909 |
+
deepseek-r1-1.5b-unary4/model_layers_3_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2910 |
+
deepseek-r1-1.5b-unary4/model_layers_17_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2911 |
+
deepseek-r1-1.5b-unary4/model_layers_8_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2912 |
+
deepseek-r1-1.5b-unary4/model_layers_25_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2913 |
+
deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2914 |
+
deepseek-r1-1.5b-unary4/model_layers_27_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2915 |
+
deepseek-r1-1.5b-unary4/model_layers_0_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2916 |
+
deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2917 |
+
deepseek-r1-1.5b-unary4/model_layers_25_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2918 |
+
deepseek-r1-1.5b-unary4/model_layers_5_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2919 |
+
deepseek-r1-1.5b-unary4/model_layers_2_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2920 |
+
deepseek-r1-1.5b-unary4/model_layers_27_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2921 |
+
deepseek-r1-1.5b-unary4/model_layers_3_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2922 |
+
deepseek-r1-1.5b-unary4/model_layers_11_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2923 |
+
deepseek-r1-1.5b-unary4/model_layers_24_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2924 |
+
deepseek-r1-1.5b-unary4/model_layers_23_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2925 |
+
deepseek-r1-1.5b-unary4/model_layers_5_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2926 |
+
deepseek-r1-1.5b-unary4/model_layers_14_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2927 |
+
deepseek-r1-1.5b-unary4/model_layers_12_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2928 |
+
deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2929 |
+
deepseek-r1-1.5b-unary4/model_layers_2_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2930 |
+
deepseek-r1-1.5b-unary4/model_layers_1_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2931 |
+
deepseek-r1-1.5b-unary4/model_layers_23_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 2932 |
+
deepseek-r1-1.5b-unary4/model_layers_25_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2933 |
+
deepseek-r1-1.5b-unary4/model_layers_2_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 2934 |
+
deepseek-r1-1.5b-unary4/model_layers_5_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
deepseek-r1-1.5b-unary4/model_layers_0_mlp_gate_proj_weight.scales
ADDED
|
Binary file (35.8 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_0_mlp_gate_proj_weight.sign
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2cf601ab6062858b266017e3ccc33f77bb1a6560510ddb28d0bddd9822adbd0b
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-unary4/model_layers_0_self_attn_v_proj_weight.scales
ADDED
|
Binary file (1.02 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_10_mlp_down_proj_weight.planes
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f005c0c74e5f79d926d9db3cb02f312d03559c820b03e4d45eb1fc381f2d303f
|
| 3 |
+
size 6881280
|
deepseek-r1-1.5b-unary4/model_layers_10_post_attention_layernorm_weight.fp16
ADDED
|
Binary file (3.07 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_10_self_attn_k_proj_weight.sign
ADDED
|
Binary file (49.2 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_10_self_attn_v_proj_weight.sign
ADDED
|
Binary file (49.2 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_11_mlp_down_proj_weight.sign
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b07cb8f37f8c3fb5f800b008ee48cc27f089db360aa642d7498bc09b8314e21c
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-unary4/model_layers_11_mlp_up_proj_weight.scales
ADDED
|
Binary file (35.8 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_11_self_attn_k_proj_weight.scales
ADDED
|
Binary file (1.02 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_11_self_attn_q_proj_weight.planes
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:391743aaf15f6307bc9b667a575007cea922b964c44b55499f683657c675cf1b
|
| 3 |
+
size 1179648
|
deepseek-r1-1.5b-unary4/model_layers_11_self_attn_q_proj_weight.scales
ADDED
|
Binary file (6.14 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_11_self_attn_v_proj_weight.planes
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e61fcc0005e9bc64d8257306654eacd8cf2a8b302e1b4c68c707f52b894c770f
|
| 3 |
+
size 196608
|
deepseek-r1-1.5b-unary4/model_layers_12_self_attn_k_proj_bias.fp16
ADDED
|
Binary file (512 Bytes). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_12_self_attn_o_proj_weight.sign
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b99c13197a9fd4d1233f95ba7aeaff88e06a93d91c95bb771fda4f56567a3cf2
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-unary4/model_layers_12_self_attn_v_proj_weight.scales
ADDED
|
Binary file (1.02 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_13_mlp_gate_proj_weight.scales
ADDED
|
Binary file (35.8 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_14_mlp_up_proj_weight.sign
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:71036189bc6c7101b6bebd0447e5613b8373df5f4687f35de2606e06905c73e1
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-unary4/model_layers_15_self_attn_k_proj_bias.fp16
ADDED
|
Binary file (512 Bytes). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_15_self_attn_k_proj_weight.scales
ADDED
|
Binary file (1.02 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_16_input_layernorm_weight.fp16
ADDED
|
Binary file (3.07 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_16_mlp_up_proj_weight.scales
ADDED
|
Binary file (35.8 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_16_post_attention_layernorm_weight.fp16
ADDED
|
Binary file (3.07 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_16_self_attn_k_proj_bias.fp16
ADDED
|
Binary file (512 Bytes). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_16_self_attn_v_proj_weight.scales
ADDED
|
Binary file (1.02 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_16_self_attn_v_proj_weight.sign
ADDED
|
Binary file (49.2 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_17_mlp_up_proj_weight.planes
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a2696679b07fd134e164866f5fc097081e6905a936b75b9be2c75e60a811954
|
| 3 |
+
size 6881280
|
deepseek-r1-1.5b-unary4/model_layers_17_self_attn_o_proj_weight.planes
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b2e8be702da7bd0675f0f830d4b54f5bbb43f884a6f95dc438791e6c91be091e
|
| 3 |
+
size 1179648
|
deepseek-r1-1.5b-unary4/model_layers_17_self_attn_o_proj_weight.scales
ADDED
|
Binary file (6.14 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_18_self_attn_k_proj_weight.planes
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa6452b5d4d246665da65f5db002758e0d27b5767dc46064f81d4b3fce597813
|
| 3 |
+
size 196608
|
deepseek-r1-1.5b-unary4/model_layers_18_self_attn_o_proj_weight.sign
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7809020bf04c489051e22e07494b20557ab1d7b99b6ac74741b55206a6092b4
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-unary4/model_layers_18_self_attn_q_proj_bias.fp16
ADDED
|
Binary file (3.07 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_18_self_attn_q_proj_weight.sign
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0cc73697f7d2c00e8a7ba5c1d7a5006479360a95f8a8860700b53aa831558a47
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-unary4/model_layers_19_input_layernorm_weight.fp16
ADDED
|
Binary file (3.07 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_19_self_attn_o_proj_weight.scales
ADDED
|
Binary file (6.14 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_19_self_attn_v_proj_weight.planes
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e6ad6327989a0def858d1449b0926b9ccdc0c3144690ab365e747325ea374779
|
| 3 |
+
size 196608
|
deepseek-r1-1.5b-unary4/model_layers_1_self_attn_o_proj_weight.planes
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:42d7c59df70a966def7b8582254155515b7e5c85f6b4a9036fcca78e3e5dca48
|
| 3 |
+
size 1179648
|
deepseek-r1-1.5b-unary4/model_layers_1_self_attn_o_proj_weight.scales
ADDED
|
Binary file (6.14 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_1_self_attn_v_proj_weight.scales
ADDED
|
Binary file (1.02 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_20_self_attn_q_proj_bias.fp16
ADDED
|
Binary file (3.07 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.planes
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a0bba536126dbf01e52d8c8d2f5e1344e021358015f8d38aa27ce08a632112b
|
| 3 |
+
size 6881280
|
deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.sign
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:154c898127685a5d1f62f4d132b2ddb359cf897cf0567784b03eff0baa5c31fb
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-unary4/model_layers_21_self_attn_k_proj_weight.sign
ADDED
|
Binary file (49.2 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_21_self_attn_v_proj_weight.scales
ADDED
|
Binary file (1.02 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.planes
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1513867e9552859d2ec309485f86a9bc766b34df35f2704a5c0a5182f459b138
|
| 3 |
+
size 6881280
|
deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.sign
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0cead535970fe45255a6aace0b589ee94e9ccc3daf2499e7af6e07d56599e3c3
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-unary4/model_layers_22_mlp_up_proj_weight.scales
ADDED
|
Binary file (35.8 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_22_self_attn_o_proj_weight.scales
ADDED
|
Binary file (6.14 kB). View file
|
|
|
deepseek-r1-1.5b-unary4/model_layers_22_self_attn_v_proj_weight.scales
ADDED
|
Binary file (1.02 kB). View file
|
|
|