Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +49 -0
- deepseek-r1-1.5b-gunary/model_layers_21_self_attn_k_proj_bias.fp16 +0 -0
- deepseek-r1-1.5b-ternary/model_layers_0_mlp_gate_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_10_mlp_down_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_10_mlp_gate_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_10_self_attn_o_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_11_mlp_down_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_11_mlp_gate_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_12_mlp_up_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_12_self_attn_o_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_14_mlp_down_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_14_self_attn_o_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_14_self_attn_o_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_15_mlp_down_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_16_mlp_up_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_16_mlp_up_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_17_mlp_down_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_17_mlp_gate_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_18_mlp_up_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_18_self_attn_o_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_19_self_attn_q_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_19_self_attn_q_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_1_self_attn_q_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_21_mlp_gate_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_21_mlp_gate_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_21_mlp_up_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_21_self_attn_o_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_22_mlp_down_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_22_mlp_up_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_23_mlp_down_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_23_mlp_up_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_23_self_attn_q_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_25_self_attn_q_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_26_mlp_gate_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_27_mlp_gate_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_2_mlp_up_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_2_self_attn_q_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_3_mlp_down_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_3_mlp_down_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_3_mlp_up_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_4_mlp_down_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_4_mlp_up_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_4_self_attn_o_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_5_mlp_up_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_5_self_attn_o_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_5_self_attn_q_proj_weight.pos +3 -0
- deepseek-r1-1.5b-ternary/model_layers_6_mlp_up_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_7_mlp_down_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_7_self_attn_o_proj_weight.neg +3 -0
- deepseek-r1-1.5b-ternary/model_layers_8_mlp_down_proj_weight.pos +3 -0
.gitattributes
CHANGED
|
@@ -3372,3 +3372,52 @@ qwen3-4b-log-unary/model_layers_35_self_attn_o_proj_weight.sign filter=lfs diff=
|
|
| 3372 |
qwen3-4b-log-unary/model_layers_14_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 3373 |
qwen3-4b-log-unary/model_layers_21_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 3374 |
qwen3-4b-log-unary/model_layers_12_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3372 |
qwen3-4b-log-unary/model_layers_14_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 3373 |
qwen3-4b-log-unary/model_layers_21_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 3374 |
qwen3-4b-log-unary/model_layers_12_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 3375 |
+
deepseek-r1-1.5b-ternary/model_layers_21_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3376 |
+
deepseek-r1-1.5b-ternary/model_layers_10_mlp_gate_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3377 |
+
deepseek-r1-1.5b-ternary/model_layers_4_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3378 |
+
deepseek-r1-1.5b-ternary/model_layers_11_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3379 |
+
deepseek-r1-1.5b-ternary/model_layers_19_self_attn_q_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3380 |
+
deepseek-r1-1.5b-ternary/model_layers_21_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3381 |
+
deepseek-r1-1.5b-ternary/model_layers_18_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3382 |
+
deepseek-r1-1.5b-ternary/model_layers_18_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3383 |
+
deepseek-r1-1.5b-ternary/model_layers_5_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3384 |
+
deepseek-r1-1.5b-ternary/model_layers_22_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3385 |
+
deepseek-r1-1.5b-ternary/model_layers_25_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3386 |
+
deepseek-r1-1.5b-ternary/model_layers_15_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3387 |
+
deepseek-r1-1.5b-ternary/model_layers_14_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3388 |
+
deepseek-r1-1.5b-ternary/model_layers_2_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3389 |
+
deepseek-r1-1.5b-ternary/model_layers_3_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3390 |
+
deepseek-r1-1.5b-ternary/model_layers_1_self_attn_q_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3391 |
+
deepseek-r1-1.5b-ternary/model_layers_21_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3392 |
+
deepseek-r1-1.5b-ternary/model_layers_3_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3393 |
+
deepseek-r1-1.5b-ternary/model_layers_22_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3394 |
+
deepseek-r1-1.5b-ternary/model_layers_6_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3395 |
+
deepseek-r1-1.5b-ternary/model_layers_5_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3396 |
+
deepseek-r1-1.5b-ternary/model_layers_23_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3397 |
+
deepseek-r1-1.5b-ternary/model_layers_8_mlp_gate_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3398 |
+
deepseek-r1-1.5b-ternary/model_layers_2_self_attn_q_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3399 |
+
deepseek-r1-1.5b-ternary/model_layers_7_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3400 |
+
deepseek-r1-1.5b-ternary/model_layers_12_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3401 |
+
deepseek-r1-1.5b-ternary/model_layers_16_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3402 |
+
deepseek-r1-1.5b-ternary/model_layers_3_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3403 |
+
deepseek-r1-1.5b-ternary/model_layers_10_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3404 |
+
deepseek-r1-1.5b-ternary/model_layers_4_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3405 |
+
deepseek-r1-1.5b-ternary/model_layers_0_mlp_gate_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3406 |
+
deepseek-r1-1.5b-ternary/model_layers_12_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3407 |
+
deepseek-r1-1.5b-ternary/model_layers_11_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3408 |
+
deepseek-r1-1.5b-ternary/model_layers_21_mlp_gate_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3409 |
+
deepseek-r1-1.5b-ternary/model_layers_26_mlp_gate_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3410 |
+
deepseek-r1-1.5b-ternary/model_layers_8_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3411 |
+
deepseek-r1-1.5b-ternary/model_layers_14_self_attn_o_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3412 |
+
deepseek-r1-1.5b-ternary/model_layers_5_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3413 |
+
deepseek-r1-1.5b-ternary/model_layers_17_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3414 |
+
deepseek-r1-1.5b-ternary/model_layers_4_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3415 |
+
deepseek-r1-1.5b-ternary/model_layers_27_mlp_gate_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3416 |
+
deepseek-r1-1.5b-ternary/model_layers_23_mlp_up_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3417 |
+
deepseek-r1-1.5b-ternary/model_layers_16_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3418 |
+
deepseek-r1-1.5b-ternary/model_layers_19_self_attn_q_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3419 |
+
deepseek-r1-1.5b-ternary/model_layers_7_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3420 |
+
deepseek-r1-1.5b-ternary/model_layers_17_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3421 |
+
deepseek-r1-1.5b-ternary/model_layers_14_mlp_down_proj_weight.pos filter=lfs diff=lfs merge=lfs -text
|
| 3422 |
+
deepseek-r1-1.5b-ternary/model_layers_10_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
| 3423 |
+
deepseek-r1-1.5b-ternary/model_layers_23_mlp_down_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
|
deepseek-r1-1.5b-gunary/model_layers_21_self_attn_k_proj_bias.fp16
ADDED
|
Binary file (512 Bytes). View file
|
|
|
deepseek-r1-1.5b-ternary/model_layers_0_mlp_gate_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de489dd041b078296df2bfdf3957ee757314de4a17e48ef8928c67484928d4a3
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_10_mlp_down_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c3462dfd3b9426d07c67c759bc05e072625faa8d8b5c426d818ca336651a4db3
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_10_mlp_gate_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5e5388a8688a1f1020023b7c64a10a534abc73b9fa667c7418d3c6a1e09b5edb
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_10_self_attn_o_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59da0e8e2bef01955a29588574acbc531714c1ed4be58205e19f1d15077224b5
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_11_mlp_down_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2234be9dfa8679b5377218d2c9a087d193506fa5ec3466c47baaa924becab497
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_11_mlp_gate_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5deb6871e4f603ac8a2902a52a8b50519b3f0db755cf523a713d326fb84b1271
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_12_mlp_up_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b0488008f7a3492aca2c31600eae8628633cd136e817c5a7a7862ec86d49745
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_12_self_attn_o_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:24b622d6462b3e932e02afd7a6a27e1be3613e825e9a5a64a29903581dbad5bc
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_14_mlp_down_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4cbff4fce66e97beac6bb5b73c8b71e3fe08bb0faa73d8dfe220cf7752c4f259
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_14_self_attn_o_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf01c0f7247214f93de6a50a4f65eb1f16f279be635d0f82923c842559773e7f
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_14_self_attn_o_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9007fc19f7189394e897296bb7d64b63129f7f85503046bbb2ebe4dc26e93bc4
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_15_mlp_down_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8dcf9541fd16f739e08d74fd5f517c9902e7051ce4c974fb03b008ee6d84319f
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_16_mlp_up_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4a4426c8083aa7e392ca710efdd65264a0c9c4eb6cc2009e3c386e68039f9490
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_16_mlp_up_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20991dd62db1c465f05535c62d46c4780fdfd5a635bebed811ecda1ca60d7db1
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_17_mlp_down_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea52af4db0fc5b759bc77415307b5a7fc3a802614f9f2df2ea06c0a086c01f8b
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_17_mlp_gate_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35dfff0a7c66c1b0b38fb5f3f1f10e6a105d16cbabb0f553fbd374ee408472fa
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_18_mlp_up_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ccf0b420c9fa96261d1a6e32ef8d882abc047cf9b1b444abdefd264714c15b46
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_18_self_attn_o_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09a35140fef4e3fae793001b49a9742eaa2a482286af9da8687607a2111c421e
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_19_self_attn_q_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6aeb6783c725134d48dedb4213e1613952e370d0059eb57e1ce0c6b232a9090a
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_19_self_attn_q_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:652b2a4a2b436b14806b9fed94989c7fc1dab6508d46099e7c853a5068ed28be
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_1_self_attn_q_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba25ff746e015eaab25813f2af4ceb17e9c8f9abb50c9516d70a01e5e3cfaba2
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_21_mlp_gate_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:425d692aff34d727e9dc018d70935a0e1357916bf873498da28a0bd874bbd63b
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_21_mlp_gate_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92bf85e0c847fa1abfc558f3ba06561cb9d1e7f3117808c12490a32c64d15f8d
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_21_mlp_up_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2b8797ae6228937734c740231274307e3cb0718f6ffb613164a1cc5f779e5c6
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_21_self_attn_o_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a051535127ce040530c92b18e8b18800d5f259c081e52a480bb117898c5aedf
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_22_mlp_down_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de898333032d190f4887fa86619c319f0a8697656a119468a131ec4fe16b9159
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_22_mlp_up_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:425892268cb48f981b1ce4dfd4ddad025ff5506894d4e73cb18238e4de1db1d3
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_23_mlp_down_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55d0d34ec2e1d7d1bef900d0a2aa397d31c7a8b51253a83c616b128cad64b53a
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_23_mlp_up_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e7e311cb4d16d846ccafdb92b4499d2ddbdb6ad648f0d9f5212803bd9580daa
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_23_self_attn_q_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d813b92570faff377d0bebab455d5c1f7c4de52a5543e2e950047afcadeb102
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_25_self_attn_q_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e9e9071416181392dc6c267e32bb8d81c2ec6e10e140037c22dd42f1b7c64d3d
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_26_mlp_gate_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b819c077f00e2d1ce42f8d69fe7505568c9db0f75064c0163635be8d0cb8ccdd
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_27_mlp_gate_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d60dbb21674219ecf6de83e0af4c0ca27fabde724995da0e8b2ba405bf3e859f
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_2_mlp_up_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:73b3889d44fe85ed05c0b0fc5b97a44df2452ec2d83d83920e375f62bf6c7e0c
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_2_self_attn_q_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98161995eb25076ed4fdd35a313307fb1bf6deb1be35704b977cf45da53866a3
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_3_mlp_down_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6f4cfe1994854ecfe3661ee6e26aebe41c8c083b3e771fcc869edc56d99ce11
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_3_mlp_down_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a5c215f2d6e5d315f435d4cfc784a90edeb3ad2959307a9ca1e43a2c8af9711
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_3_mlp_up_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0af187d3d7cabb7d40532bd1b1e3a39f4df40bde94282c639ec764ef8c232489
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_4_mlp_down_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a04cd57597475d07339c7967ce3777bdf6d28cb41408539c88a4a5353db8380
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_4_mlp_up_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b072bf0ed483cdd4de445d55a5155e026785176234858caad086ed6914dbc1b
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_4_self_attn_o_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba22d2a6324dc7be784edd4247df14d6c143f5026b8b110f08a013351bce8be5
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_5_mlp_up_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:478cbfe9e6a0b41164a6ab7b3809c2120203cbc8adb96ae084a7b6de49038e04
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_5_self_attn_o_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc0f5faf3513cd391086d7c1337684e1818b4af5efae1f5345704b70da3df607
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_5_self_attn_q_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:005c37f33205eacaf398a7cf62c315ce0cd576abc4fe7f0bfe0802eebe23e178
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_6_mlp_up_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a4a9b0f7f109076bd1a9293648dddb2c355980efaae72954bee4dff0babf1ba6
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_7_mlp_down_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5ffd2c5dd95f95a2178f3bd7698e954681356d8aa8518213a65b30333c1ab01
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-ternary/model_layers_7_self_attn_o_proj_weight.neg
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f85a1678addaff23f2e763505b855d2e1605c5fac8828d0e8497e0720077b0d
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-ternary/model_layers_8_mlp_down_proj_weight.pos
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0067e74da702cb0a0c04039ec4a8629652e1ebdcbe7e36f4854ab1bcdc7dcef5
|
| 3 |
+
size 1720320
|