Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +69 -0
- deepseek-r1-1.5b-packed/model_layers_0_mlp_gate_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_0_self_attn_o_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_10_mlp_down_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_10_mlp_up_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_10_self_attn_o_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_11_self_attn_o_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_12_self_attn_q_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_13_mlp_down_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_13_self_attn_q_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_14_mlp_gate_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_14_mlp_up_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_14_self_attn_o_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_14_self_attn_q_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_15_mlp_down_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_15_mlp_up_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_15_self_attn_o_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_16_mlp_down_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_16_self_attn_o_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_18_mlp_up_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_18_self_attn_q_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_19_mlp_gate_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_1_mlp_gate_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_20_self_attn_v_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_21_mlp_down_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_23_mlp_gate_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_24_mlp_down_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_24_mlp_gate_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_24_self_attn_q_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_25_mlp_up_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_25_self_attn_q_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_25_self_attn_v_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_26_mlp_down_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_26_mlp_up_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_27_mlp_down_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_2_mlp_down_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_2_mlp_up_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_2_self_attn_q_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.signs +3 -0
- deepseek-r1-1.5b-packed/model_layers_3_self_attn_k_proj_weight.mags +3 -0
- deepseek-r1-1.5b-packed/model_layers_3_self_attn_o_proj_weight.signs +3 -0
.gitattributes
CHANGED
|
@@ -3459,3 +3459,72 @@ deepseek-r1-1.5b-packed/model_layers_9_self_attn_q_proj_weight.mags filter=lfs d
|
|
| 3459 |
deepseek-r1-1.5b-packed/model_layers_1_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3460 |
deepseek-r1-1.5b-packed/model_layers_8_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3461 |
deepseek-r1-1.5b-packed/model_layers_19_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3459 |
deepseek-r1-1.5b-packed/model_layers_1_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3460 |
deepseek-r1-1.5b-packed/model_layers_8_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3461 |
deepseek-r1-1.5b-packed/model_layers_19_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3462 |
+
deepseek-r1-1.5b-packed/model_layers_11_self_attn_o_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3463 |
+
deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3464 |
+
deepseek-r1-1.5b-packed/model_layers_21_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3465 |
+
deepseek-r1-1.5b-packed/model_layers_15_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3466 |
+
deepseek-r1-1.5b-packed/model_layers_4_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3467 |
+
deepseek-r1-1.5b-packed/model_layers_24_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3468 |
+
deepseek-r1-1.5b-packed/model_layers_13_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3469 |
+
deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3470 |
+
deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3471 |
+
deepseek-r1-1.5b-packed/model_layers_18_self_attn_q_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3472 |
+
deepseek-r1-1.5b-packed/model_layers_10_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3473 |
+
deepseek-r1-1.5b-packed/model_layers_0_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3474 |
+
deepseek-r1-1.5b-packed/model_layers_4_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3475 |
+
deepseek-r1-1.5b-packed/model_layers_4_self_attn_k_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3476 |
+
deepseek-r1-1.5b-packed/model_layers_7_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3477 |
+
deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3478 |
+
deepseek-r1-1.5b-packed/model_layers_20_self_attn_v_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3479 |
+
deepseek-r1-1.5b-packed/model_layers_26_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3480 |
+
deepseek-r1-1.5b-packed/model_layers_4_self_attn_v_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3481 |
+
deepseek-r1-1.5b-packed/model_layers_14_self_attn_q_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3482 |
+
deepseek-r1-1.5b-packed/model_layers_0_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3483 |
+
deepseek-r1-1.5b-packed/model_layers_24_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3484 |
+
deepseek-r1-1.5b-packed/model_layers_12_self_attn_q_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3485 |
+
deepseek-r1-1.5b-packed/model_layers_6_self_attn_k_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3486 |
+
deepseek-r1-1.5b-packed/model_layers_24_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3487 |
+
deepseek-r1-1.5b-packed/model_layers_19_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3488 |
+
deepseek-r1-1.5b-packed/model_layers_13_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3489 |
+
deepseek-r1-1.5b-packed/model_layers_3_self_attn_k_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3490 |
+
deepseek-r1-1.5b-packed/model_layers_14_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3491 |
+
deepseek-r1-1.5b-packed/model_layers_2_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3492 |
+
deepseek-r1-1.5b-packed/model_layers_10_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3493 |
+
deepseek-r1-1.5b-packed/model_layers_7_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3494 |
+
deepseek-r1-1.5b-packed/model_layers_27_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3495 |
+
deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3496 |
+
deepseek-r1-1.5b-packed/model_layers_8_self_attn_v_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3497 |
+
deepseek-r1-1.5b-packed/model_layers_8_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3498 |
+
deepseek-r1-1.5b-packed/model_layers_10_self_attn_o_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3499 |
+
deepseek-r1-1.5b-packed/model_layers_26_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3500 |
+
deepseek-r1-1.5b-packed/model_layers_1_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3501 |
+
deepseek-r1-1.5b-packed/model_layers_5_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3502 |
+
deepseek-r1-1.5b-packed/model_layers_25_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3503 |
+
deepseek-r1-1.5b-packed/model_layers_16_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3504 |
+
deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3505 |
+
deepseek-r1-1.5b-packed/model_layers_14_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3506 |
+
deepseek-r1-1.5b-packed/model_layers_15_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3507 |
+
deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3508 |
+
deepseek-r1-1.5b-packed/model_layers_8_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3509 |
+
deepseek-r1-1.5b-packed/model_layers_2_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3510 |
+
deepseek-r1-1.5b-packed/model_layers_23_mlp_gate_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3511 |
+
deepseek-r1-1.5b-packed/model_layers_3_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3512 |
+
deepseek-r1-1.5b-packed/model_layers_8_mlp_gate_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3513 |
+
deepseek-r1-1.5b-packed/model_layers_25_self_attn_q_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3514 |
+
deepseek-r1-1.5b-packed/model_layers_3_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3515 |
+
deepseek-r1-1.5b-packed/model_layers_2_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3516 |
+
deepseek-r1-1.5b-packed/model_layers_5_self_attn_v_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3517 |
+
deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3518 |
+
deepseek-r1-1.5b-packed/model_layers_14_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3519 |
+
deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3520 |
+
deepseek-r1-1.5b-packed/model_layers_15_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3521 |
+
deepseek-r1-1.5b-packed/model_layers_25_self_attn_v_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3522 |
+
deepseek-r1-1.5b-packed/model_layers_7_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3523 |
+
deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3524 |
+
deepseek-r1-1.5b-packed/model_layers_16_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
|
| 3525 |
+
deepseek-r1-1.5b-ternary/lm_head_weight.fp16 filter=lfs diff=lfs merge=lfs -text
|
| 3526 |
+
qwen3-4b-log-unary/model_layers_31_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 3527 |
+
qwen3-4b-log-unary/model_layers_11_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
|
| 3528 |
+
qwen3-4b-log-unary/model_layers_34_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
| 3529 |
+
deepseek-r1-1.5b-packed/model_layers_18_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
|
| 3530 |
+
qwen3-4b-log-unary/model_layers_5_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
|
deepseek-r1-1.5b-packed/model_layers_0_mlp_gate_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2cf601ab6062858b266017e3ccc33f77bb1a6560510ddb28d0bddd9822adbd0b
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_0_self_attn_o_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:afa7c60db5e54d8009750dd241125670907a01f6b0741fecf14e3983914efbbe
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-packed/model_layers_10_mlp_down_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5a5e09aa32752f84f4114b5b54e34265df514994b6c81f251137e17aacc70dbb
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_10_mlp_up_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:137cc07609c4da4aacd304b4fbb93a179102e1f1a78384d3e4f87c40eabb4810
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_10_self_attn_o_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa7257bc144ffb551a57b916fbc440d469b66da3d2d62118cb329f4b9ad9684e
|
| 3 |
+
size 2359296
|
deepseek-r1-1.5b-packed/model_layers_11_self_attn_o_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1b174d36ebc596462d284b4973fb866ce3a544714469cd4545b2c4cb7da12d3
|
| 3 |
+
size 2359296
|
deepseek-r1-1.5b-packed/model_layers_12_self_attn_q_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa8874205a1141bacaae9fdcf35ac12c56211a602ebefcde5e571e9429da90d4
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-packed/model_layers_13_mlp_down_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6075f12919d7c179856251bd7f4c167d128f7fe2438d968ab3be9eddbacc85a8
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_13_self_attn_q_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81f0c5fe941e1407a517b0d3ce5f3afad1ec859845e5f8c34fdcfffd5b310316
|
| 3 |
+
size 2359296
|
deepseek-r1-1.5b-packed/model_layers_14_mlp_gate_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c6a62b3e005442b9ac9a51a505347398cd9a43d80b5bedf204ae184f08a8c715
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_14_mlp_up_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:552bbc316a158a222d6c94d1b4d54de495b53cde5f3a4883ab9fba02cdbc62b8
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_14_self_attn_o_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0fde78bfd9522524f658236e046ecd0d2189aa0a092c9ddfb2577c3e982bc70
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-packed/model_layers_14_self_attn_q_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b1d71717a33bae43b6cc287107fa866ebf2d3a053742a709381035b2c234a66
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-packed/model_layers_15_mlp_down_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b684bcc0c65183e127d15e995f38140b7c7fa34626ffbdf52377bfd192205a9e
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_15_mlp_up_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5206a02260028ee28fbde6edf9df24199656473b0a98f2b038b7fc841608e572
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_15_self_attn_o_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a564f99a29539779b4e31ec8e2238c03ccace4c568b8495bd5028f5fc08e9416
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-packed/model_layers_16_mlp_down_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f627c09a596845e3d789efe2accb30b956cdad47f79f54fb9bc252285435cade
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_16_self_attn_o_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb4b96ddf727cc680c1f0360ff51b143b0e66d45792330cd4e0bb2edfb01ae96
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-packed/model_layers_18_mlp_up_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ef5a4b93278c3ed4f21af7c482d30379e5399e1a9e60f402ce2e10198375909
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_18_self_attn_q_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0cc73697f7d2c00e8a7ba5c1d7a5006479360a95f8a8860700b53aa831558a47
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-packed/model_layers_19_mlp_gate_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3841fa4a3deed727ad7bbd14feddf9b931fa10c645be97f7a41d84cbcbd5b85d
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:acdad830fec332f219ae63313954f982c97c74289dd00cd982dd76a421434b3a
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a04a4f84162379d5b772eb736221f21122838357c7f701c728b695f7f21f48f
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_1_mlp_gate_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18d4f22d7a9844c265b8737f51512a8b9c3e83f8b3df30a048d2d1312bd89579
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_20_self_attn_v_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ca36ec8e518c40248700b7a6d036c79cfe6818c9bee9e9fed9db468c6a3076f
|
| 3 |
+
size 393216
|
deepseek-r1-1.5b-packed/model_layers_21_mlp_down_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:67575cd43df52fa550be594f9da1901d582a2f2e48978a0044e5b366c6b1ae65
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_23_mlp_gate_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:acab9a847d202ed9f67041eb8476855da21ec3afa42076c05927753fb95080eb
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_24_mlp_down_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86cca1f83a0b656b5b9e895a32797309e95088fbac4b80be1b53df380e4c1b66
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_24_mlp_gate_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af1a304248edd39a9d41760fd0f5d5029c19e8b9c30b62f1b59b6c55fe0c3d5d
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_24_self_attn_q_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2c4f9f5baf1b98926d34cf108276fbaa3befccc402d33ed2ed86280c02a46f99
|
| 3 |
+
size 2359296
|
deepseek-r1-1.5b-packed/model_layers_25_mlp_up_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:85914f8567316fb3a505d76f4efbffddeda82b252fca0f004b115729fc5eece4
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_25_self_attn_q_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab7767bff8b90fbd314c81bdad8d407998989525b07c4ebab9ae1f804c7660ee
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-packed/model_layers_25_self_attn_v_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:01f6eb9e37e5d4eb688cd86bc5ca50b7458115f1c90782281a2af717a743ba43
|
| 3 |
+
size 393216
|
deepseek-r1-1.5b-packed/model_layers_26_mlp_down_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1514a78827202a31b5fabb4a56b194c40d60c75b42c2c473e509e90fd1ceec9
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_26_mlp_up_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92e1883be31668ba4dea2a96bb00286e7812c2309c109fefc110faf0d2ac552d
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_27_mlp_down_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:17b2a47c92099e72ef70301bb9d3098db3866a3c904a4172d87039e4d15aee85
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a20c45b40daed6a805b60745abd5a5e6d541b2b2bfc9ef541b476ca7743af229
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7742df58b2eb17912b598df0a2c405b98498924d8ff2523673d0c4d7137fa785
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7554f62302d4402c2a8617792efcdd9dcf3b22b78c3081170478e367959faab9
|
| 3 |
+
size 2359296
|
deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f989aaae9b5c070f1c5236956b2a7a0c0821b0355b6556e2cf0dcc9f879a6117
|
| 3 |
+
size 294912
|
deepseek-r1-1.5b-packed/model_layers_2_mlp_down_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2950b33b7d98c3eb340722c3a5e376efb73136698d9c0aabdb09d9e2728117c2
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d99cdb9b5656662e94b69d5497d1ddc62b52fe4d5f9788c11249934c8ebc720
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6acd236a009c2c646537035d07ed56d1f1a7e4bfd8e9b83a2e6c6ecf7c531bc8
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_2_mlp_up_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2208f57cf0144c098accb4a7145eda1e77cd1ffd2f9ca9f78b768badd53efcd
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_2_self_attn_q_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93da71f8a8f102d0d16d51aaad2da5559f0196f628efb9364557b2107970952c
|
| 3 |
+
size 2359296
|
deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1158378bb9adc7b73b040cd10215c0d6ba53d8916bbb732ca37b6bf8f4242eb2
|
| 3 |
+
size 13762560
|
deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd3b8fb93a12a2e9411ec693f5e761da80b09734ca758f2ddd06cb83365677bb
|
| 3 |
+
size 1720320
|
deepseek-r1-1.5b-packed/model_layers_3_self_attn_k_proj_weight.mags
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3be5411a8d1c31c6a292e80c20ecd2355a3c84d648686308d01022ad72523b6f
|
| 3 |
+
size 393216
|
deepseek-r1-1.5b-packed/model_layers_3_self_attn_o_proj_weight.signs
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f794bbcdffd07b8719ce97780dab4eabc04d310bbe111dfba7f8205fb80b684
|
| 3 |
+
size 294912
|