OpenTransformer commited on
Commit
8dff24e
·
verified ·
1 Parent(s): b63bc73

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +69 -0
  2. deepseek-r1-1.5b-packed/model_layers_0_mlp_gate_proj_weight.signs +3 -0
  3. deepseek-r1-1.5b-packed/model_layers_0_self_attn_o_proj_weight.signs +3 -0
  4. deepseek-r1-1.5b-packed/model_layers_10_mlp_down_proj_weight.mags +3 -0
  5. deepseek-r1-1.5b-packed/model_layers_10_mlp_up_proj_weight.signs +3 -0
  6. deepseek-r1-1.5b-packed/model_layers_10_self_attn_o_proj_weight.mags +3 -0
  7. deepseek-r1-1.5b-packed/model_layers_11_self_attn_o_proj_weight.mags +3 -0
  8. deepseek-r1-1.5b-packed/model_layers_12_self_attn_q_proj_weight.signs +3 -0
  9. deepseek-r1-1.5b-packed/model_layers_13_mlp_down_proj_weight.mags +3 -0
  10. deepseek-r1-1.5b-packed/model_layers_13_self_attn_q_proj_weight.mags +3 -0
  11. deepseek-r1-1.5b-packed/model_layers_14_mlp_gate_proj_weight.signs +3 -0
  12. deepseek-r1-1.5b-packed/model_layers_14_mlp_up_proj_weight.mags +3 -0
  13. deepseek-r1-1.5b-packed/model_layers_14_self_attn_o_proj_weight.signs +3 -0
  14. deepseek-r1-1.5b-packed/model_layers_14_self_attn_q_proj_weight.signs +3 -0
  15. deepseek-r1-1.5b-packed/model_layers_15_mlp_down_proj_weight.signs +3 -0
  16. deepseek-r1-1.5b-packed/model_layers_15_mlp_up_proj_weight.signs +3 -0
  17. deepseek-r1-1.5b-packed/model_layers_15_self_attn_o_proj_weight.signs +3 -0
  18. deepseek-r1-1.5b-packed/model_layers_16_mlp_down_proj_weight.signs +3 -0
  19. deepseek-r1-1.5b-packed/model_layers_16_self_attn_o_proj_weight.signs +3 -0
  20. deepseek-r1-1.5b-packed/model_layers_18_mlp_up_proj_weight.mags +3 -0
  21. deepseek-r1-1.5b-packed/model_layers_18_self_attn_q_proj_weight.signs +3 -0
  22. deepseek-r1-1.5b-packed/model_layers_19_mlp_gate_proj_weight.signs +3 -0
  23. deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.mags +3 -0
  24. deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.signs +3 -0
  25. deepseek-r1-1.5b-packed/model_layers_1_mlp_gate_proj_weight.signs +3 -0
  26. deepseek-r1-1.5b-packed/model_layers_20_self_attn_v_proj_weight.mags +3 -0
  27. deepseek-r1-1.5b-packed/model_layers_21_mlp_down_proj_weight.mags +3 -0
  28. deepseek-r1-1.5b-packed/model_layers_23_mlp_gate_proj_weight.mags +3 -0
  29. deepseek-r1-1.5b-packed/model_layers_24_mlp_down_proj_weight.signs +3 -0
  30. deepseek-r1-1.5b-packed/model_layers_24_mlp_gate_proj_weight.signs +3 -0
  31. deepseek-r1-1.5b-packed/model_layers_24_self_attn_q_proj_weight.mags +3 -0
  32. deepseek-r1-1.5b-packed/model_layers_25_mlp_up_proj_weight.signs +3 -0
  33. deepseek-r1-1.5b-packed/model_layers_25_self_attn_q_proj_weight.signs +3 -0
  34. deepseek-r1-1.5b-packed/model_layers_25_self_attn_v_proj_weight.mags +3 -0
  35. deepseek-r1-1.5b-packed/model_layers_26_mlp_down_proj_weight.mags +3 -0
  36. deepseek-r1-1.5b-packed/model_layers_26_mlp_up_proj_weight.signs +3 -0
  37. deepseek-r1-1.5b-packed/model_layers_27_mlp_down_proj_weight.mags +3 -0
  38. deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.mags +3 -0
  39. deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.signs +3 -0
  40. deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.mags +3 -0
  41. deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.signs +3 -0
  42. deepseek-r1-1.5b-packed/model_layers_2_mlp_down_proj_weight.mags +3 -0
  43. deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.mags +3 -0
  44. deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.signs +3 -0
  45. deepseek-r1-1.5b-packed/model_layers_2_mlp_up_proj_weight.mags +3 -0
  46. deepseek-r1-1.5b-packed/model_layers_2_self_attn_q_proj_weight.mags +3 -0
  47. deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.mags +3 -0
  48. deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.signs +3 -0
  49. deepseek-r1-1.5b-packed/model_layers_3_self_attn_k_proj_weight.mags +3 -0
  50. deepseek-r1-1.5b-packed/model_layers_3_self_attn_o_proj_weight.signs +3 -0
.gitattributes CHANGED
@@ -3459,3 +3459,72 @@ deepseek-r1-1.5b-packed/model_layers_9_self_attn_q_proj_weight.mags filter=lfs d
3459
  deepseek-r1-1.5b-packed/model_layers_1_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3460
  deepseek-r1-1.5b-packed/model_layers_8_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3461
  deepseek-r1-1.5b-packed/model_layers_19_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3459
  deepseek-r1-1.5b-packed/model_layers_1_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3460
  deepseek-r1-1.5b-packed/model_layers_8_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3461
  deepseek-r1-1.5b-packed/model_layers_19_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3462
+ deepseek-r1-1.5b-packed/model_layers_11_self_attn_o_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3463
+ deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3464
+ deepseek-r1-1.5b-packed/model_layers_21_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3465
+ deepseek-r1-1.5b-packed/model_layers_15_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3466
+ deepseek-r1-1.5b-packed/model_layers_4_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3467
+ deepseek-r1-1.5b-packed/model_layers_24_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3468
+ deepseek-r1-1.5b-packed/model_layers_13_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3469
+ deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3470
+ deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3471
+ deepseek-r1-1.5b-packed/model_layers_18_self_attn_q_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3472
+ deepseek-r1-1.5b-packed/model_layers_10_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3473
+ deepseek-r1-1.5b-packed/model_layers_0_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3474
+ deepseek-r1-1.5b-packed/model_layers_4_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3475
+ deepseek-r1-1.5b-packed/model_layers_4_self_attn_k_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3476
+ deepseek-r1-1.5b-packed/model_layers_7_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3477
+ deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3478
+ deepseek-r1-1.5b-packed/model_layers_20_self_attn_v_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3479
+ deepseek-r1-1.5b-packed/model_layers_26_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3480
+ deepseek-r1-1.5b-packed/model_layers_4_self_attn_v_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3481
+ deepseek-r1-1.5b-packed/model_layers_14_self_attn_q_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3482
+ deepseek-r1-1.5b-packed/model_layers_0_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3483
+ deepseek-r1-1.5b-packed/model_layers_24_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3484
+ deepseek-r1-1.5b-packed/model_layers_12_self_attn_q_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3485
+ deepseek-r1-1.5b-packed/model_layers_6_self_attn_k_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3486
+ deepseek-r1-1.5b-packed/model_layers_24_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3487
+ deepseek-r1-1.5b-packed/model_layers_19_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3488
+ deepseek-r1-1.5b-packed/model_layers_13_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3489
+ deepseek-r1-1.5b-packed/model_layers_3_self_attn_k_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3490
+ deepseek-r1-1.5b-packed/model_layers_14_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3491
+ deepseek-r1-1.5b-packed/model_layers_2_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3492
+ deepseek-r1-1.5b-packed/model_layers_10_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3493
+ deepseek-r1-1.5b-packed/model_layers_7_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3494
+ deepseek-r1-1.5b-packed/model_layers_27_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3495
+ deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3496
+ deepseek-r1-1.5b-packed/model_layers_8_self_attn_v_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3497
+ deepseek-r1-1.5b-packed/model_layers_8_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3498
+ deepseek-r1-1.5b-packed/model_layers_10_self_attn_o_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3499
+ deepseek-r1-1.5b-packed/model_layers_26_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3500
+ deepseek-r1-1.5b-packed/model_layers_1_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3501
+ deepseek-r1-1.5b-packed/model_layers_5_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3502
+ deepseek-r1-1.5b-packed/model_layers_25_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3503
+ deepseek-r1-1.5b-packed/model_layers_16_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3504
+ deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3505
+ deepseek-r1-1.5b-packed/model_layers_14_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3506
+ deepseek-r1-1.5b-packed/model_layers_15_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3507
+ deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3508
+ deepseek-r1-1.5b-packed/model_layers_8_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3509
+ deepseek-r1-1.5b-packed/model_layers_2_mlp_down_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3510
+ deepseek-r1-1.5b-packed/model_layers_23_mlp_gate_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3511
+ deepseek-r1-1.5b-packed/model_layers_3_self_attn_q_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3512
+ deepseek-r1-1.5b-packed/model_layers_8_mlp_gate_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3513
+ deepseek-r1-1.5b-packed/model_layers_25_self_attn_q_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3514
+ deepseek-r1-1.5b-packed/model_layers_3_self_attn_o_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3515
+ deepseek-r1-1.5b-packed/model_layers_2_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3516
+ deepseek-r1-1.5b-packed/model_layers_5_self_attn_v_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3517
+ deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3518
+ deepseek-r1-1.5b-packed/model_layers_14_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3519
+ deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3520
+ deepseek-r1-1.5b-packed/model_layers_15_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3521
+ deepseek-r1-1.5b-packed/model_layers_25_self_attn_v_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3522
+ deepseek-r1-1.5b-packed/model_layers_7_mlp_up_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3523
+ deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3524
+ deepseek-r1-1.5b-packed/model_layers_16_mlp_down_proj_weight.signs filter=lfs diff=lfs merge=lfs -text
3525
+ deepseek-r1-1.5b-ternary/lm_head_weight.fp16 filter=lfs diff=lfs merge=lfs -text
3526
+ qwen3-4b-log-unary/model_layers_31_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
3527
+ qwen3-4b-log-unary/model_layers_11_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
3528
+ qwen3-4b-log-unary/model_layers_34_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
3529
+ deepseek-r1-1.5b-packed/model_layers_18_mlp_up_proj_weight.mags filter=lfs diff=lfs merge=lfs -text
3530
+ qwen3-4b-log-unary/model_layers_5_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
deepseek-r1-1.5b-packed/model_layers_0_mlp_gate_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cf601ab6062858b266017e3ccc33f77bb1a6560510ddb28d0bddd9822adbd0b
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_0_self_attn_o_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afa7c60db5e54d8009750dd241125670907a01f6b0741fecf14e3983914efbbe
3
+ size 294912
deepseek-r1-1.5b-packed/model_layers_10_mlp_down_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a5e09aa32752f84f4114b5b54e34265df514994b6c81f251137e17aacc70dbb
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_10_mlp_up_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:137cc07609c4da4aacd304b4fbb93a179102e1f1a78384d3e4f87c40eabb4810
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_10_self_attn_o_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa7257bc144ffb551a57b916fbc440d469b66da3d2d62118cb329f4b9ad9684e
3
+ size 2359296
deepseek-r1-1.5b-packed/model_layers_11_self_attn_o_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1b174d36ebc596462d284b4973fb866ce3a544714469cd4545b2c4cb7da12d3
3
+ size 2359296
deepseek-r1-1.5b-packed/model_layers_12_self_attn_q_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa8874205a1141bacaae9fdcf35ac12c56211a602ebefcde5e571e9429da90d4
3
+ size 294912
deepseek-r1-1.5b-packed/model_layers_13_mlp_down_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6075f12919d7c179856251bd7f4c167d128f7fe2438d968ab3be9eddbacc85a8
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_13_self_attn_q_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81f0c5fe941e1407a517b0d3ce5f3afad1ec859845e5f8c34fdcfffd5b310316
3
+ size 2359296
deepseek-r1-1.5b-packed/model_layers_14_mlp_gate_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6a62b3e005442b9ac9a51a505347398cd9a43d80b5bedf204ae184f08a8c715
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_14_mlp_up_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:552bbc316a158a222d6c94d1b4d54de495b53cde5f3a4883ab9fba02cdbc62b8
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_14_self_attn_o_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0fde78bfd9522524f658236e046ecd0d2189aa0a092c9ddfb2577c3e982bc70
3
+ size 294912
deepseek-r1-1.5b-packed/model_layers_14_self_attn_q_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b1d71717a33bae43b6cc287107fa866ebf2d3a053742a709381035b2c234a66
3
+ size 294912
deepseek-r1-1.5b-packed/model_layers_15_mlp_down_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b684bcc0c65183e127d15e995f38140b7c7fa34626ffbdf52377bfd192205a9e
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_15_mlp_up_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5206a02260028ee28fbde6edf9df24199656473b0a98f2b038b7fc841608e572
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_15_self_attn_o_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a564f99a29539779b4e31ec8e2238c03ccace4c568b8495bd5028f5fc08e9416
3
+ size 294912
deepseek-r1-1.5b-packed/model_layers_16_mlp_down_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f627c09a596845e3d789efe2accb30b956cdad47f79f54fb9bc252285435cade
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_16_self_attn_o_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb4b96ddf727cc680c1f0360ff51b143b0e66d45792330cd4e0bb2edfb01ae96
3
+ size 294912
deepseek-r1-1.5b-packed/model_layers_18_mlp_up_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ef5a4b93278c3ed4f21af7c482d30379e5399e1a9e60f402ce2e10198375909
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_18_self_attn_q_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cc73697f7d2c00e8a7ba5c1d7a5006479360a95f8a8860700b53aa831558a47
3
+ size 294912
deepseek-r1-1.5b-packed/model_layers_19_mlp_gate_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3841fa4a3deed727ad7bbd14feddf9b931fa10c645be97f7a41d84cbcbd5b85d
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acdad830fec332f219ae63313954f982c97c74289dd00cd982dd76a421434b3a
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_19_mlp_up_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a04a4f84162379d5b772eb736221f21122838357c7f701c728b695f7f21f48f
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_1_mlp_gate_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18d4f22d7a9844c265b8737f51512a8b9c3e83f8b3df30a048d2d1312bd89579
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_20_self_attn_v_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ca36ec8e518c40248700b7a6d036c79cfe6818c9bee9e9fed9db468c6a3076f
3
+ size 393216
deepseek-r1-1.5b-packed/model_layers_21_mlp_down_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67575cd43df52fa550be594f9da1901d582a2f2e48978a0044e5b366c6b1ae65
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_23_mlp_gate_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acab9a847d202ed9f67041eb8476855da21ec3afa42076c05927753fb95080eb
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_24_mlp_down_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86cca1f83a0b656b5b9e895a32797309e95088fbac4b80be1b53df380e4c1b66
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_24_mlp_gate_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af1a304248edd39a9d41760fd0f5d5029c19e8b9c30b62f1b59b6c55fe0c3d5d
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_24_self_attn_q_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c4f9f5baf1b98926d34cf108276fbaa3befccc402d33ed2ed86280c02a46f99
3
+ size 2359296
deepseek-r1-1.5b-packed/model_layers_25_mlp_up_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85914f8567316fb3a505d76f4efbffddeda82b252fca0f004b115729fc5eece4
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_25_self_attn_q_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab7767bff8b90fbd314c81bdad8d407998989525b07c4ebab9ae1f804c7660ee
3
+ size 294912
deepseek-r1-1.5b-packed/model_layers_25_self_attn_v_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01f6eb9e37e5d4eb688cd86bc5ca50b7458115f1c90782281a2af717a743ba43
3
+ size 393216
deepseek-r1-1.5b-packed/model_layers_26_mlp_down_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1514a78827202a31b5fabb4a56b194c40d60c75b42c2c473e509e90fd1ceec9
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_26_mlp_up_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92e1883be31668ba4dea2a96bb00286e7812c2309c109fefc110faf0d2ac552d
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_27_mlp_down_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17b2a47c92099e72ef70301bb9d3098db3866a3c904a4172d87039e4d15aee85
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a20c45b40daed6a805b60745abd5a5e6d541b2b2bfc9ef541b476ca7743af229
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_27_mlp_gate_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7742df58b2eb17912b598df0a2c405b98498924d8ff2523673d0c4d7137fa785
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7554f62302d4402c2a8617792efcdd9dcf3b22b78c3081170478e367959faab9
3
+ size 2359296
deepseek-r1-1.5b-packed/model_layers_27_self_attn_o_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f989aaae9b5c070f1c5236956b2a7a0c0821b0355b6556e2cf0dcc9f879a6117
3
+ size 294912
deepseek-r1-1.5b-packed/model_layers_2_mlp_down_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2950b33b7d98c3eb340722c3a5e376efb73136698d9c0aabdb09d9e2728117c2
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d99cdb9b5656662e94b69d5497d1ddc62b52fe4d5f9788c11249934c8ebc720
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_2_mlp_gate_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6acd236a009c2c646537035d07ed56d1f1a7e4bfd8e9b83a2e6c6ecf7c531bc8
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_2_mlp_up_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2208f57cf0144c098accb4a7145eda1e77cd1ffd2f9ca9f78b768badd53efcd
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_2_self_attn_q_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93da71f8a8f102d0d16d51aaad2da5559f0196f628efb9364557b2107970952c
3
+ size 2359296
deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1158378bb9adc7b73b040cd10215c0d6ba53d8916bbb732ca37b6bf8f4242eb2
3
+ size 13762560
deepseek-r1-1.5b-packed/model_layers_3_mlp_up_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd3b8fb93a12a2e9411ec693f5e761da80b09734ca758f2ddd06cb83365677bb
3
+ size 1720320
deepseek-r1-1.5b-packed/model_layers_3_self_attn_k_proj_weight.mags ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3be5411a8d1c31c6a292e80c20ecd2355a3c84d648686308d01022ad72523b6f
3
+ size 393216
deepseek-r1-1.5b-packed/model_layers_3_self_attn_o_proj_weight.signs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f794bbcdffd07b8719ce97780dab4eabc04d310bbe111dfba7f8205fb80b684
3
+ size 294912