OpenTransformer committed on
Commit
54c5b36
·
verified ·
1 Parent(s): ae4a44c

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +42 -0
  2. deepseek-r1-1.5b-unary4/model_layers_0_mlp_gate_proj_weight.scales +0 -0
  3. deepseek-r1-1.5b-unary4/model_layers_0_mlp_gate_proj_weight.sign +3 -0
  4. deepseek-r1-1.5b-unary4/model_layers_0_self_attn_v_proj_weight.scales +0 -0
  5. deepseek-r1-1.5b-unary4/model_layers_10_mlp_down_proj_weight.planes +3 -0
  6. deepseek-r1-1.5b-unary4/model_layers_10_post_attention_layernorm_weight.fp16 +0 -0
  7. deepseek-r1-1.5b-unary4/model_layers_10_self_attn_k_proj_weight.sign +0 -0
  8. deepseek-r1-1.5b-unary4/model_layers_10_self_attn_v_proj_weight.sign +0 -0
  9. deepseek-r1-1.5b-unary4/model_layers_11_mlp_down_proj_weight.sign +3 -0
  10. deepseek-r1-1.5b-unary4/model_layers_11_mlp_up_proj_weight.scales +0 -0
  11. deepseek-r1-1.5b-unary4/model_layers_11_self_attn_k_proj_weight.scales +0 -0
  12. deepseek-r1-1.5b-unary4/model_layers_11_self_attn_q_proj_weight.planes +3 -0
  13. deepseek-r1-1.5b-unary4/model_layers_11_self_attn_q_proj_weight.scales +0 -0
  14. deepseek-r1-1.5b-unary4/model_layers_11_self_attn_v_proj_weight.planes +3 -0
  15. deepseek-r1-1.5b-unary4/model_layers_12_self_attn_k_proj_bias.fp16 +0 -0
  16. deepseek-r1-1.5b-unary4/model_layers_12_self_attn_o_proj_weight.sign +3 -0
  17. deepseek-r1-1.5b-unary4/model_layers_12_self_attn_v_proj_weight.scales +0 -0
  18. deepseek-r1-1.5b-unary4/model_layers_13_mlp_gate_proj_weight.scales +0 -0
  19. deepseek-r1-1.5b-unary4/model_layers_14_mlp_up_proj_weight.sign +3 -0
  20. deepseek-r1-1.5b-unary4/model_layers_15_self_attn_k_proj_bias.fp16 +0 -0
  21. deepseek-r1-1.5b-unary4/model_layers_15_self_attn_k_proj_weight.scales +0 -0
  22. deepseek-r1-1.5b-unary4/model_layers_16_input_layernorm_weight.fp16 +0 -0
  23. deepseek-r1-1.5b-unary4/model_layers_16_mlp_up_proj_weight.scales +0 -0
  24. deepseek-r1-1.5b-unary4/model_layers_16_post_attention_layernorm_weight.fp16 +0 -0
  25. deepseek-r1-1.5b-unary4/model_layers_16_self_attn_k_proj_bias.fp16 +0 -0
  26. deepseek-r1-1.5b-unary4/model_layers_16_self_attn_v_proj_weight.scales +0 -0
  27. deepseek-r1-1.5b-unary4/model_layers_16_self_attn_v_proj_weight.sign +0 -0
  28. deepseek-r1-1.5b-unary4/model_layers_17_mlp_up_proj_weight.planes +3 -0
  29. deepseek-r1-1.5b-unary4/model_layers_17_self_attn_o_proj_weight.planes +3 -0
  30. deepseek-r1-1.5b-unary4/model_layers_17_self_attn_o_proj_weight.scales +0 -0
  31. deepseek-r1-1.5b-unary4/model_layers_18_self_attn_k_proj_weight.planes +3 -0
  32. deepseek-r1-1.5b-unary4/model_layers_18_self_attn_o_proj_weight.sign +3 -0
  33. deepseek-r1-1.5b-unary4/model_layers_18_self_attn_q_proj_bias.fp16 +0 -0
  34. deepseek-r1-1.5b-unary4/model_layers_18_self_attn_q_proj_weight.sign +3 -0
  35. deepseek-r1-1.5b-unary4/model_layers_19_input_layernorm_weight.fp16 +0 -0
  36. deepseek-r1-1.5b-unary4/model_layers_19_self_attn_o_proj_weight.scales +0 -0
  37. deepseek-r1-1.5b-unary4/model_layers_19_self_attn_v_proj_weight.planes +3 -0
  38. deepseek-r1-1.5b-unary4/model_layers_1_self_attn_o_proj_weight.planes +3 -0
  39. deepseek-r1-1.5b-unary4/model_layers_1_self_attn_o_proj_weight.scales +0 -0
  40. deepseek-r1-1.5b-unary4/model_layers_1_self_attn_v_proj_weight.scales +0 -0
  41. deepseek-r1-1.5b-unary4/model_layers_20_self_attn_q_proj_bias.fp16 +0 -0
  42. deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.planes +3 -0
  43. deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.sign +3 -0
  44. deepseek-r1-1.5b-unary4/model_layers_21_self_attn_k_proj_weight.sign +0 -0
  45. deepseek-r1-1.5b-unary4/model_layers_21_self_attn_v_proj_weight.scales +0 -0
  46. deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.planes +3 -0
  47. deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.sign +3 -0
  48. deepseek-r1-1.5b-unary4/model_layers_22_mlp_up_proj_weight.scales +0 -0
  49. deepseek-r1-1.5b-unary4/model_layers_22_self_attn_o_proj_weight.scales +0 -0
  50. deepseek-r1-1.5b-unary4/model_layers_22_self_attn_v_proj_weight.scales +0 -0
.gitattributes CHANGED
@@ -2890,3 +2890,45 @@ qwen3-4b-log-unary/model_layers_27_self_attn_k_proj_weight.sign filter=lfs diff=
2890
  qwen3-4b-log-unary/model_layers_2_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2891
  qwen3-4b-log-unary/model_layers_10_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2892
  qwen3-4b-log-unary/model_layers_31_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2890
  qwen3-4b-log-unary/model_layers_2_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2891
  qwen3-4b-log-unary/model_layers_10_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2892
  qwen3-4b-log-unary/model_layers_31_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2893
+ deepseek-r1-1.5b-unary4/model_layers_11_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2894
+ deepseek-r1-1.5b-unary4/model_layers_4_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2895
+ deepseek-r1-1.5b-unary4/model_layers_18_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2896
+ deepseek-r1-1.5b-unary4/model_layers_10_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2897
+ deepseek-r1-1.5b-unary4/model_layers_26_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2898
+ deepseek-r1-1.5b-unary4/model_layers_6_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2899
+ deepseek-r1-1.5b-unary4/model_layers_18_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2900
+ deepseek-r1-1.5b-unary4/model_layers_27_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2901
+ deepseek-r1-1.5b-unary4/model_layers_27_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2902
+ deepseek-r1-1.5b-unary4/model_layers_27_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2903
+ deepseek-r1-1.5b-unary4/model_layers_18_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2904
+ deepseek-r1-1.5b-unary4/model_layers_19_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2905
+ deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2906
+ deepseek-r1-1.5b-unary4/model_layers_17_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2907
+ deepseek-r1-1.5b-unary4/model_layers_11_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2908
+ deepseek-r1-1.5b-unary4/model_layers_7_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2909
+ deepseek-r1-1.5b-unary4/model_layers_3_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2910
+ deepseek-r1-1.5b-unary4/model_layers_17_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2911
+ deepseek-r1-1.5b-unary4/model_layers_8_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2912
+ deepseek-r1-1.5b-unary4/model_layers_25_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2913
+ deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2914
+ deepseek-r1-1.5b-unary4/model_layers_27_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2915
+ deepseek-r1-1.5b-unary4/model_layers_0_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2916
+ deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2917
+ deepseek-r1-1.5b-unary4/model_layers_25_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2918
+ deepseek-r1-1.5b-unary4/model_layers_5_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2919
+ deepseek-r1-1.5b-unary4/model_layers_2_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2920
+ deepseek-r1-1.5b-unary4/model_layers_27_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2921
+ deepseek-r1-1.5b-unary4/model_layers_3_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2922
+ deepseek-r1-1.5b-unary4/model_layers_11_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2923
+ deepseek-r1-1.5b-unary4/model_layers_24_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2924
+ deepseek-r1-1.5b-unary4/model_layers_23_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2925
+ deepseek-r1-1.5b-unary4/model_layers_5_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2926
+ deepseek-r1-1.5b-unary4/model_layers_14_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2927
+ deepseek-r1-1.5b-unary4/model_layers_12_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2928
+ deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2929
+ deepseek-r1-1.5b-unary4/model_layers_2_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2930
+ deepseek-r1-1.5b-unary4/model_layers_1_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2931
+ deepseek-r1-1.5b-unary4/model_layers_23_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2932
+ deepseek-r1-1.5b-unary4/model_layers_25_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2933
+ deepseek-r1-1.5b-unary4/model_layers_2_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2934
+ deepseek-r1-1.5b-unary4/model_layers_5_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
deepseek-r1-1.5b-unary4/model_layers_0_mlp_gate_proj_weight.scales ADDED
Binary file (35.8 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_0_mlp_gate_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cf601ab6062858b266017e3ccc33f77bb1a6560510ddb28d0bddd9822adbd0b
3
+ size 1720320
deepseek-r1-1.5b-unary4/model_layers_0_self_attn_v_proj_weight.scales ADDED
Binary file (1.02 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_10_mlp_down_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f005c0c74e5f79d926d9db3cb02f312d03559c820b03e4d45eb1fc381f2d303f
3
+ size 6881280
deepseek-r1-1.5b-unary4/model_layers_10_post_attention_layernorm_weight.fp16 ADDED
Binary file (3.07 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_10_self_attn_k_proj_weight.sign ADDED
Binary file (49.2 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_10_self_attn_v_proj_weight.sign ADDED
Binary file (49.2 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_11_mlp_down_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b07cb8f37f8c3fb5f800b008ee48cc27f089db360aa642d7498bc09b8314e21c
3
+ size 1720320
deepseek-r1-1.5b-unary4/model_layers_11_mlp_up_proj_weight.scales ADDED
Binary file (35.8 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_11_self_attn_k_proj_weight.scales ADDED
Binary file (1.02 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_11_self_attn_q_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:391743aaf15f6307bc9b667a575007cea922b964c44b55499f683657c675cf1b
3
+ size 1179648
deepseek-r1-1.5b-unary4/model_layers_11_self_attn_q_proj_weight.scales ADDED
Binary file (6.14 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_11_self_attn_v_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e61fcc0005e9bc64d8257306654eacd8cf2a8b302e1b4c68c707f52b894c770f
3
+ size 196608
deepseek-r1-1.5b-unary4/model_layers_12_self_attn_k_proj_bias.fp16 ADDED
Binary file (512 Bytes). View file
 
deepseek-r1-1.5b-unary4/model_layers_12_self_attn_o_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b99c13197a9fd4d1233f95ba7aeaff88e06a93d91c95bb771fda4f56567a3cf2
3
+ size 294912
deepseek-r1-1.5b-unary4/model_layers_12_self_attn_v_proj_weight.scales ADDED
Binary file (1.02 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_13_mlp_gate_proj_weight.scales ADDED
Binary file (35.8 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_14_mlp_up_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71036189bc6c7101b6bebd0447e5613b8373df5f4687f35de2606e06905c73e1
3
+ size 1720320
deepseek-r1-1.5b-unary4/model_layers_15_self_attn_k_proj_bias.fp16 ADDED
Binary file (512 Bytes). View file
 
deepseek-r1-1.5b-unary4/model_layers_15_self_attn_k_proj_weight.scales ADDED
Binary file (1.02 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_16_input_layernorm_weight.fp16 ADDED
Binary file (3.07 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_16_mlp_up_proj_weight.scales ADDED
Binary file (35.8 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_16_post_attention_layernorm_weight.fp16 ADDED
Binary file (3.07 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_16_self_attn_k_proj_bias.fp16 ADDED
Binary file (512 Bytes). View file
 
deepseek-r1-1.5b-unary4/model_layers_16_self_attn_v_proj_weight.scales ADDED
Binary file (1.02 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_16_self_attn_v_proj_weight.sign ADDED
Binary file (49.2 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_17_mlp_up_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a2696679b07fd134e164866f5fc097081e6905a936b75b9be2c75e60a811954
3
+ size 6881280
deepseek-r1-1.5b-unary4/model_layers_17_self_attn_o_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2e8be702da7bd0675f0f830d4b54f5bbb43f884a6f95dc438791e6c91be091e
3
+ size 1179648
deepseek-r1-1.5b-unary4/model_layers_17_self_attn_o_proj_weight.scales ADDED
Binary file (6.14 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_18_self_attn_k_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa6452b5d4d246665da65f5db002758e0d27b5767dc46064f81d4b3fce597813
3
+ size 196608
deepseek-r1-1.5b-unary4/model_layers_18_self_attn_o_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7809020bf04c489051e22e07494b20557ab1d7b99b6ac74741b55206a6092b4
3
+ size 294912
deepseek-r1-1.5b-unary4/model_layers_18_self_attn_q_proj_bias.fp16 ADDED
Binary file (3.07 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_18_self_attn_q_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cc73697f7d2c00e8a7ba5c1d7a5006479360a95f8a8860700b53aa831558a47
3
+ size 294912
deepseek-r1-1.5b-unary4/model_layers_19_input_layernorm_weight.fp16 ADDED
Binary file (3.07 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_19_self_attn_o_proj_weight.scales ADDED
Binary file (6.14 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_19_self_attn_v_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6ad6327989a0def858d1449b0926b9ccdc0c3144690ab365e747325ea374779
3
+ size 196608
deepseek-r1-1.5b-unary4/model_layers_1_self_attn_o_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42d7c59df70a966def7b8582254155515b7e5c85f6b4a9036fcca78e3e5dca48
3
+ size 1179648
deepseek-r1-1.5b-unary4/model_layers_1_self_attn_o_proj_weight.scales ADDED
Binary file (6.14 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_1_self_attn_v_proj_weight.scales ADDED
Binary file (1.02 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_20_self_attn_q_proj_bias.fp16 ADDED
Binary file (3.07 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a0bba536126dbf01e52d8c8d2f5e1344e021358015f8d38aa27ce08a632112b
3
+ size 6881280
deepseek-r1-1.5b-unary4/model_layers_21_mlp_up_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:154c898127685a5d1f62f4d132b2ddb359cf897cf0567784b03eff0baa5c31fb
3
+ size 1720320
deepseek-r1-1.5b-unary4/model_layers_21_self_attn_k_proj_weight.sign ADDED
Binary file (49.2 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_21_self_attn_v_proj_weight.scales ADDED
Binary file (1.02 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1513867e9552859d2ec309485f86a9bc766b34df35f2704a5c0a5182f459b138
3
+ size 6881280
deepseek-r1-1.5b-unary4/model_layers_22_mlp_gate_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cead535970fe45255a6aace0b589ee94e9ccc3daf2499e7af6e07d56599e3c3
3
+ size 1720320
deepseek-r1-1.5b-unary4/model_layers_22_mlp_up_proj_weight.scales ADDED
Binary file (35.8 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_22_self_attn_o_proj_weight.scales ADDED
Binary file (6.14 kB). View file
 
deepseek-r1-1.5b-unary4/model_layers_22_self_attn_v_proj_weight.scales ADDED
Binary file (1.02 kB). View file