OpenTransformer committed on
Commit
890ede8
·
verified ·
1 Parent(s): 1889569

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff.
Files changed (50) hide show
  1. .gitattributes +125 -0
  2. qwen3-4b-log-unary/model_layers_0_self_attn_k_proj_weight.planes +3 -0
  3. qwen3-4b-log-unary/model_layers_0_self_attn_q_proj_weight.planes +3 -0
  4. qwen3-4b-log-unary/model_layers_0_self_attn_v_proj_weight.planes +3 -0
  5. qwen3-4b-log-unary/model_layers_10_mlp_gate_proj_weight.planes +3 -0
  6. qwen3-4b-log-unary/model_layers_10_self_attn_o_proj_weight.planes +3 -0
  7. qwen3-4b-log-unary/model_layers_10_self_attn_v_proj_weight.planes +3 -0
  8. qwen3-4b-log-unary/model_layers_11_mlp_up_proj_weight.sign +3 -0
  9. qwen3-4b-log-unary/model_layers_11_self_attn_v_proj_weight.sign +3 -0
  10. qwen3-4b-log-unary/model_layers_12_mlp_up_proj_weight.planes +3 -0
  11. qwen3-4b-log-unary/model_layers_13_mlp_gate_proj_weight.sign +3 -0
  12. qwen3-4b-log-unary/model_layers_13_mlp_up_proj_weight.planes +3 -0
  13. qwen3-4b-log-unary/model_layers_13_mlp_up_proj_weight.sign +3 -0
  14. qwen3-4b-log-unary/model_layers_13_self_attn_k_proj_weight.planes +3 -0
  15. qwen3-4b-log-unary/model_layers_13_self_attn_q_proj_weight.planes +3 -0
  16. qwen3-4b-log-unary/model_layers_14_mlp_down_proj_weight.sign +3 -0
  17. qwen3-4b-log-unary/model_layers_14_self_attn_k_proj_weight.sign +3 -0
  18. qwen3-4b-log-unary/model_layers_14_self_attn_o_proj_weight.planes +3 -0
  19. qwen3-4b-log-unary/model_layers_15_mlp_down_proj_weight.sign +3 -0
  20. qwen3-4b-log-unary/model_layers_15_mlp_gate_proj_weight.planes +3 -0
  21. qwen3-4b-log-unary/model_layers_15_mlp_up_proj_weight.planes +3 -0
  22. qwen3-4b-log-unary/model_layers_15_self_attn_o_proj_weight.planes +3 -0
  23. qwen3-4b-log-unary/model_layers_15_self_attn_o_proj_weight.sign +3 -0
  24. qwen3-4b-log-unary/model_layers_15_self_attn_q_proj_weight.planes +3 -0
  25. qwen3-4b-log-unary/model_layers_15_self_attn_v_proj_weight.planes +3 -0
  26. qwen3-4b-log-unary/model_layers_15_self_attn_v_proj_weight.sign +3 -0
  27. qwen3-4b-log-unary/model_layers_16_mlp_down_proj_weight.sign +3 -0
  28. qwen3-4b-log-unary/model_layers_16_mlp_up_proj_weight.planes +3 -0
  29. qwen3-4b-log-unary/model_layers_16_self_attn_q_proj_weight.planes +3 -0
  30. qwen3-4b-log-unary/model_layers_16_self_attn_v_proj_weight.planes +3 -0
  31. qwen3-4b-log-unary/model_layers_16_self_attn_v_proj_weight.sign +3 -0
  32. qwen3-4b-log-unary/model_layers_17_mlp_gate_proj_weight.planes +3 -0
  33. qwen3-4b-log-unary/model_layers_17_mlp_gate_proj_weight.sign +3 -0
  34. qwen3-4b-log-unary/model_layers_17_self_attn_k_proj_weight.planes +3 -0
  35. qwen3-4b-log-unary/model_layers_17_self_attn_k_proj_weight.sign +3 -0
  36. qwen3-4b-log-unary/model_layers_17_self_attn_q_proj_weight.sign +3 -0
  37. qwen3-4b-log-unary/model_layers_18_self_attn_o_proj_weight.planes +3 -0
  38. qwen3-4b-log-unary/model_layers_18_self_attn_q_proj_weight.planes +3 -0
  39. qwen3-4b-log-unary/model_layers_19_mlp_down_proj_weight.planes +3 -0
  40. qwen3-4b-log-unary/model_layers_19_mlp_down_proj_weight.sign +3 -0
  41. qwen3-4b-log-unary/model_layers_19_mlp_up_proj_weight.planes +3 -0
  42. qwen3-4b-log-unary/model_layers_19_mlp_up_proj_weight.sign +3 -0
  43. qwen3-4b-log-unary/model_layers_1_mlp_down_proj_weight.sign +3 -0
  44. qwen3-4b-log-unary/model_layers_1_self_attn_k_proj_weight.planes +3 -0
  45. qwen3-4b-log-unary/model_layers_1_self_attn_k_proj_weight.sign +3 -0
  46. qwen3-4b-log-unary/model_layers_20_mlp_down_proj_weight.planes +3 -0
  47. qwen3-4b-log-unary/model_layers_20_mlp_up_proj_weight.sign +3 -0
  48. qwen3-4b-log-unary/model_layers_20_self_attn_o_proj_weight.sign +3 -0
  49. qwen3-4b-log-unary/model_layers_20_self_attn_q_proj_weight.sign +3 -0
  50. qwen3-4b-log-unary/model_layers_20_self_attn_v_proj_weight.planes +3 -0
.gitattributes CHANGED
@@ -2765,3 +2765,128 @@ deepseek-r1-1.5b-ternary/model_layers_2_self_attn_o_proj_weight.pos filter=lfs d
2765
  deepseek-r1-1.5b-ternary/model_layers_19_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
2766
  deepseek-r1-1.5b-ternary/model_layers_9_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
2767
  deepseek-r1-1.5b-ternary/model_layers_16_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2765
  deepseek-r1-1.5b-ternary/model_layers_19_mlp_up_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
2766
  deepseek-r1-1.5b-ternary/model_layers_9_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
2767
  deepseek-r1-1.5b-ternary/model_layers_16_self_attn_o_proj_weight.neg filter=lfs diff=lfs merge=lfs -text
2768
+ qwen3-4b-log-unary/model_layers_5_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2769
+ qwen3-4b-log-unary/model_layers_18_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2770
+ qwen3-4b-log-unary/model_layers_30_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2771
+ qwen3-4b-log-unary/model_layers_7_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2772
+ qwen3-4b-log-unary/model_layers_11_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2773
+ qwen3-4b-log-unary/model_layers_4_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2774
+ qwen3-4b-log-unary/model_layers_2_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2775
+ qwen3-4b-log-unary/model_layers_21_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2776
+ qwen3-4b-log-unary/model_layers_14_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2777
+ qwen3-4b-log-unary/model_layers_26_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2778
+ qwen3-4b-log-unary/model_layers_19_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2779
+ qwen3-4b-log-unary/model_layers_20_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2780
+ qwen3-4b-log-unary/model_layers_26_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2781
+ qwen3-4b-log-unary/model_layers_27_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2782
+ qwen3-4b-log-unary/model_layers_14_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2783
+ qwen3-4b-log-unary/model_layers_29_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2784
+ qwen3-4b-log-unary/model_layers_17_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2785
+ qwen3-4b-log-unary/model_layers_15_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2786
+ qwen3-4b-log-unary/model_layers_10_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2787
+ qwen3-4b-log-unary/model_layers_35_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2788
+ qwen3-4b-log-unary/model_layers_19_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2789
+ qwen3-4b-log-unary/model_layers_6_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2790
+ qwen3-4b-log-unary/model_layers_5_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2791
+ qwen3-4b-log-unary/model_layers_4_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2792
+ qwen3-4b-log-unary/model_layers_28_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2793
+ qwen3-4b-log-unary/model_layers_35_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2794
+ qwen3-4b-log-unary/model_layers_31_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2795
+ qwen3-4b-log-unary/model_layers_2_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2796
+ qwen3-4b-log-unary/model_layers_0_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2797
+ qwen3-4b-log-unary/model_layers_16_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2798
+ qwen3-4b-log-unary/model_layers_9_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2799
+ qwen3-4b-log-unary/model_layers_22_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2800
+ qwen3-4b-log-unary/model_layers_27_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2801
+ qwen3-4b-log-unary/model_layers_16_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2802
+ qwen3-4b-log-unary/model_layers_15_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2803
+ qwen3-4b-log-unary/model_layers_31_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2804
+ qwen3-4b-log-unary/model_layers_16_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2805
+ qwen3-4b-log-unary/model_layers_33_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2806
+ qwen3-4b-log-unary/model_layers_33_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2807
+ qwen3-4b-log-unary/model_layers_17_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2808
+ qwen3-4b-log-unary/model_layers_13_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2809
+ qwen3-4b-log-unary/model_layers_6_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2810
+ qwen3-4b-log-unary/model_layers_17_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2811
+ qwen3-4b-log-unary/model_layers_4_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2812
+ qwen3-4b-log-unary/model_layers_9_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2813
+ qwen3-4b-log-unary/model_layers_24_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2814
+ qwen3-4b-log-unary/model_layers_17_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2815
+ qwen3-4b-log-unary/model_layers_9_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2816
+ qwen3-4b-log-unary/model_layers_6_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2817
+ qwen3-4b-log-unary/model_layers_27_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2818
+ qwen3-4b-log-unary/model_layers_30_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2819
+ qwen3-4b-log-unary/model_layers_13_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2820
+ qwen3-4b-log-unary/model_layers_8_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2821
+ qwen3-4b-log-unary/model_layers_28_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2822
+ qwen3-4b-log-unary/model_layers_4_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2823
+ qwen3-4b-log-unary/model_layers_4_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2824
+ qwen3-4b-log-unary/model_layers_19_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2825
+ qwen3-4b-log-unary/model_layers_10_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2826
+ qwen3-4b-log-unary/model_layers_11_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2827
+ qwen3-4b-log-unary/model_layers_18_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2828
+ qwen3-4b-log-unary/model_layers_15_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2829
+ qwen3-4b-log-unary/model_layers_21_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2830
+ qwen3-4b-log-unary/model_layers_5_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2831
+ qwen3-4b-log-unary/model_layers_9_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2832
+ qwen3-4b-log-unary/model_layers_3_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2833
+ qwen3-4b-log-unary/model_layers_0_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2834
+ qwen3-4b-log-unary/model_layers_1_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2835
+ qwen3-4b-log-unary/model_layers_12_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2836
+ qwen3-4b-log-unary/model_layers_25_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2837
+ qwen3-4b-log-unary/model_layers_8_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2838
+ qwen3-4b-log-unary/model_layers_3_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2839
+ qwen3-4b-log-unary/model_layers_1_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2840
+ qwen3-4b-log-unary/model_layers_13_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2841
+ qwen3-4b-log-unary/model_layers_5_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2842
+ qwen3-4b-log-unary/model_layers_20_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2843
+ qwen3-4b-log-unary/model_layers_15_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2844
+ qwen3-4b-log-unary/model_layers_17_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2845
+ qwen3-4b-log-unary/model_layers_4_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2846
+ qwen3-4b-log-unary/model_layers_20_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2847
+ qwen3-4b-log-unary/model_layers_24_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2848
+ qwen3-4b-log-unary/model_layers_34_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2849
+ qwen3-4b-log-unary/model_layers_20_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2850
+ qwen3-4b-log-unary/model_layers_24_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2851
+ qwen3-4b-log-unary/model_layers_21_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2852
+ qwen3-4b-log-unary/model_layers_13_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2853
+ qwen3-4b-log-unary/model_layers_25_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2854
+ qwen3-4b-log-unary/model_layers_30_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2855
+ qwen3-4b-log-unary/model_layers_27_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2856
+ qwen3-4b-log-unary/model_layers_15_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2857
+ qwen3-4b-log-unary/model_layers_16_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2858
+ qwen3-4b-log-unary/model_layers_22_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2859
+ qwen3-4b-log-unary/model_layers_29_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2860
+ qwen3-4b-log-unary/model_layers_22_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2861
+ qwen3-4b-log-unary/model_layers_29_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2862
+ qwen3-4b-log-unary/model_layers_34_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2863
+ qwen3-4b-log-unary/model_layers_26_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2864
+ qwen3-4b-log-unary/model_layers_33_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2865
+ qwen3-4b-log-unary/model_layers_24_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2866
+ qwen3-4b-log-unary/model_layers_13_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2867
+ qwen3-4b-log-unary/model_layers_33_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2868
+ qwen3-4b-log-unary/model_layers_23_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2869
+ qwen3-4b-log-unary/model_layers_9_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2870
+ qwen3-4b-log-unary/model_layers_16_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2871
+ qwen3-4b-log-unary/model_layers_35_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2872
+ qwen3-4b-log-unary/model_layers_0_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2873
+ qwen3-4b-log-unary/model_layers_29_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2874
+ qwen3-4b-log-unary/model_layers_27_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2875
+ qwen3-4b-log-unary/model_layers_35_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2876
+ qwen3-4b-log-unary/model_layers_28_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2877
+ qwen3-4b-log-unary/model_layers_29_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2878
+ qwen3-4b-log-unary/model_layers_20_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2879
+ qwen3-4b-log-unary/model_layers_15_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2880
+ qwen3-4b-log-unary/model_layers_15_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2881
+ qwen3-4b-log-unary/model_layers_24_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2882
+ qwen3-4b-log-unary/model_layers_14_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2883
+ qwen3-4b-log-unary/model_layers_19_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2884
+ qwen3-4b-log-unary/model_layers_2_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2885
+ qwen3-4b-log-unary/model_layers_6_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2886
+ qwen3-4b-log-unary/model_layers_15_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2887
+ qwen3-4b-log-unary/model_layers_4_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2888
+ qwen3-4b-log-unary/model_layers_1_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2889
+ qwen3-4b-log-unary/model_layers_27_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
2890
+ qwen3-4b-log-unary/model_layers_2_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2891
+ qwen3-4b-log-unary/model_layers_10_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text
2892
+ qwen3-4b-log-unary/model_layers_31_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text
qwen3-4b-log-unary/model_layers_0_self_attn_k_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f889c04a60a3f6458bf9d2efef22160fbebc2480c728190a58cf5f87fadf2ea
3
+ size 1310720
qwen3-4b-log-unary/model_layers_0_self_attn_q_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdfa9285e4a6d99f7bfb87889274d7960d74a7926e9bf71ef240acbe38b88752
3
+ size 5242880
qwen3-4b-log-unary/model_layers_0_self_attn_v_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f48ba788fbc1d12c56e8dd69897274104445c98f4356b6bdf7976f22c0456d9
3
+ size 1310720
qwen3-4b-log-unary/model_layers_10_mlp_gate_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:115a2b520d7f32dab11d5f24ed0cc8d570ca89d51b1b5a66ed98b98f4a01f50e
3
+ size 12451840
qwen3-4b-log-unary/model_layers_10_self_attn_o_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea22b3c32fefdbdc3e1a11a241caa1ec989709178c5e13457d0cfe99019a048a
3
+ size 5242880
qwen3-4b-log-unary/model_layers_10_self_attn_v_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c44fb623369c3927bea884407fdcb26b5a9568945d1bfd146ab75a93061f83d2
3
+ size 1310720
qwen3-4b-log-unary/model_layers_11_mlp_up_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7707d7f57d28e0acbcecf85f8ea6e6962fada16ac49144d4e1e1a8ccc94a6bf
3
+ size 3112960
qwen3-4b-log-unary/model_layers_11_self_attn_v_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c006a897731a1626b9c2c1c4ca2551d511740a2f661df4d14815ae4128a7102f
3
+ size 327680
qwen3-4b-log-unary/model_layers_12_mlp_up_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6256f4e31ce00753c240f6e83c14bef9d9a26b2ed796bd2fed667e54cff474c2
3
+ size 12451840
qwen3-4b-log-unary/model_layers_13_mlp_gate_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c92483a3170be7725daac8875db930d5f1164cbd9ca7d11001e43f4ecf5837a0
3
+ size 3112960
qwen3-4b-log-unary/model_layers_13_mlp_up_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d29086a56bd8b26b987d67597284546ffda13dd1ea9ef13835614615990adfdf
3
+ size 12451840
qwen3-4b-log-unary/model_layers_13_mlp_up_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62d5b9a1e4b72963d770eb778bdbedc23b556e67fba73b1357e00c2124e4f075
3
+ size 3112960
qwen3-4b-log-unary/model_layers_13_self_attn_k_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c33c569521d0324bd8a95701f63bd8ce75ffdc4c0dcbe20e50ae403ac0065e23
3
+ size 1310720
qwen3-4b-log-unary/model_layers_13_self_attn_q_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f54d53a03335353a6571665edc0d43c4d8cdd5389696c5622a21248608326963
3
+ size 5242880
qwen3-4b-log-unary/model_layers_14_mlp_down_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dfc1fbf8f6518bdd71a4174b204c5636b4acf2b9752455fc28cd6d995343265
3
+ size 3112960
qwen3-4b-log-unary/model_layers_14_self_attn_k_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ada7a3551e9626f9d2d29efae97c425bfbea3c549de55b56ea3c6797c0c19bb
3
+ size 327680
qwen3-4b-log-unary/model_layers_14_self_attn_o_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f74814798f37e654d60401fef9f23e7e1065e1843d612a360c090cf61b2a51d
3
+ size 5242880
qwen3-4b-log-unary/model_layers_15_mlp_down_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:198aa7285ac7988c1b4d22ab20e1cff545d7c169f0ca8db679bf0e5361756d6a
3
+ size 3112960
qwen3-4b-log-unary/model_layers_15_mlp_gate_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fdf4cda4c51043f4aa8483b12f95153f2d9b8e0de676bb916129220b0b1f3cd
3
+ size 12451840
qwen3-4b-log-unary/model_layers_15_mlp_up_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8846640d3a96ba070921e81615723ce992ef6b8ba203029175a662df8d6a0c3
3
+ size 12451840
qwen3-4b-log-unary/model_layers_15_self_attn_o_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de21d4d6298001caaf900cc67e086b1a3a23c5fb2f0ddd0864a18ab52a4f3f2f
3
+ size 5242880
qwen3-4b-log-unary/model_layers_15_self_attn_o_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7f71af7f47151a4dce6d3dd9a1b6f2e44e3589a3436faa991a6ed268fad77c9
3
+ size 1310720
qwen3-4b-log-unary/model_layers_15_self_attn_q_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8ae7e0b84d6c563ba2d7db64e36fc1a931b0eede950ae8869c0b90755a9116b
3
+ size 5242880
qwen3-4b-log-unary/model_layers_15_self_attn_v_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e4c5d23444748e86b09338e44d5999471af8237b182252bab49f2c4e143c771
3
+ size 1310720
qwen3-4b-log-unary/model_layers_15_self_attn_v_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b40193c724d798f6177f6910c45e179c50cb4d637f7964fba42d4e97862231fa
3
+ size 327680
qwen3-4b-log-unary/model_layers_16_mlp_down_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bea96aabc737dfbe645a8503d75e1d1352a089a36690fde5ab49bcf72a220f5e
3
+ size 3112960
qwen3-4b-log-unary/model_layers_16_mlp_up_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21694fb071f5955172dd0b73acd4ac9fb3885ee30aca73928a079a93bbab46fc
3
+ size 12451840
qwen3-4b-log-unary/model_layers_16_self_attn_q_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33428699aa8f9b44a7303ed8320eebf76f6387a463606bf01d1ee449e9552a69
3
+ size 5242880
qwen3-4b-log-unary/model_layers_16_self_attn_v_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dd041fd4a7165421fcb13f9006c858a7573333a163aac494264b50e9ff55f82
3
+ size 1310720
qwen3-4b-log-unary/model_layers_16_self_attn_v_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ccdcd9dc6af201791934b5ce7c0651d63e130024291b6cac7d65e72fc1c49d0
3
+ size 327680
qwen3-4b-log-unary/model_layers_17_mlp_gate_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b9e75d82b79732b43a70fdd6e0bb275100c0047d15fda6b430570c93b387ce1
3
+ size 12451840
qwen3-4b-log-unary/model_layers_17_mlp_gate_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3467af08d628ef1f27afd05057a4138aeadd9038027c44a99350d727638e9dae
3
+ size 3112960
qwen3-4b-log-unary/model_layers_17_self_attn_k_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c3f5f83a755cf3508baffcbb802b59e7314667ff48435e47f680a695e60ee94
3
+ size 1310720
qwen3-4b-log-unary/model_layers_17_self_attn_k_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1592399845312ad0cdf7055f68f5cdcca88c49d819658d9db66d072cd28b2521
3
+ size 327680
qwen3-4b-log-unary/model_layers_17_self_attn_q_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15a9d2352133200bac5afb6f6b1a4ad867218dfd9657b68b10872e320489e69e
3
+ size 1310720
qwen3-4b-log-unary/model_layers_18_self_attn_o_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:181ebb30af9a068368c043583bedd361c5ac9a1189e495a43e6f54fdf293a6e8
3
+ size 5242880
qwen3-4b-log-unary/model_layers_18_self_attn_q_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f198b000e64941269b357c48596e6cc25be8a2e0717f1426e0c421b23977a97
3
+ size 5242880
qwen3-4b-log-unary/model_layers_19_mlp_down_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c640a071b959ddb72787ed152b95fbfb48025ac721fd8750d977226aa96d25f
3
+ size 12451840
qwen3-4b-log-unary/model_layers_19_mlp_down_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:768d1ed8e30ac5a838bafb41a32b5825d85340ca5e3b949045f5db3b40f1eef0
3
+ size 3112960
qwen3-4b-log-unary/model_layers_19_mlp_up_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98dbcb44a9cbd6e357c699c84a5781f4f511a894d202baf40a92ccece5edf67c
3
+ size 12451840
qwen3-4b-log-unary/model_layers_19_mlp_up_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc5ba0a21e7ace88f747666d134ef8d8b72e6399be7d7f1e3352ef80cde60926
3
+ size 3112960
qwen3-4b-log-unary/model_layers_1_mlp_down_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3efaa0fb1a3cad08898a421edd75922b7e3e02d3ef68ea270503860c55f69f9b
3
+ size 3112960
qwen3-4b-log-unary/model_layers_1_self_attn_k_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:532bed4de5e126cd24144ec4a2665dd17634def94b32ea4cf511c01d905c79c9
3
+ size 1310720
qwen3-4b-log-unary/model_layers_1_self_attn_k_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb89dbb43658e6e97a8823da521c09f5de4fa35cb43325798f263ebf47483e42
3
+ size 327680
qwen3-4b-log-unary/model_layers_20_mlp_down_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7edf950deecedfbfbdde9bb748cd664545067efe3923d1392753acec2b724f0c
3
+ size 12451840
qwen3-4b-log-unary/model_layers_20_mlp_up_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4304319b73d59696175e2494c259f77a1af1a6c83a22f5e3bcd0fe9a04ae2c67
3
+ size 3112960
qwen3-4b-log-unary/model_layers_20_self_attn_o_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e088685284a9020c6469e034ecde8e0f7cd8ed0bc46c58f6c7bdb1cb4a76cc96
3
+ size 1310720
qwen3-4b-log-unary/model_layers_20_self_attn_q_proj_weight.sign ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcc00e8cbdb6631e9844b8f591ae92d6c9a5d312ef69910daecb04ddef35cb03
3
+ size 1310720
qwen3-4b-log-unary/model_layers_20_self_attn_v_proj_weight.planes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e945bb7b4672cbb2e8066c10513ea16f8b7b5608a7089e0ee8b8ae6b13f002fa
3
+ size 1310720