wli1995 commited on
Commit
af30672
·
verified ·
1 Parent(s): ccfe43e

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +75 -0
  2. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l0_together.axmodel +3 -0
  3. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l10_together.axmodel +3 -0
  4. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l11_together.axmodel +3 -0
  5. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l12_together.axmodel +3 -0
  6. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l13_together.axmodel +3 -0
  7. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l14_together.axmodel +3 -0
  8. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l15_together.axmodel +3 -0
  9. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l16_together.axmodel +3 -0
  10. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l17_together.axmodel +3 -0
  11. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l18_together.axmodel +3 -0
  12. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l19_together.axmodel +3 -0
  13. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l1_together.axmodel +3 -0
  14. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l20_together.axmodel +3 -0
  15. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l21_together.axmodel +3 -0
  16. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l22_together.axmodel +3 -0
  17. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l23_together.axmodel +3 -0
  18. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l2_together.axmodel +3 -0
  19. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l3_together.axmodel +3 -0
  20. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l4_together.axmodel +3 -0
  21. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l5_together.axmodel +3 -0
  22. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l6_together.axmodel +3 -0
  23. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l7_together.axmodel +3 -0
  24. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l8_together.axmodel +3 -0
  25. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l9_together.axmodel +3 -0
  26. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_post.axmodel +3 -0
  27. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l0_together.axmodel +3 -0
  28. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l10_together.axmodel +3 -0
  29. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l11_together.axmodel +3 -0
  30. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l12_together.axmodel +3 -0
  31. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l13_together.axmodel +3 -0
  32. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l14_together.axmodel +3 -0
  33. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l15_together.axmodel +3 -0
  34. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l16_together.axmodel +3 -0
  35. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l17_together.axmodel +3 -0
  36. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l18_together.axmodel +3 -0
  37. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l19_together.axmodel +3 -0
  38. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l1_together.axmodel +3 -0
  39. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l20_together.axmodel +3 -0
  40. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l21_together.axmodel +3 -0
  41. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l22_together.axmodel +3 -0
  42. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l23_together.axmodel +3 -0
  43. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l2_together.axmodel +3 -0
  44. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l3_together.axmodel +3 -0
  45. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l4_together.axmodel +3 -0
  46. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l5_together.axmodel +3 -0
  47. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l6_together.axmodel +3 -0
  48. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l7_together.axmodel +3 -0
  49. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l8_together.axmodel +3 -0
  50. Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l9_together.axmodel +3 -0
.gitattributes CHANGED
@@ -33,3 +33,78 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l0_together.axmodel filter=lfs diff=lfs merge=lfs -text
37
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l10_together.axmodel filter=lfs diff=lfs merge=lfs -text
38
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l11_together.axmodel filter=lfs diff=lfs merge=lfs -text
39
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l12_together.axmodel filter=lfs diff=lfs merge=lfs -text
40
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l13_together.axmodel filter=lfs diff=lfs merge=lfs -text
41
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l14_together.axmodel filter=lfs diff=lfs merge=lfs -text
42
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l15_together.axmodel filter=lfs diff=lfs merge=lfs -text
43
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l16_together.axmodel filter=lfs diff=lfs merge=lfs -text
44
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l17_together.axmodel filter=lfs diff=lfs merge=lfs -text
45
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l18_together.axmodel filter=lfs diff=lfs merge=lfs -text
46
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l19_together.axmodel filter=lfs diff=lfs merge=lfs -text
47
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l1_together.axmodel filter=lfs diff=lfs merge=lfs -text
48
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l20_together.axmodel filter=lfs diff=lfs merge=lfs -text
49
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l21_together.axmodel filter=lfs diff=lfs merge=lfs -text
50
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l22_together.axmodel filter=lfs diff=lfs merge=lfs -text
51
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l23_together.axmodel filter=lfs diff=lfs merge=lfs -text
52
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l2_together.axmodel filter=lfs diff=lfs merge=lfs -text
53
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l3_together.axmodel filter=lfs diff=lfs merge=lfs -text
54
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l4_together.axmodel filter=lfs diff=lfs merge=lfs -text
55
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l5_together.axmodel filter=lfs diff=lfs merge=lfs -text
56
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l6_together.axmodel filter=lfs diff=lfs merge=lfs -text
57
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l7_together.axmodel filter=lfs diff=lfs merge=lfs -text
58
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l8_together.axmodel filter=lfs diff=lfs merge=lfs -text
59
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l9_together.axmodel filter=lfs diff=lfs merge=lfs -text
60
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_post.axmodel filter=lfs diff=lfs merge=lfs -text
61
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l0_together.axmodel filter=lfs diff=lfs merge=lfs -text
62
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l10_together.axmodel filter=lfs diff=lfs merge=lfs -text
63
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l11_together.axmodel filter=lfs diff=lfs merge=lfs -text
64
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l12_together.axmodel filter=lfs diff=lfs merge=lfs -text
65
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l13_together.axmodel filter=lfs diff=lfs merge=lfs -text
66
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l14_together.axmodel filter=lfs diff=lfs merge=lfs -text
67
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l15_together.axmodel filter=lfs diff=lfs merge=lfs -text
68
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l16_together.axmodel filter=lfs diff=lfs merge=lfs -text
69
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l17_together.axmodel filter=lfs diff=lfs merge=lfs -text
70
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l18_together.axmodel filter=lfs diff=lfs merge=lfs -text
71
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l19_together.axmodel filter=lfs diff=lfs merge=lfs -text
72
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l1_together.axmodel filter=lfs diff=lfs merge=lfs -text
73
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l20_together.axmodel filter=lfs diff=lfs merge=lfs -text
74
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l21_together.axmodel filter=lfs diff=lfs merge=lfs -text
75
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l22_together.axmodel filter=lfs diff=lfs merge=lfs -text
76
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l23_together.axmodel filter=lfs diff=lfs merge=lfs -text
77
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l2_together.axmodel filter=lfs diff=lfs merge=lfs -text
78
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l3_together.axmodel filter=lfs diff=lfs merge=lfs -text
79
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l4_together.axmodel filter=lfs diff=lfs merge=lfs -text
80
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l5_together.axmodel filter=lfs diff=lfs merge=lfs -text
81
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l6_together.axmodel filter=lfs diff=lfs merge=lfs -text
82
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l7_together.axmodel filter=lfs diff=lfs merge=lfs -text
83
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l8_together.axmodel filter=lfs diff=lfs merge=lfs -text
84
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l9_together.axmodel filter=lfs diff=lfs merge=lfs -text
85
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_post.axmodel filter=lfs diff=lfs merge=lfs -text
86
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l0_together.axmodel filter=lfs diff=lfs merge=lfs -text
87
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l10_together.axmodel filter=lfs diff=lfs merge=lfs -text
88
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l11_together.axmodel filter=lfs diff=lfs merge=lfs -text
89
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l12_together.axmodel filter=lfs diff=lfs merge=lfs -text
90
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l13_together.axmodel filter=lfs diff=lfs merge=lfs -text
91
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l14_together.axmodel filter=lfs diff=lfs merge=lfs -text
92
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l15_together.axmodel filter=lfs diff=lfs merge=lfs -text
93
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l16_together.axmodel filter=lfs diff=lfs merge=lfs -text
94
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l17_together.axmodel filter=lfs diff=lfs merge=lfs -text
95
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l18_together.axmodel filter=lfs diff=lfs merge=lfs -text
96
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l19_together.axmodel filter=lfs diff=lfs merge=lfs -text
97
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l1_together.axmodel filter=lfs diff=lfs merge=lfs -text
98
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l20_together.axmodel filter=lfs diff=lfs merge=lfs -text
99
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l21_together.axmodel filter=lfs diff=lfs merge=lfs -text
100
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l22_together.axmodel filter=lfs diff=lfs merge=lfs -text
101
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l23_together.axmodel filter=lfs diff=lfs merge=lfs -text
102
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l2_together.axmodel filter=lfs diff=lfs merge=lfs -text
103
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l3_together.axmodel filter=lfs diff=lfs merge=lfs -text
104
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l4_together.axmodel filter=lfs diff=lfs merge=lfs -text
105
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l5_together.axmodel filter=lfs diff=lfs merge=lfs -text
106
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l6_together.axmodel filter=lfs diff=lfs merge=lfs -text
107
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l7_together.axmodel filter=lfs diff=lfs merge=lfs -text
108
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l8_together.axmodel filter=lfs diff=lfs merge=lfs -text
109
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l9_together.axmodel filter=lfs diff=lfs merge=lfs -text
110
+ Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_post.axmodel filter=lfs diff=lfs merge=lfs -text
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l0_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33815de53b3271fc6d8c8fab337f34208c6014fd15adf9503a81910b9c14193a
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l10_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f45f37db004356b484887d2e6ea85ff3e276877475e0eca93c992bbdc87edc6b
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l11_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11042aa405c8f60c16312bd101f8984013bb9194beccac6668b240433acec0ee
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l12_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:455b916a847a4eaef436e5462678b453cf6483feca2b3896e3d71fd57ef7c1fd
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l13_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:108f8301db0b77ab5ca583be5c4e0411d1522bd8dc0ebda808839863a814d4e9
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l14_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68bcddd4e29d160543a5556e690d85a573f599eeb829d76b6bc41feddc9eb892
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l15_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff4441623f6106256bd784e80b0e252ed64a187e9ea2ee7366ea3f7f5154db04
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l16_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00e977e1810910508bbe72c0d4e37abdf2e1ec28358d16a0dd99b88ce2151753
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l17_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:493a462f25abccdc507c240cfb797d74685ea3f5019cbb8a61395e86f0eeef43
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l18_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0187028b3c2b30929f65417995f9d12bbe37962a270173c9164c17231e8b6be9
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l19_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2440f30d43b6096b6a33dd6f23c2c5b6e7abda721ab82fc515b678e9f6353e11
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l1_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bd33b3867dc10e9a657161c0345e3e2a07e73b7b8d0e48a181aa4d3b2247e94
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l20_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b43af5cae0c99b4d9d61d03a11d4fddf6f8d86020cd55f048688f6b8a28d04d
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l21_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a50dd25ce181117ddd28ce022c23310dad502c2df4a8128b283413f9da16f0a
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l22_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dfa212458d8caa700c42bc9a6731171982b581721436c6dca2b1cb899d164cd
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l23_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a292391265ac4d74e48df7644f7fbe708867f204b6cce08827cbb4408bf00c8
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l2_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60b4d677f094bbd9e9033d6bbd4d6c784638017965e5017487a2a228f892a88e
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l3_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e387c072e828941bc1505ad737874dea3b3507f4bdcd850ab88814c1c5b83a2
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l4_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74c8d6b70bd559f89583a28b54cfab7484f6cc4b8cdb009b603626a64e144c25
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l5_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ca669414409a4450d278cbd261a43a18bfd183f70c045e15e71e5cd2a093f66
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l6_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:166212dbc41ef15d23333f3cfa0f884e53dc5a079c99fc7b036ac6967b7b2ad4
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l7_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4715485bf999fe090655ae92af76b8a4e49a8e84abb33e3bc446af90dc3dd3e5
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l8_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcd04a53d1c61dab02dd81a6e5177faad319000c3558e7ff9dc761cb07cbf013
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l9_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1adf994780024738ff01afd32726ad4c610ace7657f10616bd4bb0451f5fed8
3
+ size 12705233
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_post.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a70bca0bc2f8d8c3754f4aa567e558a06ad37fd3fdf47b1ab1131e6c16062e95
3
+ size 147954858
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l0_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ddaa40c0e74f34a66e807975a121d8673c6eb7d2e4970f39fbb1c863cc12809
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l10_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f16fd94628ecafc0648c14344f4ca5cceef3fd562e35ee5e9129e2b83fb3fddd
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l11_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:430fb2a9e88313643ed73db9942214787472849dade524f7cbf201ab52202878
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l12_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74ed83ec7920e1dbeaaed08e13de1127b6770bbaa7cd9da8436fb8f8513d4e07
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l13_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f95bc9f8db35d9ddd7afb21ad46c74f5fe9a68acc791bf0586428d4d618552d
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l14_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de72db5e8180d929e728d64db63e8e784a798fbb1651f2558546fa952151709c
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l15_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1991082fcbecbd4e14127000e75b0831d6c30526fdb41589dd3fd7bc14eb4f20
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l16_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5935978a8ae85f2c390161d05b22a8c322e5ff3616eba596dea8f990fb271daa
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l17_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:417d780b4d5efea7c23018e3f0f2500789358357c45dc33b12e460fcc12cd1cb
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l18_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b832312ea3411431452b23a317e8a624010f2b502e3dabf150014d96e4e6d11
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l19_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23019163daffe863501bd51efc7984fd851209eec6d61af32cb7d11bb5f09dc5
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l1_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41ba7738d7cfab51bc3a9bb9fcb25bb9e013a56e4f51d0040685f273a146a993
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l20_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e9bb54157f84f4fa50aeea9eed00ca0c31a091493231d49239e5943b80b3ff0
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l21_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1984110b1871b45e854903c7db3891a18c1d83e7f0c16dbaeb7b5f902653109e
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l22_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd144a977c21583d9cc1e1f0cf4960c7288cdf4f1c1a798f3fc97ff47952d694
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l23_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f17e98b589f47f9530cfd754472a3953ca790fbd2e60fa12766f35b420c2368d
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l2_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe23f5af252219bf430c8f9017e9f0136006a24354daef14ddd6feaccf1666f2
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l3_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1449c8aadc9f3f735cc6e4c1c7fc9d4777c4f2217da33a6b3145989beb575588
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l4_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00d69fac32ba1bc654a2466ecd1fda2bc584f98f8da887584cfa79d4150c7b83
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l5_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5108c4cf6d94436bef0850a9c3292d5b2454fa729f52cccd63e4af53c91e9dd
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l6_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3ccb86670b27ac12fb320e016d7b713e3d822a073ba8bd6876365d9e10ec1b6
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l7_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a8d43fd1bbc8132d14cc2f22aa7e6edf8efb9906b46c81fe4333a923b2360e4
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l8_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71e8f81d7340b319d14bf842f9ea55c6de65f3ac20303e7e3dfe93798b66687d
3
+ size 11687781
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l9_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d11985fc109897bfe8742f77610d0b84286183cd683b7af81a595605cebbd635
3
+ size 11687781