Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +75 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l0_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l10_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l11_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l12_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l13_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l14_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l15_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l16_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l17_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l18_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l19_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l1_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l20_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l21_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l22_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l23_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l2_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l3_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l4_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l5_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l6_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l7_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l8_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l9_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_post.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l0_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l10_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l11_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l12_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l13_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l14_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l15_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l16_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l17_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l18_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l19_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l1_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l20_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l21_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l22_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l23_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l2_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l3_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l4_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l5_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l6_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l7_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l8_together.axmodel +3 -0
- Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l9_together.axmodel +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,78 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l0_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l10_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l11_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l12_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l13_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l14_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l15_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l16_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l17_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l18_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l19_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l1_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l20_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l21_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l22_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l23_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l2_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l3_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l4_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l5_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l6_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l7_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l8_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l9_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_post.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l0_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l10_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l11_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l12_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l13_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l14_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l15_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l16_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l17_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l18_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l19_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 72 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l1_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 73 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l20_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 74 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l21_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 75 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l22_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 76 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l23_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 77 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l2_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 78 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l3_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 79 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l4_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 80 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l5_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 81 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l6_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 82 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l7_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 83 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l8_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 84 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l9_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 85 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_post.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 86 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l0_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 87 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l10_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 88 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l11_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 89 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l12_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 90 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l13_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 91 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l14_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 92 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l15_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 93 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l16_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 94 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l17_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 95 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l18_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 96 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l19_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 97 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l1_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 98 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l20_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 99 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l21_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 100 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l22_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 101 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l23_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 102 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l2_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 103 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l3_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 104 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l4_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 105 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l5_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 106 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l6_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 107 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l7_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 108 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l8_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 109 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_p128_l9_together.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 110 |
+
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1k/qwen2_post.axmodel filter=lfs diff=lfs merge=lfs -text
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l0_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33815de53b3271fc6d8c8fab337f34208c6014fd15adf9503a81910b9c14193a
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l10_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f45f37db004356b484887d2e6ea85ff3e276877475e0eca93c992bbdc87edc6b
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l11_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11042aa405c8f60c16312bd101f8984013bb9194beccac6668b240433acec0ee
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l12_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:455b916a847a4eaef436e5462678b453cf6483feca2b3896e3d71fd57ef7c1fd
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l13_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:108f8301db0b77ab5ca583be5c4e0411d1522bd8dc0ebda808839863a814d4e9
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l14_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68bcddd4e29d160543a5556e690d85a573f599eeb829d76b6bc41feddc9eb892
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l15_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff4441623f6106256bd784e80b0e252ed64a187e9ea2ee7366ea3f7f5154db04
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l16_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:00e977e1810910508bbe72c0d4e37abdf2e1ec28358d16a0dd99b88ce2151753
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l17_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:493a462f25abccdc507c240cfb797d74685ea3f5019cbb8a61395e86f0eeef43
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l18_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0187028b3c2b30929f65417995f9d12bbe37962a270173c9164c17231e8b6be9
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l19_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2440f30d43b6096b6a33dd6f23c2c5b6e7abda721ab82fc515b678e9f6353e11
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l1_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9bd33b3867dc10e9a657161c0345e3e2a07e73b7b8d0e48a181aa4d3b2247e94
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l20_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b43af5cae0c99b4d9d61d03a11d4fddf6f8d86020cd55f048688f6b8a28d04d
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l21_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a50dd25ce181117ddd28ce022c23310dad502c2df4a8128b283413f9da16f0a
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l22_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1dfa212458d8caa700c42bc9a6731171982b581721436c6dca2b1cb899d164cd
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l23_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a292391265ac4d74e48df7644f7fbe708867f204b6cce08827cbb4408bf00c8
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l2_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:60b4d677f094bbd9e9033d6bbd4d6c784638017965e5017487a2a228f892a88e
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l3_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e387c072e828941bc1505ad737874dea3b3507f4bdcd850ab88814c1c5b83a2
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l4_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:74c8d6b70bd559f89583a28b54cfab7484f6cc4b8cdb009b603626a64e144c25
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l5_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8ca669414409a4450d278cbd261a43a18bfd183f70c045e15e71e5cd2a093f66
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l6_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:166212dbc41ef15d23333f3cfa0f884e53dc5a079c99fc7b036ac6967b7b2ad4
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l7_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4715485bf999fe090655ae92af76b8a4e49a8e84abb33e3bc446af90dc3dd3e5
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l8_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bcd04a53d1c61dab02dd81a6e5177faad319000c3558e7ff9dc761cb07cbf013
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_p128_l9_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b1adf994780024738ff01afd32726ad4c610ace7657f10616bd4bb0451f5fed8
|
| 3 |
+
size 12705233
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2500-prefill-2k/qwen2_post.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a70bca0bc2f8d8c3754f4aa567e558a06ad37fd3fdf47b1ab1131e6c16062e95
|
| 3 |
+
size 147954858
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l0_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ddaa40c0e74f34a66e807975a121d8673c6eb7d2e4970f39fbb1c863cc12809
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l10_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f16fd94628ecafc0648c14344f4ca5cceef3fd562e35ee5e9129e2b83fb3fddd
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l11_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:430fb2a9e88313643ed73db9942214787472849dade524f7cbf201ab52202878
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l12_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:74ed83ec7920e1dbeaaed08e13de1127b6770bbaa7cd9da8436fb8f8513d4e07
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l13_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f95bc9f8db35d9ddd7afb21ad46c74f5fe9a68acc791bf0586428d4d618552d
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l14_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de72db5e8180d929e728d64db63e8e784a798fbb1651f2558546fa952151709c
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l15_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1991082fcbecbd4e14127000e75b0831d6c30526fdb41589dd3fd7bc14eb4f20
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l16_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5935978a8ae85f2c390161d05b22a8c322e5ff3616eba596dea8f990fb271daa
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l17_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:417d780b4d5efea7c23018e3f0f2500789358357c45dc33b12e460fcc12cd1cb
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l18_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b832312ea3411431452b23a317e8a624010f2b502e3dabf150014d96e4e6d11
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l19_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23019163daffe863501bd51efc7984fd851209eec6d61af32cb7d11bb5f09dc5
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l1_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41ba7738d7cfab51bc3a9bb9fcb25bb9e013a56e4f51d0040685f273a146a993
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l20_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e9bb54157f84f4fa50aeea9eed00ca0c31a091493231d49239e5943b80b3ff0
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l21_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1984110b1871b45e854903c7db3891a18c1d83e7f0c16dbaeb7b5f902653109e
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l22_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bd144a977c21583d9cc1e1f0cf4960c7288cdf4f1c1a798f3fc97ff47952d694
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l23_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f17e98b589f47f9530cfd754472a3953ca790fbd2e60fa12766f35b420c2368d
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l2_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe23f5af252219bf430c8f9017e9f0136006a24354daef14ddd6feaccf1666f2
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l3_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1449c8aadc9f3f735cc6e4c1c7fc9d4777c4f2217da33a6b3145989beb575588
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l4_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:00d69fac32ba1bc654a2466ecd1fda2bc584f98f8da887584cfa79d4150c7b83
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l5_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5108c4cf6d94436bef0850a9c3292d5b2454fa729f52cccd63e4af53c91e9dd
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l6_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3ccb86670b27ac12fb320e016d7b713e3d822a073ba8bd6876365d9e10ec1b6
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l7_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5a8d43fd1bbc8132d14cc2f22aa7e6edf8efb9906b46c81fe4333a923b2360e4
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l8_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:71e8f81d7340b319d14bf842f9ea55c6de65f3ac20303e7e3dfe93798b66687d
|
| 3 |
+
size 11687781
|
Qwen2.5-0.5B-Instruct-GPTQ-Int4-context-2k-prefill-1500/qwen2_p128_l9_together.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d11985fc109897bfe8742f77610d0b84286183cd683b7af81a595605cebbd635
|
| 3 |
+
size 11687781
|