Update README.md
Browse files
README.md
CHANGED
|
@@ -10,9 +10,12 @@ library_name: transformers
|
|
| 10 |
license: mit
|
| 11 |
pipeline_tag: text-generation
|
| 12 |
---
|
| 13 |
-
|
| 14 |
-
|
| 15 |
-
|
|
|
|
|
|
|
|
|
|
| 16 |
|
| 17 |
<div>
|
| 18 |
<p style="margin-top: 0;margin-bottom: 0;">
|
|
@@ -25,13 +28,12 @@ pipeline_tag: text-generation
|
|
| 25 |
<a href="https://discord.gg/unsloth">
|
| 26 |
<img src="https://github.com/unslothai/unsloth/raw/main/images/Discord%20button.png" width="173">
|
| 27 |
</a>
|
| 28 |
-
<a href="https://
|
| 29 |
<img src="https://raw.githubusercontent.com/unslothai/unsloth/refs/heads/main/images/documentation%20green%20button.png" width="143">
|
| 30 |
</a>
|
| 31 |
</div>
|
| 32 |
</div>
|
| 33 |
|
| 34 |
-
|
| 35 |
# GLM-4.7-Flash
|
| 36 |
|
| 37 |
<div align="center">
|
|
|
|
| 10 |
license: mit
|
| 11 |
pipeline_tag: text-generation
|
| 12 |
---
|
| 13 |
+
# Read our guide: [How to Run FP8 GLM-4.7-Flash](https://unsloth.ai/docs/models/glm-4.7-flash#glm-4.7-flash-in-vllm)
|
| 14 |
+
|
| 15 |
+
## FP8 Dynamically Quantized GLM-4.7-Flash
|
| 16 |
+
This model was dynamically quantized to FP8 by Unsloth for fast, premium inference.<br>To deploy it, read our [vLLM deployment guide](https://unsloth.ai/docs/models/glm-4.7-flash#glm-4.7-flash-in-vllm).
|
| 17 |
+
|
| 18 |
+
---
|
| 19 |
|
| 20 |
<div>
|
| 21 |
<p style="margin-top: 0;margin-bottom: 0;">
|
|
|
|
| 28 |
<a href="https://discord.gg/unsloth">
|
| 29 |
<img src="https://github.com/unslothai/unsloth/raw/main/images/Discord%20button.png" width="173">
|
| 30 |
</a>
|
| 31 |
+
<a href="https://unsloth.ai/docs/models/glm-4.7-flash">
|
| 32 |
<img src="https://raw.githubusercontent.com/unslothai/unsloth/refs/heads/main/images/documentation%20green%20button.png" width="143">
|
| 33 |
</a>
|
| 34 |
</div>
|
| 35 |
</div>
|
| 36 |
|
|
|
|
| 37 |
# GLM-4.7-Flash
|
| 38 |
|
| 39 |
<div align="center">
|