Update README.md
Browse files
README.md
CHANGED
|
@@ -8,10 +8,14 @@ tags:
|
|
| 8 |
- mixture-of-experts
|
| 9 |
- autoregressive
|
| 10 |
- text-generation
|
|
|
|
|
|
|
| 11 |
datasets:
|
| 12 |
- HuggingFaceFW/fineweb-edu
|
| 13 |
pipeline_tag: text-generation
|
| 14 |
library_name: pytorch
|
|
|
|
|
|
|
| 15 |
---
|
| 16 |
|
| 17 |
# HSSM
|
|
@@ -185,4 +189,4 @@ print(reply)
|
|
| 185 |
|
| 186 |
## Citation
|
| 187 |
|
| 188 |
-
If you use this release in experiments, please cite the model repository and mention the FineWeb-Edu pretraining source.
|
|
|
|
| 8 |
- mixture-of-experts
|
| 9 |
- autoregressive
|
| 10 |
- text-generation
|
| 11 |
+
- 73.8 M
|
| 12 |
+
- pretrained
|
| 13 |
datasets:
|
| 14 |
- HuggingFaceFW/fineweb-edu
|
| 15 |
pipeline_tag: text-generation
|
| 16 |
library_name: pytorch
|
| 17 |
+
model_type: custom
|
| 18 |
+
license: mit
|
| 19 |
---
|
| 20 |
|
| 21 |
# HSSM
|
|
|
|
| 189 |
|
| 190 |
## Citation
|
| 191 |
|
| 192 |
+
If you use this release in experiments, please cite the model repository and mention the FineWeb-Edu pretraining source.
|