TinyStories: How Small Can Language Models Be and Still Speak Coherent English?
Paper
•
2305.07759
•
Published
•
38
A transformer language model trained on the TinyStories dataset.
import torch
from cs336_basics.transformer import Transformer

# Load model
# Replace `...` with the architecture hyperparameters the checkpoint was
# trained with; load_state_dict raises if parameter names or shapes differ.
model = Transformer(...)  # Configure with parameters above

# map_location="cpu" lets a checkpoint that was saved from a GPU load on a
# machine without one. weights_only=True restricts unpickling to tensors and
# plain containers, so a tampered download cannot execute arbitrary code.
checkpoint = torch.load(
    "pytorch_model.bin",
    map_location="cpu",
    weights_only=True,
)
model.load_state_dict(checkpoint)
model.eval()  # switch train-only layers (e.g. dropout) to inference behavior

# Generate text
# (Add your inference code here)
@misc{tinystories_transformer_80M,
author = {ashishshroti14},
title = {tinystories-transformer-80M},
year = {2025},
publisher = {HuggingFace},
url = {https://huggingface.co/ashishshroti14/tinystories-transformer-80M}
}
@article{eldan2023tinystories,
title={TinyStories: How Small Can Language Models Be and Still Speak Coherent English?},
author={Eldan, Ronen and Li, Yuanzhi},
journal={arXiv preprint arXiv:2305.07759},
year={2023}
}