| *.7z filter=lfs diff=lfs merge=lfs -text |
| *.arrow filter=lfs diff=lfs merge=lfs -text |
| *.bin filter=lfs diff=lfs merge=lfs -text |
| *.bz2 filter=lfs diff=lfs merge=lfs -text |
| *.ckpt filter=lfs diff=lfs merge=lfs -text |
| *.ftz filter=lfs diff=lfs merge=lfs -text |
| *.gz filter=lfs diff=lfs merge=lfs -text |
| *.h5 filter=lfs diff=lfs merge=lfs -text |
| *.joblib filter=lfs diff=lfs merge=lfs -text |
| *.lfs.* filter=lfs diff=lfs merge=lfs -text |
| *.mlmodel filter=lfs diff=lfs merge=lfs -text |
| *.model filter=lfs diff=lfs merge=lfs -text |
| *.msgpack filter=lfs diff=lfs merge=lfs -text |
| *.npy filter=lfs diff=lfs merge=lfs -text |
| *.npz filter=lfs diff=lfs merge=lfs -text |
| *.onnx filter=lfs diff=lfs merge=lfs -text |
| *.ot filter=lfs diff=lfs merge=lfs -text |
| *.parquet filter=lfs diff=lfs merge=lfs -text |
| *.pb filter=lfs diff=lfs merge=lfs -text |
| *.pickle filter=lfs diff=lfs merge=lfs -text |
| *.pkl filter=lfs diff=lfs merge=lfs -text |
| *.pt filter=lfs diff=lfs merge=lfs -text |
| *.pth filter=lfs diff=lfs merge=lfs -text |
| *.rar filter=lfs diff=lfs merge=lfs -text |
| *.safetensors filter=lfs diff=lfs merge=lfs -text |
| saved_model/**/* filter=lfs diff=lfs merge=lfs -text |
| *.tar.* filter=lfs diff=lfs merge=lfs -text |
| *.tar filter=lfs diff=lfs merge=lfs -text |
| *.tflite filter=lfs diff=lfs merge=lfs -text |
| *.tgz filter=lfs diff=lfs merge=lfs -text |
| *.wasm filter=lfs diff=lfs merge=lfs -text |
| *.xz filter=lfs diff=lfs merge=lfs -text |
| *.zip filter=lfs diff=lfs merge=lfs -text |
| *.zst filter=lfs diff=lfs merge=lfs -text |
| *tfevents* filter=lfs diff=lfs merge=lfs -text |
| performance_plot.png filter=lfs diff=lfs merge=lfs -text |
| llama32-1b-hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| llama32-1b-hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__llama32-1b-hf/samples_gsm8k_2025-12-29T05-09-52.015180.jsonl filter=lfs diff=lfs merge=lfs -text |
| 6000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 6000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__6000_hf/samples_gsm8k_2026-01-07T06-57-48.977156.jsonl filter=lfs diff=lfs merge=lfs -text |
| 6000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__6000_hf/samples_hellaswag_2026-01-07T03-53-49.653886.jsonl filter=lfs diff=lfs merge=lfs -text |
| 9000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 9000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__9000_hf/samples_gsm8k_2026-01-07T07-00-26.302516.jsonl filter=lfs diff=lfs merge=lfs -text |
| 9000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__9000_hf/samples_hellaswag_2026-01-07T03-49-27.696211.jsonl filter=lfs diff=lfs merge=lfs -text |
| 3000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 3000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__3000_hf/samples_gsm8k_2026-01-07T07-15-16.192705.jsonl filter=lfs diff=lfs merge=lfs -text |
| 3000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__3000_hf/samples_gsm8k_2025-12-29T05-42-31.325047.jsonl filter=lfs diff=lfs merge=lfs -text |
| 3000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__3000_hf/samples_hellaswag_2026-01-07T03-56-25.245340.jsonl filter=lfs diff=lfs merge=lfs -text |
| 3000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__3000_hf/samples_hellaswag_2025-12-29T05-34-35.086951.jsonl filter=lfs diff=lfs merge=lfs -text |
| 7000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 7000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__7000_hf/samples_gsm8k_2026-01-07T07-00-36.377222.jsonl filter=lfs diff=lfs merge=lfs -text |
| 7000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__7000_hf/samples_hellaswag_2026-01-07T03-51-33.637505.jsonl filter=lfs diff=lfs merge=lfs -text |
| 2000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 2000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__2000_hf/samples_gsm8k_2026-01-07T07-11-28.243760.jsonl filter=lfs diff=lfs merge=lfs -text |
| 2000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__2000_hf/samples_gsm8k_2025-12-29T05-42-21.185272.jsonl filter=lfs diff=lfs merge=lfs -text |
| 2000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__2000_hf/samples_hellaswag_2026-01-07T03-51-34.536241.jsonl filter=lfs diff=lfs merge=lfs -text |
| 2000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__2000_hf/samples_hellaswag_2025-12-29T05-34-34.282648.jsonl filter=lfs diff=lfs merge=lfs -text |
| 12000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 12000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__12000_hf/samples_gsm8k_2026-01-07T07-12-50.487181.jsonl filter=lfs diff=lfs merge=lfs -text |
| 12000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__12000_hf/samples_hellaswag_2026-01-07T03-56-25.498160.jsonl filter=lfs diff=lfs merge=lfs -text |
| 8000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 8000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__8000_hf/samples_gsm8k_2026-01-07T07-00-06.652270.jsonl filter=lfs diff=lfs merge=lfs -text |
| 8000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__8000_hf/samples_hellaswag_2026-01-07T03-53-44.066877.jsonl filter=lfs diff=lfs merge=lfs -text |
| 11000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 11000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__11000_hf/samples_gsm8k_2026-01-07T07-13-06.183388.jsonl filter=lfs diff=lfs merge=lfs -text |
| 11000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__11000_hf/samples_hellaswag_2026-01-07T03-51-33.854124.jsonl filter=lfs diff=lfs merge=lfs -text |
| 1000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 1000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__1000_hf/samples_gsm8k_2025-12-29T05-42-28.885838.jsonl filter=lfs diff=lfs merge=lfs -text |
| 1000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__1000_hf/samples_gsm8k_2026-01-07T07-13-27.882882.jsonl filter=lfs diff=lfs merge=lfs -text |
| 1000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__1000_hf/samples_hellaswag_2026-01-07T03-57-52.654434.jsonl filter=lfs diff=lfs merge=lfs -text |
| 1000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__1000_hf/samples_hellaswag_2025-12-29T05-34-34.847641.jsonl filter=lfs diff=lfs merge=lfs -text |
| 4000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 4000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__4000_hf/samples_gsm8k_2026-01-07T06-59-35.025159.jsonl filter=lfs diff=lfs merge=lfs -text |
| 4000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__4000_hf/samples_gsm8k_2025-12-29T05-42-32.998053.jsonl filter=lfs diff=lfs merge=lfs -text |
| 4000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__4000_hf/samples_hellaswag_2025-12-29T05-33-51.606131.jsonl filter=lfs diff=lfs merge=lfs -text |
| 4000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__4000_hf/samples_hellaswag_2026-01-07T03-56-26.179191.jsonl filter=lfs diff=lfs merge=lfs -text |
| 2500_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 2500_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__2500_hf/samples_gsm8k_2025-12-29T05-42-37.282529.jsonl filter=lfs diff=lfs merge=lfs -text |
| 2500_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__2500_hf/samples_gsm8k_2026-01-07T07-15-20.052939.jsonl filter=lfs diff=lfs merge=lfs -text |
| 2500_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__2500_hf/samples_hellaswag_2026-01-07T03-51-34.430609.jsonl filter=lfs diff=lfs merge=lfs -text |
| 2500_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__2500_hf/samples_hellaswag_2025-12-29T05-34-34.570482.jsonl filter=lfs diff=lfs merge=lfs -text |
| 10000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 10000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__10000_hf/samples_gsm8k_2026-01-07T07-13-00.293068.jsonl filter=lfs diff=lfs merge=lfs -text |
| 10000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__10000_hf/samples_hellaswag_2026-01-07T03-56-14.560763.jsonl filter=lfs diff=lfs merge=lfs -text |
| 12500_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 12500_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__12500_hf/samples_gsm8k_2026-01-07T07-12-17.705915.jsonl filter=lfs diff=lfs merge=lfs -text |
| 12500_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__12500_hf/samples_hellaswag_2026-01-07T03-51-35.016035.jsonl filter=lfs diff=lfs merge=lfs -text |
| 5000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 5000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__5000_hf/samples_gsm8k_2026-01-07T06-58-05.968321.jsonl filter=lfs diff=lfs merge=lfs -text |
| 5000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__5000_hf/samples_hellaswag_2026-01-07T03-53-49.355990.jsonl filter=lfs diff=lfs merge=lfs -text |
| 7500_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text |
| 7500_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__7500_hf/samples_gsm8k_2026-01-07T07-00-15.435455.jsonl filter=lfs diff=lfs merge=lfs -text |
| 7500_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__7500_hf/samples_hellaswag_2026-01-07T03-51-34.104451.jsonl filter=lfs diff=lfs merge=lfs -text |
|
|