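# checkpoints/.gitattributes
# Hosting-page residue (avatar caption, not an attribute rule): tyzhu's picture
# Last commit message: Add files using upload-large-folder tool
# Last commit: 194dc22 (verified)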
# Generic Git LFS rules, keyed by file extension / filename glob.
# Every rule below assigns the same four attributes:
#   filter=lfs  diff=lfs  merge=lfs  -> use the "lfs" filter, diff and merge drivers
#   -text                            -> unset the text attribute (no end-of-line conversion)
# Patterns without a slash match the file name at any depth in the repository.
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
# Matches any name containing ".lfs." (e.g. "weights.lfs.part1").
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
# Contains a slash, so it is matched relative to this file's directory:
# files nested under the "saved_model" directory located next to this file.
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
# "*.tar.*" covers compressed tarballs such as .tar.gz / .tar.xz; plain .tar is the next rule.
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
# Matches any file name containing "tfevents" (presumably TensorBoard event logs — confirm).
*tfevents* filter=lfs diff=lfs merge=lfs -text
# Explicit per-file Git LFS rules (same attributes as the extension rules:
# filter=lfs diff=lfs merge=lfs -text). Each path names one specific file whose
# extension (.png, .json, .jsonl) is not covered by a generic glob.
# NOTE(review): these look auto-appended by the upload tooling for individual
# large files — confirm before hand-editing or collapsing them into a glob,
# since a broader pattern (e.g. *.jsonl) would also capture files not listed here.
# Entries are grouped by checkpoint directory, in no particular numeric order.
# Some directories list two sample dumps per task (2025-12-29 and 2026-01-07 timestamps).
performance_plot.png filter=lfs diff=lfs merge=lfs -text
# --- llama32-1b-hf ---
llama32-1b-hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
llama32-1b-hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__llama32-1b-hf/samples_gsm8k_2025-12-29T05-09-52.015180.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 6000_hf ---
6000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
6000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__6000_hf/samples_gsm8k_2026-01-07T06-57-48.977156.jsonl filter=lfs diff=lfs merge=lfs -text
6000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__6000_hf/samples_hellaswag_2026-01-07T03-53-49.653886.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 9000_hf ---
9000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
9000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__9000_hf/samples_gsm8k_2026-01-07T07-00-26.302516.jsonl filter=lfs diff=lfs merge=lfs -text
9000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__9000_hf/samples_hellaswag_2026-01-07T03-49-27.696211.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 3000_hf ---
3000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
3000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__3000_hf/samples_gsm8k_2026-01-07T07-15-16.192705.jsonl filter=lfs diff=lfs merge=lfs -text
3000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__3000_hf/samples_gsm8k_2025-12-29T05-42-31.325047.jsonl filter=lfs diff=lfs merge=lfs -text
3000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__3000_hf/samples_hellaswag_2026-01-07T03-56-25.245340.jsonl filter=lfs diff=lfs merge=lfs -text
3000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__3000_hf/samples_hellaswag_2025-12-29T05-34-35.086951.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 7000_hf ---
7000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
7000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__7000_hf/samples_gsm8k_2026-01-07T07-00-36.377222.jsonl filter=lfs diff=lfs merge=lfs -text
7000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__7000_hf/samples_hellaswag_2026-01-07T03-51-33.637505.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 2000_hf ---
2000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
2000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__2000_hf/samples_gsm8k_2026-01-07T07-11-28.243760.jsonl filter=lfs diff=lfs merge=lfs -text
2000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__2000_hf/samples_gsm8k_2025-12-29T05-42-21.185272.jsonl filter=lfs diff=lfs merge=lfs -text
2000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__2000_hf/samples_hellaswag_2026-01-07T03-51-34.536241.jsonl filter=lfs diff=lfs merge=lfs -text
2000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__2000_hf/samples_hellaswag_2025-12-29T05-34-34.282648.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 12000_hf ---
12000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
12000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__12000_hf/samples_gsm8k_2026-01-07T07-12-50.487181.jsonl filter=lfs diff=lfs merge=lfs -text
12000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__12000_hf/samples_hellaswag_2026-01-07T03-56-25.498160.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 8000_hf ---
8000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
8000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__8000_hf/samples_gsm8k_2026-01-07T07-00-06.652270.jsonl filter=lfs diff=lfs merge=lfs -text
8000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__8000_hf/samples_hellaswag_2026-01-07T03-53-44.066877.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 11000_hf ---
11000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
11000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__11000_hf/samples_gsm8k_2026-01-07T07-13-06.183388.jsonl filter=lfs diff=lfs merge=lfs -text
11000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__11000_hf/samples_hellaswag_2026-01-07T03-51-33.854124.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 1000_hf ---
1000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__1000_hf/samples_gsm8k_2025-12-29T05-42-28.885838.jsonl filter=lfs diff=lfs merge=lfs -text
1000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__1000_hf/samples_gsm8k_2026-01-07T07-13-27.882882.jsonl filter=lfs diff=lfs merge=lfs -text
1000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__1000_hf/samples_hellaswag_2026-01-07T03-57-52.654434.jsonl filter=lfs diff=lfs merge=lfs -text
1000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__1000_hf/samples_hellaswag_2025-12-29T05-34-34.847641.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 4000_hf ---
4000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
4000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__4000_hf/samples_gsm8k_2026-01-07T06-59-35.025159.jsonl filter=lfs diff=lfs merge=lfs -text
4000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__4000_hf/samples_gsm8k_2025-12-29T05-42-32.998053.jsonl filter=lfs diff=lfs merge=lfs -text
4000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__4000_hf/samples_hellaswag_2025-12-29T05-33-51.606131.jsonl filter=lfs diff=lfs merge=lfs -text
4000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__4000_hf/samples_hellaswag_2026-01-07T03-56-26.179191.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 2500_hf ---
2500_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
2500_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__2500_hf/samples_gsm8k_2025-12-29T05-42-37.282529.jsonl filter=lfs diff=lfs merge=lfs -text
2500_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__2500_hf/samples_gsm8k_2026-01-07T07-15-20.052939.jsonl filter=lfs diff=lfs merge=lfs -text
2500_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__2500_hf/samples_hellaswag_2026-01-07T03-51-34.430609.jsonl filter=lfs diff=lfs merge=lfs -text
2500_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__2500_hf/samples_hellaswag_2025-12-29T05-34-34.570482.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 10000_hf ---
10000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
10000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__10000_hf/samples_gsm8k_2026-01-07T07-13-00.293068.jsonl filter=lfs diff=lfs merge=lfs -text
10000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__10000_hf/samples_hellaswag_2026-01-07T03-56-14.560763.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 12500_hf ---
12500_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
12500_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__12500_hf/samples_gsm8k_2026-01-07T07-12-17.705915.jsonl filter=lfs diff=lfs merge=lfs -text
12500_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__12500_hf/samples_hellaswag_2026-01-07T03-51-35.016035.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 5000_hf ---
5000_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
5000_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__5000_hf/samples_gsm8k_2026-01-07T06-58-05.968321.jsonl filter=lfs diff=lfs merge=lfs -text
5000_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__5000_hf/samples_hellaswag_2026-01-07T03-53-49.355990.jsonl filter=lfs diff=lfs merge=lfs -text
# --- 7500_hf ---
7500_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
7500_hf/harness_eval_8shot/__home__aiops__zhuty__nanotron__checkpoints__7500_hf/samples_gsm8k_2026-01-07T07-00-15.435455.jsonl filter=lfs diff=lfs merge=lfs -text
7500_hf/harness_eval_0shot/__home__aiops__zhuty__nanotron__checkpoints__7500_hf/samples_hellaswag_2026-01-07T03-51-34.104451.jsonl filter=lfs diff=lfs merge=lfs -text