| { | |
| "dataset": "3b_val", | |
| "data_file": "data/3b_val.bin", | |
| "total_tokens": 75681623, | |
| "eval_tokens": 44965267, | |
| "max_tokens_used": 15000000, | |
| "perplexity": 5.709, | |
| "bits_per_token": 2.5132, | |
| "avg_nll": 1.742047, | |
| "elapsed_sec": 712.0, | |
| "config": { | |
| "seq_len": 2048, | |
| "stride": 512, | |
| "batch_size": 32, | |
| "dtype": "bfloat16" | |
| } | |
| } |