{ "epoch": 20.0, "num_input_tokens_seen": 564096, "total_flos": 2.5450673718951936e+16, "train_loss": 0.018261103643923585, "train_runtime": 415.2132, "train_samples_per_second": 17.34, "train_steps_per_second": 4.335 }