R1-Distill-Llama-8B-SFT-cotroller_dataset-bespoke-17k-llama3-hehe-ta_and_ps-train-v2
/
train_results.json
| { | |
| "epoch": 5.0, | |
| "total_flos": 7.246507712740065e+17, | |
| "train_loss": 0.08232667656972054, | |
| "train_runtime": 8410.3038, | |
| "train_samples": 23594, | |
| "train_samples_per_second": 1.787, | |
| "train_steps_per_second": 0.056 | |
| } |