| time,step,epoch,loss,grad_norm,learning_rate,eval_loss,eval_accuracy,eval_f1_macro,eval_runtime,eval_samples_per_second,eval_steps_per_second,train_runtime,train_samples_per_second,train_steps_per_second,total_flos,train_loss | |
| 1772621239.9061947,3594,1.0,0.22125994767755286,6.724055290222168,1.5005564830272678e-05,,,,,,,,,,, | |
| 1772621313.7196841,3594,1.0,,,,0.172308087348938,0.939,0.9385995315324059,73.7663,67.782,2.128,,,,, | |
| 1772622076.1915433,7188,2.0,0.1287970014857662,6.3051323890686035,1.0008347245409015e-05,,,,,,,,,,, | |
| 1772622142.2857678,7188,2.0,,,,0.17122335731983185,0.9456,0.9452690872397813,66.0787,75.667,2.376,,,,, | |
| 1772622925.8879561,10782,3.0,0.08359225723699655,0.1423230767250061,5.008347245409015e-06,,,,,,,,,,, | |
| 1772622993.8675847,10782,3.0,,,,0.19895857572555542,0.9478,0.9473008374036693,67.9671,73.565,2.31,,,,, | |
| 1772623793.07226,14376,4.0,0.05389018369238444,3.4260194301605225,1.1129660545353369e-08,,,,,,,,,,, | |
| 1772623859.575091,14376,4.0,,,,0.23433832824230194,0.946,0.9456142780018644,66.4875,75.202,2.361,,,,, | |
| 1772623863.9921458,14376,4.0,,,,,,,,,,3435.1438,133.91,4.185,2.475637874594976e+16,0.12188484752317502 | |