| [ | |
| { | |
| "loss": 0.8685, | |
| "grad_norm": 3.481233835220337, | |
| "learning_rate": 9.900000000000002e-06, | |
| "epoch": 0.7092198581560284, | |
| "step": 100 | |
| }, | |
| { | |
| "eval_loss": 0.2325897216796875, | |
| "eval_accuracy": 0.9201523930470672, | |
| "eval_f1": 0.717974180734856, | |
| "eval_runtime": 3.2063, | |
| "eval_samples_per_second": 174.345, | |
| "eval_steps_per_second": 5.614, | |
| "epoch": 1.0, | |
| "step": 141 | |
| }, | |
| { | |
| "loss": 0.2274, | |
| "grad_norm": 1.5385990142822266, | |
| "learning_rate": 1.9900000000000003e-05, | |
| "epoch": 1.4184397163120568, | |
| "step": 200 | |
| }, | |
| { | |
| "eval_loss": 0.14628532528877258, | |
| "eval_accuracy": 0.9490435748868958, | |
| "eval_f1": 0.8258811152025249, | |
| "eval_runtime": 3.1326, | |
| "eval_samples_per_second": 178.447, | |
| "eval_steps_per_second": 5.746, | |
| "epoch": 2.0, | |
| "step": 282 | |
| }, | |
| { | |
| "loss": 0.1409, | |
| "grad_norm": 1.131034016609192, | |
| "learning_rate": 2.9900000000000002e-05, | |
| "epoch": 2.127659574468085, | |
| "step": 300 | |
| }, | |
| { | |
| "loss": 0.1162, | |
| "grad_norm": 1.4681241512298584, | |
| "learning_rate": 3.99e-05, | |
| "epoch": 2.8368794326241136, | |
| "step": 400 | |
| }, | |
| { | |
| "eval_loss": 0.16565711796283722, | |
| "eval_accuracy": 0.9450750059528534, | |
| "eval_f1": 0.8205513784461153, | |
| "eval_runtime": 3.1398, | |
| "eval_samples_per_second": 178.04, | |
| "eval_steps_per_second": 5.733, | |
| "epoch": 3.0, | |
| "step": 423 | |
| }, | |
| { | |
| "train_runtime": 218.6651, | |
| "train_samples_per_second": 61.491, | |
| "train_steps_per_second": 1.934, | |
| "total_flos": 878380812168192.0, | |
| "train_loss": 0.3254874164049225, | |
| "epoch": 3.0, | |
| "step": 423 | |
| }, | |
| { | |
| "eval_loss": 0.12958413362503052, | |
| "eval_accuracy": 0.9540563620836892, | |
| "eval_f1": 0.8495117748420448, | |
| "eval_runtime": 3.1102, | |
| "eval_samples_per_second": 179.087, | |
| "eval_steps_per_second": 5.787, | |
| "epoch": 3.0, | |
| "step": 423 | |
| } | |
| ] |