| { | |
| "best_metric": 0.8596623807901907, | |
| "best_model_checkpoint": "./save_models/mrpc/roberta-base_lr5e-05_run0/checkpoint-1449", | |
| "epoch": 10.0, | |
| "eval_steps": 500, | |
| "global_step": 2070, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.8010899182561307, | |
| "eval_averaged_scores": 0.8262068735883505, | |
| "eval_f1": 0.8513238289205703, | |
| "eval_loss": 0.4088594615459442, | |
| "eval_runtime": 0.8357, | |
| "eval_samples_per_second": 439.143, | |
| "eval_steps_per_second": 27.521, | |
| "step": 207 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.7602179836512262, | |
| "eval_averaged_scores": 0.781009892726514, | |
| "eval_f1": 0.8018018018018018, | |
| "eval_loss": 0.4726070165634155, | |
| "eval_runtime": 0.4955, | |
| "eval_samples_per_second": 740.675, | |
| "eval_steps_per_second": 46.418, | |
| "step": 414 | |
| }, | |
| { | |
| "epoch": 2.42, | |
| "learning_rate": 4.0359897172236504e-05, | |
| "loss": 0.4481, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.8283378746594006, | |
| "eval_averaged_scores": 0.8527654285577706, | |
| "eval_f1": 0.8771929824561405, | |
| "eval_loss": 0.46944934129714966, | |
| "eval_runtime": 0.4861, | |
| "eval_samples_per_second": 754.978, | |
| "eval_steps_per_second": 47.315, | |
| "step": 621 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.8365122615803815, | |
| "eval_averaged_scores": 0.8587323212663813, | |
| "eval_f1": 0.880952380952381, | |
| "eval_loss": 0.716332197189331, | |
| "eval_runtime": 0.4857, | |
| "eval_samples_per_second": 755.614, | |
| "eval_steps_per_second": 47.355, | |
| "step": 828 | |
| }, | |
| { | |
| "epoch": 4.83, | |
| "learning_rate": 2.750642673521851e-05, | |
| "loss": 0.2017, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.8283378746594006, | |
| "eval_averaged_scores": 0.8510426848246903, | |
| "eval_f1": 0.87374749498998, | |
| "eval_loss": 0.9263336658477783, | |
| "eval_runtime": 0.4853, | |
| "eval_samples_per_second": 756.307, | |
| "eval_steps_per_second": 47.398, | |
| "step": 1035 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.8283378746594006, | |
| "eval_averaged_scores": 0.8510426848246903, | |
| "eval_f1": 0.87374749498998, | |
| "eval_loss": 1.0142543315887451, | |
| "eval_runtime": 0.4866, | |
| "eval_samples_per_second": 754.169, | |
| "eval_steps_per_second": 47.264, | |
| "step": 1242 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.8365122615803815, | |
| "eval_averaged_scores": 0.8596623807901907, | |
| "eval_f1": 0.8828125, | |
| "eval_loss": 1.0171551704406738, | |
| "eval_runtime": 0.4871, | |
| "eval_samples_per_second": 753.373, | |
| "eval_steps_per_second": 47.214, | |
| "step": 1449 | |
| }, | |
| { | |
| "epoch": 7.25, | |
| "learning_rate": 1.4652956298200515e-05, | |
| "loss": 0.0593, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.8337874659400545, | |
| "eval_averaged_scores": 0.8557714884810492, | |
| "eval_f1": 0.8777555110220441, | |
| "eval_loss": 1.0489568710327148, | |
| "eval_runtime": 0.4847, | |
| "eval_samples_per_second": 757.236, | |
| "eval_steps_per_second": 47.456, | |
| "step": 1656 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.8337874659400545, | |
| "eval_averaged_scores": 0.8569723184317168, | |
| "eval_f1": 0.8801571709233792, | |
| "eval_loss": 1.2099965810775757, | |
| "eval_runtime": 0.4891, | |
| "eval_samples_per_second": 750.402, | |
| "eval_steps_per_second": 47.028, | |
| "step": 1863 | |
| }, | |
| { | |
| "epoch": 9.66, | |
| "learning_rate": 1.7994858611825194e-06, | |
| "loss": 0.0183, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.8310626702997275, | |
| "eval_averaged_scores": 0.8542665130154764, | |
| "eval_f1": 0.8774703557312253, | |
| "eval_loss": 1.2079670429229736, | |
| "eval_runtime": 0.4843, | |
| "eval_samples_per_second": 757.767, | |
| "eval_steps_per_second": 47.489, | |
| "step": 2070 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "step": 2070, | |
| "total_flos": 1295111753354040.0, | |
| "train_loss": 0.17568344080523737, | |
| "train_runtime": 279.1119, | |
| "train_samples_per_second": 118.268, | |
| "train_steps_per_second": 7.416 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 2070, | |
| "num_train_epochs": 10, | |
| "save_steps": 500, | |
| "total_flos": 1295111753354040.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |