{ "best_metric": 0.8596623807901907, "best_model_checkpoint": "./save_models/mrpc/roberta-base_lr5e-05_run0/checkpoint-1449", "epoch": 10.0, "eval_steps": 500, "global_step": 2070, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.8010899182561307, "eval_averaged_scores": 0.8262068735883505, "eval_f1": 0.8513238289205703, "eval_loss": 0.4088594615459442, "eval_runtime": 0.8357, "eval_samples_per_second": 439.143, "eval_steps_per_second": 27.521, "step": 207 }, { "epoch": 2.0, "eval_accuracy": 0.7602179836512262, "eval_averaged_scores": 0.781009892726514, "eval_f1": 0.8018018018018018, "eval_loss": 0.4726070165634155, "eval_runtime": 0.4955, "eval_samples_per_second": 740.675, "eval_steps_per_second": 46.418, "step": 414 }, { "epoch": 2.42, "learning_rate": 4.0359897172236504e-05, "loss": 0.4481, "step": 500 }, { "epoch": 3.0, "eval_accuracy": 0.8283378746594006, "eval_averaged_scores": 0.8527654285577706, "eval_f1": 0.8771929824561405, "eval_loss": 0.46944934129714966, "eval_runtime": 0.4861, "eval_samples_per_second": 754.978, "eval_steps_per_second": 47.315, "step": 621 }, { "epoch": 4.0, "eval_accuracy": 0.8365122615803815, "eval_averaged_scores": 0.8587323212663813, "eval_f1": 0.880952380952381, "eval_loss": 0.716332197189331, "eval_runtime": 0.4857, "eval_samples_per_second": 755.614, "eval_steps_per_second": 47.355, "step": 828 }, { "epoch": 4.83, "learning_rate": 2.750642673521851e-05, "loss": 0.2017, "step": 1000 }, { "epoch": 5.0, "eval_accuracy": 0.8283378746594006, "eval_averaged_scores": 0.8510426848246903, "eval_f1": 0.87374749498998, "eval_loss": 0.9263336658477783, "eval_runtime": 0.4853, "eval_samples_per_second": 756.307, "eval_steps_per_second": 47.398, "step": 1035 }, { "epoch": 6.0, "eval_accuracy": 0.8283378746594006, "eval_averaged_scores": 0.8510426848246903, "eval_f1": 0.87374749498998, "eval_loss": 1.0142543315887451, "eval_runtime": 0.4866, "eval_samples_per_second": 754.169, "eval_steps_per_second": 47.264, "step": 1242 }, { "epoch": 7.0, "eval_accuracy": 0.8365122615803815, "eval_averaged_scores": 0.8596623807901907, "eval_f1": 0.8828125, "eval_loss": 1.0171551704406738, "eval_runtime": 0.4871, "eval_samples_per_second": 753.373, "eval_steps_per_second": 47.214, "step": 1449 }, { "epoch": 7.25, "learning_rate": 1.4652956298200515e-05, "loss": 0.0593, "step": 1500 }, { "epoch": 8.0, "eval_accuracy": 0.8337874659400545, "eval_averaged_scores": 0.8557714884810492, "eval_f1": 0.8777555110220441, "eval_loss": 1.0489568710327148, "eval_runtime": 0.4847, "eval_samples_per_second": 757.236, "eval_steps_per_second": 47.456, "step": 1656 }, { "epoch": 9.0, "eval_accuracy": 0.8337874659400545, "eval_averaged_scores": 0.8569723184317168, "eval_f1": 0.8801571709233792, "eval_loss": 1.2099965810775757, "eval_runtime": 0.4891, "eval_samples_per_second": 750.402, "eval_steps_per_second": 47.028, "step": 1863 }, { "epoch": 9.66, "learning_rate": 1.7994858611825194e-06, "loss": 0.0183, "step": 2000 }, { "epoch": 10.0, "eval_accuracy": 0.8310626702997275, "eval_averaged_scores": 0.8542665130154764, "eval_f1": 0.8774703557312253, "eval_loss": 1.2079670429229736, "eval_runtime": 0.4843, "eval_samples_per_second": 757.767, "eval_steps_per_second": 47.489, "step": 2070 }, { "epoch": 10.0, "step": 2070, "total_flos": 1295111753354040.0, "train_loss": 0.17568344080523737, "train_runtime": 279.1119, "train_samples_per_second": 118.268, "train_steps_per_second": 7.416 } ], "logging_steps": 500, "max_steps": 2070, "num_train_epochs": 10, "save_steps": 500, "total_flos": 1295111753354040.0, "trial_name": null, "trial_params": null }