| { | |
| "best_metric": 0.8970588235294118, | |
| "best_model_checkpoint": "./bert-base-uncased/fine_tuned_models/checkpoint-575", | |
| "epoch": 10.0, | |
| "global_step": 1150, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "learning_rate": 1e-05, | |
| "loss": 0.6336, | |
| "step": 115 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.6838235294117647, | |
| "eval_combined_score": 0.7480253018237863, | |
| "eval_f1": 0.8122270742358079, | |
| "eval_loss": 0.538364589214325, | |
| "eval_runtime": 1.089, | |
| "eval_samples_per_second": 374.663, | |
| "eval_steps_per_second": 46.833, | |
| "step": 115 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "learning_rate": 2e-05, | |
| "loss": 0.482, | |
| "step": 230 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.8357843137254902, | |
| "eval_combined_score": 0.8625202560362988, | |
| "eval_f1": 0.8892561983471075, | |
| "eval_loss": 0.40759965777397156, | |
| "eval_runtime": 1.0806, | |
| "eval_samples_per_second": 377.572, | |
| "eval_steps_per_second": 47.196, | |
| "step": 230 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "learning_rate": 1.7500000000000002e-05, | |
| "loss": 0.3576, | |
| "step": 345 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.875, | |
| "eval_combined_score": 0.8912205081669691, | |
| "eval_f1": 0.9074410163339381, | |
| "eval_loss": 0.2955787181854248, | |
| "eval_runtime": 1.0806, | |
| "eval_samples_per_second": 377.557, | |
| "eval_steps_per_second": 47.195, | |
| "step": 345 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "learning_rate": 1.5000000000000002e-05, | |
| "loss": 0.2205, | |
| "step": 460 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.8921568627450981, | |
| "eval_combined_score": 0.9076168929110106, | |
| "eval_f1": 0.923076923076923, | |
| "eval_loss": 0.3020019829273224, | |
| "eval_runtime": 1.0822, | |
| "eval_samples_per_second": 376.994, | |
| "eval_steps_per_second": 47.124, | |
| "step": 460 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "learning_rate": 1.25e-05, | |
| "loss": 0.1258, | |
| "step": 575 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.8970588235294118, | |
| "eval_combined_score": 0.9106232745805904, | |
| "eval_f1": 0.924187725631769, | |
| "eval_loss": 0.3507114052772522, | |
| "eval_runtime": 1.0903, | |
| "eval_samples_per_second": 374.196, | |
| "eval_steps_per_second": 46.775, | |
| "step": 575 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "learning_rate": 1e-05, | |
| "loss": 0.0893, | |
| "step": 690 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.8848039215686274, | |
| "eval_combined_score": 0.8994403520091766, | |
| "eval_f1": 0.9140767824497258, | |
| "eval_loss": 0.46679043769836426, | |
| "eval_runtime": 1.0897, | |
| "eval_samples_per_second": 374.408, | |
| "eval_steps_per_second": 46.801, | |
| "step": 690 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "learning_rate": 7.500000000000001e-06, | |
| "loss": 0.0635, | |
| "step": 805 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.8921568627450981, | |
| "eval_combined_score": 0.906510086048808, | |
| "eval_f1": 0.9208633093525179, | |
| "eval_loss": 0.5193934440612793, | |
| "eval_runtime": 1.1035, | |
| "eval_samples_per_second": 369.736, | |
| "eval_steps_per_second": 46.217, | |
| "step": 805 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "learning_rate": 5e-06, | |
| "loss": 0.0391, | |
| "step": 920 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.8897058823529411, | |
| "eval_combined_score": 0.9040180954414434, | |
| "eval_f1": 0.9183303085299456, | |
| "eval_loss": 0.642646312713623, | |
| "eval_runtime": 1.0978, | |
| "eval_samples_per_second": 371.638, | |
| "eval_steps_per_second": 46.455, | |
| "step": 920 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "learning_rate": 2.5e-06, | |
| "loss": 0.0294, | |
| "step": 1035 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.8848039215686274, | |
| "eval_combined_score": 0.9003626047914693, | |
| "eval_f1": 0.9159212880143113, | |
| "eval_loss": 0.6596136689186096, | |
| "eval_runtime": 1.1007, | |
| "eval_samples_per_second": 370.671, | |
| "eval_steps_per_second": 46.334, | |
| "step": 1035 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "learning_rate": 0.0, | |
| "loss": 0.0163, | |
| "step": 1150 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.8921568627450981, | |
| "eval_combined_score": 0.9063672400368089, | |
| "eval_f1": 0.9205776173285197, | |
| "eval_loss": 0.6627745628356934, | |
| "eval_runtime": 1.1037, | |
| "eval_samples_per_second": 369.676, | |
| "eval_steps_per_second": 46.209, | |
| "step": 1150 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "step": 1150, | |
| "total_flos": 2412728377651200.0, | |
| "train_loss": 0.20570029414218405, | |
| "train_runtime": 332.3723, | |
| "train_samples_per_second": 110.358, | |
| "train_steps_per_second": 3.46 | |
| } | |
| ], | |
| "max_steps": 1150, | |
| "num_train_epochs": 10, | |
| "total_flos": 2412728377651200.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |