{ "best_metric": 0.8897058823529411, "best_model_checkpoint": "./bert-base-uncased/fine_tuned_models/checkpoint-1725", "epoch": 20.0, "global_step": 2300, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 1e-05, "loss": 0.6358, "step": 115 }, { "epoch": 1.0, "eval_accuracy": 0.7009803921568627, "eval_combined_score": 0.7599857450398557, "eval_f1": 0.8189910979228486, "eval_loss": 0.5365363359451294, "eval_runtime": 1.8712, "eval_samples_per_second": 218.045, "eval_steps_per_second": 27.256, "step": 115 }, { "epoch": 2.0, "learning_rate": 2e-05, "loss": 0.4545, "step": 230 }, { "epoch": 2.0, "eval_accuracy": 0.8161764705882353, "eval_combined_score": 0.84750665209541, "eval_f1": 0.8788368336025848, "eval_loss": 0.41578346490859985, "eval_runtime": 1.8846, "eval_samples_per_second": 216.486, "eval_steps_per_second": 27.061, "step": 230 }, { "epoch": 3.0, "learning_rate": 1.888888888888889e-05, "loss": 0.2835, "step": 345 }, { "epoch": 3.0, "eval_accuracy": 0.8823529411764706, "eval_combined_score": 0.8995098039215687, "eval_f1": 0.9166666666666667, "eval_loss": 0.3312576413154602, "eval_runtime": 1.8685, "eval_samples_per_second": 218.351, "eval_steps_per_second": 27.294, "step": 345 }, { "epoch": 4.0, "learning_rate": 1.7777777777777777e-05, "loss": 0.1495, "step": 460 }, { "epoch": 4.0, "eval_accuracy": 0.8725490196078431, "eval_combined_score": 0.891446923597025, "eval_f1": 0.9103448275862069, "eval_loss": 0.4420200288295746, "eval_runtime": 1.8756, "eval_samples_per_second": 217.526, "eval_steps_per_second": 27.191, "step": 460 }, { "epoch": 5.0, "learning_rate": 1.6666666666666667e-05, "loss": 0.103, "step": 575 }, { "epoch": 5.0, "eval_accuracy": 0.8676470588235294, "eval_combined_score": 0.8840080312567832, "eval_f1": 0.9003690036900369, "eval_loss": 0.5437020063400269, "eval_runtime": 1.8749, "eval_samples_per_second": 217.61, "eval_steps_per_second": 27.201, "step": 575 }, { "epoch": 6.0, "learning_rate": 1.555555555555556e-05, "loss": 0.0683, "step": 690 }, { "epoch": 6.0, "eval_accuracy": 0.8627450980392157, "eval_combined_score": 0.8835909790537375, "eval_f1": 0.9044368600682594, "eval_loss": 0.6472938656806946, "eval_runtime": 1.8885, "eval_samples_per_second": 216.048, "eval_steps_per_second": 27.006, "step": 690 }, { "epoch": 7.0, "learning_rate": 1.4444444444444446e-05, "loss": 0.053, "step": 805 }, { "epoch": 7.0, "eval_accuracy": 0.8676470588235294, "eval_combined_score": 0.8877484440875327, "eval_f1": 0.9078498293515359, "eval_loss": 0.5814068913459778, "eval_runtime": 1.8738, "eval_samples_per_second": 217.736, "eval_steps_per_second": 27.217, "step": 805 }, { "epoch": 8.0, "learning_rate": 1.3333333333333333e-05, "loss": 0.0292, "step": 920 }, { "epoch": 8.0, "eval_accuracy": 0.8578431372549019, "eval_combined_score": 0.880426585349859, "eval_f1": 0.903010033444816, "eval_loss": 0.7452187538146973, "eval_runtime": 1.8877, "eval_samples_per_second": 216.139, "eval_steps_per_second": 27.017, "step": 920 }, { "epoch": 9.0, "learning_rate": 1.2222222222222224e-05, "loss": 0.0212, "step": 1035 }, { "epoch": 9.0, "eval_accuracy": 0.8774509803921569, "eval_combined_score": 0.8951714832274373, "eval_f1": 0.9128919860627178, "eval_loss": 0.683774471282959, "eval_runtime": 1.8947, "eval_samples_per_second": 215.341, "eval_steps_per_second": 26.918, "step": 1035 }, { "epoch": 10.0, "learning_rate": 1.1111111111111113e-05, "loss": 0.0103, "step": 1150 }, { "epoch": 10.0, "eval_accuracy": 0.8602941176470589, "eval_combined_score": 0.8814291101055808, "eval_f1": 0.9025641025641027, "eval_loss": 0.789932906627655, "eval_runtime": 1.8751, "eval_samples_per_second": 217.593, "eval_steps_per_second": 27.199, "step": 1150 }, { "epoch": 11.0, "learning_rate": 1e-05, "loss": 0.0153, "step": 1265 }, { "epoch": 11.0, "eval_accuracy": 0.8676470588235294, "eval_combined_score": 0.8859511889862328, "eval_f1": 0.9042553191489361, "eval_loss": 0.7904257774353027, "eval_runtime": 1.8798, "eval_samples_per_second": 217.048, "eval_steps_per_second": 27.131, "step": 1265 }, { "epoch": 12.0, "learning_rate": 8.888888888888888e-06, "loss": 0.0136, "step": 1380 }, { "epoch": 12.0, "eval_accuracy": 0.8799019607843137, "eval_combined_score": 0.8980706385118149, "eval_f1": 0.9162393162393162, "eval_loss": 0.6983678340911865, "eval_runtime": 1.8896, "eval_samples_per_second": 215.921, "eval_steps_per_second": 26.99, "step": 1380 }, { "epoch": 13.0, "learning_rate": 7.77777777777778e-06, "loss": 0.0083, "step": 1495 }, { "epoch": 13.0, "eval_accuracy": 0.8823529411764706, "eval_combined_score": 0.9002208391889179, "eval_f1": 0.9180887372013652, "eval_loss": 0.7833622097969055, "eval_runtime": 1.8915, "eval_samples_per_second": 215.705, "eval_steps_per_second": 26.963, "step": 1495 }, { "epoch": 14.0, "learning_rate": 6.666666666666667e-06, "loss": 0.0078, "step": 1610 }, { "epoch": 14.0, "eval_accuracy": 0.875, "eval_combined_score": 0.8939102564102563, "eval_f1": 0.9128205128205128, "eval_loss": 0.8284361362457275, "eval_runtime": 1.8794, "eval_samples_per_second": 217.087, "eval_steps_per_second": 27.136, "step": 1610 }, { "epoch": 15.0, "learning_rate": 5.555555555555557e-06, "loss": 0.0065, "step": 1725 }, { "epoch": 15.0, "eval_accuracy": 0.8897058823529411, "eval_combined_score": 0.9062594591867621, "eval_f1": 0.9228130360205832, "eval_loss": 0.802143931388855, "eval_runtime": 1.8792, "eval_samples_per_second": 217.111, "eval_steps_per_second": 27.139, "step": 1725 }, { "epoch": 16.0, "learning_rate": 4.444444444444444e-06, "loss": 0.0046, "step": 1840 }, { "epoch": 16.0, "eval_accuracy": 0.8725490196078431, "eval_combined_score": 0.8922067131937521, "eval_f1": 0.9118644067796611, "eval_loss": 0.890489399433136, "eval_runtime": 1.8786, "eval_samples_per_second": 217.185, "eval_steps_per_second": 27.148, "step": 1840 }, { "epoch": 17.0, "learning_rate": 3.3333333333333333e-06, "loss": 0.005, "step": 1955 }, { "epoch": 17.0, "eval_accuracy": 0.875, "eval_combined_score": 0.8931521739130435, "eval_f1": 0.9113043478260869, "eval_loss": 0.8655802607536316, "eval_runtime": 1.8821, "eval_samples_per_second": 216.775, "eval_steps_per_second": 27.097, "step": 1955 }, { "epoch": 18.0, "learning_rate": 2.222222222222222e-06, "loss": 0.004, "step": 2070 }, { "epoch": 18.0, "eval_accuracy": 0.8700980392156863, "eval_combined_score": 0.889280453113888, "eval_f1": 0.9084628670120898, "eval_loss": 0.9055202007293701, "eval_runtime": 1.8752, "eval_samples_per_second": 217.58, "eval_steps_per_second": 27.198, "step": 2070 }, { "epoch": 19.0, "learning_rate": 1.111111111111111e-06, "loss": 0.0019, "step": 2185 }, { "epoch": 19.0, "eval_accuracy": 0.8725490196078431, "eval_combined_score": 0.8911356209150327, "eval_f1": 0.9097222222222222, "eval_loss": 0.9129809141159058, "eval_runtime": 1.8883, "eval_samples_per_second": 216.063, "eval_steps_per_second": 27.008, "step": 2185 }, { "epoch": 20.0, "learning_rate": 0.0, "loss": 0.0008, "step": 2300 }, { "epoch": 20.0, "eval_accuracy": 0.8725490196078431, "eval_combined_score": 0.8916009702850212, "eval_f1": 0.9106529209621993, "eval_loss": 0.9021580815315247, "eval_runtime": 1.8731, "eval_samples_per_second": 217.821, "eval_steps_per_second": 27.228, "step": 2300 }, { "epoch": 20.0, "step": 2300, "total_flos": 4825456755302400.0, "train_loss": 0.09379986195784548, "train_runtime": 1024.4983, "train_samples_per_second": 71.606, "train_steps_per_second": 2.245 } ], "max_steps": 2300, "num_train_epochs": 20, "total_flos": 4825456755302400.0, "trial_name": null, "trial_params": null }