{ "best_metric": null, "best_model_checkpoint": null, "epoch": 12.755102040816327, "global_step": 2500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.9972193373312339, "eval_f1": 0.8363636363636364, "eval_loss": 0.010604099370539188, "eval_precision": 0.8273381294964028, "eval_recall": 0.8455882352941176, "eval_runtime": 2.6817, "eval_samples_per_second": 54.816, "eval_steps_per_second": 18.272, "step": 196 }, { "epoch": 2.0, "eval_accuracy": 0.9978223726087976, "eval_f1": 0.855072463768116, "eval_loss": 0.008987429551780224, "eval_precision": 0.8428571428571429, "eval_recall": 0.8676470588235294, "eval_runtime": 2.5934, "eval_samples_per_second": 56.681, "eval_steps_per_second": 18.894, "step": 392 }, { "epoch": 2.55, "learning_rate": 4.149659863945579e-05, "loss": 0.0231, "step": 500 }, { "epoch": 3.0, "eval_accuracy": 0.997688364769339, "eval_f1": 0.8794326241134752, "eval_loss": 0.009632805362343788, "eval_precision": 0.8493150684931506, "eval_recall": 0.9117647058823529, "eval_runtime": 2.5938, "eval_samples_per_second": 56.673, "eval_steps_per_second": 18.891, "step": 588 }, { "epoch": 4.0, "eval_accuracy": 0.9980903882877148, "eval_f1": 0.8897058823529411, "eval_loss": 0.01180042140185833, "eval_precision": 0.8897058823529411, "eval_recall": 0.8897058823529411, "eval_runtime": 2.6016, "eval_samples_per_second": 56.505, "eval_steps_per_second": 18.835, "step": 784 }, { "epoch": 5.0, "eval_accuracy": 0.9981908941673088, "eval_f1": 0.9018181818181817, "eval_loss": 0.010586733929812908, "eval_precision": 0.8920863309352518, "eval_recall": 0.9117647058823529, "eval_runtime": 2.5999, "eval_samples_per_second": 56.54, "eval_steps_per_second": 18.847, "step": 980 }, { "epoch": 5.1, "learning_rate": 3.2993197278911564e-05, "loss": 0.0019, "step": 1000 }, { "epoch": 6.0, "eval_accuracy": 0.998458909846226, "eval_f1": 0.9157509157509157, "eval_loss": 0.01237014215439558, "eval_precision": 0.9124087591240876, "eval_recall": 0.9191176470588235, "eval_runtime": 2.6016, "eval_samples_per_second": 56.503, "eval_steps_per_second": 18.834, "step": 1176 }, { "epoch": 7.0, "eval_accuracy": 0.998358403966632, "eval_f1": 0.8978102189781022, "eval_loss": 0.012939131818711758, "eval_precision": 0.8913043478260869, "eval_recall": 0.9044117647058824, "eval_runtime": 2.5832, "eval_samples_per_second": 56.905, "eval_steps_per_second": 18.968, "step": 1372 }, { "epoch": 7.65, "learning_rate": 2.448979591836735e-05, "loss": 0.0006, "step": 1500 }, { "epoch": 8.0, "eval_accuracy": 0.9984254078863614, "eval_f1": 0.9191176470588235, "eval_loss": 0.012535096146166325, "eval_precision": 0.9191176470588235, "eval_recall": 0.9191176470588235, "eval_runtime": 2.6125, "eval_samples_per_second": 56.268, "eval_steps_per_second": 18.756, "step": 1568 }, { "epoch": 9.0, "eval_accuracy": 0.998358403966632, "eval_f1": 0.9010989010989011, "eval_loss": 0.013671106658875942, "eval_precision": 0.8978102189781022, "eval_recall": 0.9044117647058824, "eval_runtime": 2.6138, "eval_samples_per_second": 56.239, "eval_steps_per_second": 18.746, "step": 1764 }, { "epoch": 10.0, "eval_accuracy": 0.9983919059264967, "eval_f1": 0.9117647058823528, "eval_loss": 0.014087404124438763, "eval_precision": 0.9117647058823529, "eval_recall": 0.9117647058823529, "eval_runtime": 2.6236, "eval_samples_per_second": 56.03, "eval_steps_per_second": 18.677, "step": 1960 }, { "epoch": 10.2, "learning_rate": 1.5986394557823133e-05, "loss": 0.0005, "step": 2000 }, { "epoch": 11.0, "eval_accuracy": 0.9982578980870381, "eval_f1": 0.8929889298892988, "eval_loss": 0.014975562691688538, "eval_precision": 0.8962962962962963, "eval_recall": 0.8897058823529411, "eval_runtime": 2.598, "eval_samples_per_second": 56.581, "eval_steps_per_second": 18.86, "step": 2156 }, { "epoch": 12.0, "eval_accuracy": 0.9981573922074441, "eval_f1": 0.888888888888889, "eval_loss": 0.015556328929960728, "eval_precision": 0.8955223880597015, "eval_recall": 0.8823529411764706, "eval_runtime": 2.5873, "eval_samples_per_second": 56.817, "eval_steps_per_second": 18.939, "step": 2352 }, { "epoch": 12.76, "learning_rate": 7.482993197278912e-06, "loss": 0.0002, "step": 2500 } ], "max_steps": 2940, "num_train_epochs": 15, "total_flos": 1238088268279728.0, "trial_name": null, "trial_params": null }