| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 12.755102040816327, | |
| "global_step": 2500, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.9972193373312339, | |
| "eval_f1": 0.8363636363636364, | |
| "eval_loss": 0.010604099370539188, | |
| "eval_precision": 0.8273381294964028, | |
| "eval_recall": 0.8455882352941176, | |
| "eval_runtime": 2.6817, | |
| "eval_samples_per_second": 54.816, | |
| "eval_steps_per_second": 18.272, | |
| "step": 196 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.9978223726087976, | |
| "eval_f1": 0.855072463768116, | |
| "eval_loss": 0.008987429551780224, | |
| "eval_precision": 0.8428571428571429, | |
| "eval_recall": 0.8676470588235294, | |
| "eval_runtime": 2.5934, | |
| "eval_samples_per_second": 56.681, | |
| "eval_steps_per_second": 18.894, | |
| "step": 392 | |
| }, | |
| { | |
| "epoch": 2.55, | |
| "learning_rate": 4.149659863945579e-05, | |
| "loss": 0.0231, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.997688364769339, | |
| "eval_f1": 0.8794326241134752, | |
| "eval_loss": 0.009632805362343788, | |
| "eval_precision": 0.8493150684931506, | |
| "eval_recall": 0.9117647058823529, | |
| "eval_runtime": 2.5938, | |
| "eval_samples_per_second": 56.673, | |
| "eval_steps_per_second": 18.891, | |
| "step": 588 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.9980903882877148, | |
| "eval_f1": 0.8897058823529411, | |
| "eval_loss": 0.01180042140185833, | |
| "eval_precision": 0.8897058823529411, | |
| "eval_recall": 0.8897058823529411, | |
| "eval_runtime": 2.6016, | |
| "eval_samples_per_second": 56.505, | |
| "eval_steps_per_second": 18.835, | |
| "step": 784 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.9981908941673088, | |
| "eval_f1": 0.9018181818181817, | |
| "eval_loss": 0.010586733929812908, | |
| "eval_precision": 0.8920863309352518, | |
| "eval_recall": 0.9117647058823529, | |
| "eval_runtime": 2.5999, | |
| "eval_samples_per_second": 56.54, | |
| "eval_steps_per_second": 18.847, | |
| "step": 980 | |
| }, | |
| { | |
| "epoch": 5.1, | |
| "learning_rate": 3.2993197278911564e-05, | |
| "loss": 0.0019, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.998458909846226, | |
| "eval_f1": 0.9157509157509157, | |
| "eval_loss": 0.01237014215439558, | |
| "eval_precision": 0.9124087591240876, | |
| "eval_recall": 0.9191176470588235, | |
| "eval_runtime": 2.6016, | |
| "eval_samples_per_second": 56.503, | |
| "eval_steps_per_second": 18.834, | |
| "step": 1176 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.998358403966632, | |
| "eval_f1": 0.8978102189781022, | |
| "eval_loss": 0.012939131818711758, | |
| "eval_precision": 0.8913043478260869, | |
| "eval_recall": 0.9044117647058824, | |
| "eval_runtime": 2.5832, | |
| "eval_samples_per_second": 56.905, | |
| "eval_steps_per_second": 18.968, | |
| "step": 1372 | |
| }, | |
| { | |
| "epoch": 7.65, | |
| "learning_rate": 2.448979591836735e-05, | |
| "loss": 0.0006, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.9984254078863614, | |
| "eval_f1": 0.9191176470588235, | |
| "eval_loss": 0.012535096146166325, | |
| "eval_precision": 0.9191176470588235, | |
| "eval_recall": 0.9191176470588235, | |
| "eval_runtime": 2.6125, | |
| "eval_samples_per_second": 56.268, | |
| "eval_steps_per_second": 18.756, | |
| "step": 1568 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.998358403966632, | |
| "eval_f1": 0.9010989010989011, | |
| "eval_loss": 0.013671106658875942, | |
| "eval_precision": 0.8978102189781022, | |
| "eval_recall": 0.9044117647058824, | |
| "eval_runtime": 2.6138, | |
| "eval_samples_per_second": 56.239, | |
| "eval_steps_per_second": 18.746, | |
| "step": 1764 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.9983919059264967, | |
| "eval_f1": 0.9117647058823528, | |
| "eval_loss": 0.014087404124438763, | |
| "eval_precision": 0.9117647058823529, | |
| "eval_recall": 0.9117647058823529, | |
| "eval_runtime": 2.6236, | |
| "eval_samples_per_second": 56.03, | |
| "eval_steps_per_second": 18.677, | |
| "step": 1960 | |
| }, | |
| { | |
| "epoch": 10.2, | |
| "learning_rate": 1.5986394557823133e-05, | |
| "loss": 0.0005, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_accuracy": 0.9982578980870381, | |
| "eval_f1": 0.8929889298892988, | |
| "eval_loss": 0.014975562691688538, | |
| "eval_precision": 0.8962962962962963, | |
| "eval_recall": 0.8897058823529411, | |
| "eval_runtime": 2.598, | |
| "eval_samples_per_second": 56.581, | |
| "eval_steps_per_second": 18.86, | |
| "step": 2156 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_accuracy": 0.9981573922074441, | |
| "eval_f1": 0.888888888888889, | |
| "eval_loss": 0.015556328929960728, | |
| "eval_precision": 0.8955223880597015, | |
| "eval_recall": 0.8823529411764706, | |
| "eval_runtime": 2.5873, | |
| "eval_samples_per_second": 56.817, | |
| "eval_steps_per_second": 18.939, | |
| "step": 2352 | |
| }, | |
| { | |
| "epoch": 12.76, | |
| "learning_rate": 7.482993197278912e-06, | |
| "loss": 0.0002, | |
| "step": 2500 | |
| } | |
| ], | |
| "max_steps": 2940, | |
| "num_train_epochs": 15, | |
| "total_flos": 1238088268279728.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |