{ "best_metric": null, "best_model_checkpoint": null, "epoch": 18.06451612903226, "global_step": 140, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.9, "eval_accuracy": 0.7258883248730964, "eval_f1": 0.0, "eval_loss": 1.5211623907089233, "eval_precision": 0.0, "eval_recall": 0.0, "eval_runtime": 0.0934, "eval_samples_per_second": 85.695, "eval_steps_per_second": 10.712, "step": 7 }, { "epoch": 1.94, "eval_accuracy": 0.7326565143824028, "eval_f1": 0.0, "eval_loss": 1.0808664560317993, "eval_precision": 0.0, "eval_recall": 0.0, "eval_runtime": 0.075, "eval_samples_per_second": 106.603, "eval_steps_per_second": 13.325, "step": 15 }, { "epoch": 2.97, "eval_accuracy": 0.7681895093062606, "eval_f1": 0.17142857142857143, "eval_loss": 0.902431309223175, "eval_precision": 0.2, "eval_recall": 0.15, "eval_runtime": 0.0865, "eval_samples_per_second": 92.481, "eval_steps_per_second": 11.56, "step": 23 }, { "epoch": 4.0, "eval_accuracy": 0.7969543147208121, "eval_f1": 0.2518518518518518, "eval_loss": 0.7922185063362122, "eval_precision": 0.22666666666666666, "eval_recall": 0.2833333333333333, "eval_runtime": 0.0722, "eval_samples_per_second": 110.797, "eval_steps_per_second": 13.85, "step": 31 }, { "epoch": 4.9, "eval_accuracy": 0.8155668358714044, "eval_f1": 0.32876712328767127, "eval_loss": 0.7233745455741882, "eval_precision": 0.27906976744186046, "eval_recall": 0.4, "eval_runtime": 0.0672, "eval_samples_per_second": 118.965, "eval_steps_per_second": 14.871, "step": 38 }, { "epoch": 5.94, "eval_accuracy": 0.8358714043993232, "eval_f1": 0.4305555555555556, "eval_loss": 0.6560729146003723, "eval_precision": 0.36904761904761907, "eval_recall": 0.5166666666666667, "eval_runtime": 0.0878, "eval_samples_per_second": 91.083, "eval_steps_per_second": 11.385, "step": 46 }, { "epoch": 6.97, "eval_accuracy": 0.8443316412859561, "eval_f1": 0.4347826086956522, "eval_loss": 0.626990795135498, "eval_precision": 0.38461538461538464, "eval_recall": 0.5, "eval_runtime": 0.0846, "eval_samples_per_second": 94.599, "eval_steps_per_second": 11.825, "step": 54 }, { "epoch": 8.0, "eval_accuracy": 0.8494077834179357, "eval_f1": 0.48951048951048953, "eval_loss": 0.5750179886817932, "eval_precision": 0.42168674698795183, "eval_recall": 0.5833333333333334, "eval_runtime": 0.0711, "eval_samples_per_second": 112.546, "eval_steps_per_second": 14.068, "step": 62 }, { "epoch": 8.9, "eval_accuracy": 0.8595600676818951, "eval_f1": 0.5109489051094891, "eval_loss": 0.5483719110488892, "eval_precision": 0.45454545454545453, "eval_recall": 0.5833333333333334, "eval_runtime": 0.104, "eval_samples_per_second": 76.947, "eval_steps_per_second": 9.618, "step": 69 }, { "epoch": 9.94, "eval_accuracy": 0.8629441624365483, "eval_f1": 0.5285714285714286, "eval_loss": 0.5253370404243469, "eval_precision": 0.4625, "eval_recall": 0.6166666666666667, "eval_runtime": 0.0872, "eval_samples_per_second": 91.721, "eval_steps_per_second": 11.465, "step": 77 }, { "epoch": 10.97, "eval_accuracy": 0.868020304568528, "eval_f1": 0.5179856115107914, "eval_loss": 0.5097917914390564, "eval_precision": 0.45569620253164556, "eval_recall": 0.6, "eval_runtime": 0.0862, "eval_samples_per_second": 92.832, "eval_steps_per_second": 11.604, "step": 85 }, { "epoch": 12.0, "eval_accuracy": 0.8781725888324873, "eval_f1": 0.5547445255474452, "eval_loss": 0.49227389693260193, "eval_precision": 0.4935064935064935, "eval_recall": 0.6333333333333333, "eval_runtime": 0.0683, "eval_samples_per_second": 117.18, "eval_steps_per_second": 14.647, "step": 93 }, { "epoch": 12.9, "eval_accuracy": 0.868020304568528, "eval_f1": 0.5294117647058824, "eval_loss": 0.49868977069854736, "eval_precision": 0.47368421052631576, "eval_recall": 0.6, "eval_runtime": 0.0863, "eval_samples_per_second": 92.658, "eval_steps_per_second": 11.582, "step": 100 }, { "epoch": 13.94, "eval_accuracy": 0.871404399323181, "eval_f1": 0.5652173913043479, "eval_loss": 0.5003769397735596, "eval_precision": 0.5, "eval_recall": 0.65, "eval_runtime": 0.0861, "eval_samples_per_second": 92.934, "eval_steps_per_second": 11.617, "step": 108 }, { "epoch": 14.97, "eval_accuracy": 0.8815566835871405, "eval_f1": 0.5588235294117647, "eval_loss": 0.48066699504852295, "eval_precision": 0.5, "eval_recall": 0.6333333333333333, "eval_runtime": 0.073, "eval_samples_per_second": 109.637, "eval_steps_per_second": 13.705, "step": 116 }, { "epoch": 16.0, "eval_accuracy": 0.8798646362098139, "eval_f1": 0.5481481481481482, "eval_loss": 0.48719707131385803, "eval_precision": 0.49333333333333335, "eval_recall": 0.6166666666666667, "eval_runtime": 0.0729, "eval_samples_per_second": 109.707, "eval_steps_per_second": 13.713, "step": 124 }, { "epoch": 16.9, "eval_accuracy": 0.8866328257191202, "eval_f1": 0.6029411764705882, "eval_loss": 0.48052239418029785, "eval_precision": 0.5394736842105263, "eval_recall": 0.6833333333333333, "eval_runtime": 0.0836, "eval_samples_per_second": 95.684, "eval_steps_per_second": 11.96, "step": 131 }, { "epoch": 17.94, "eval_accuracy": 0.8866328257191202, "eval_f1": 0.5882352941176471, "eval_loss": 0.48192963004112244, "eval_precision": 0.5263157894736842, "eval_recall": 0.6666666666666666, "eval_runtime": 0.0874, "eval_samples_per_second": 91.531, "eval_steps_per_second": 11.441, "step": 139 }, { "epoch": 18.06, "eval_accuracy": 0.8866328257191202, "eval_f1": 0.5882352941176471, "eval_loss": 0.48198172450065613, "eval_precision": 0.5263157894736842, "eval_recall": 0.6666666666666666, "eval_runtime": 0.0703, "eval_samples_per_second": 113.867, "eval_steps_per_second": 14.233, "step": 140 }, { "epoch": 18.06, "step": 140, "total_flos": 142825785914880.0, "train_loss": 0.5361384800502232, "train_runtime": 994.5385, "train_samples_per_second": 2.433, "train_steps_per_second": 0.141 } ], "max_steps": 140, "num_train_epochs": 20, "total_flos": 142825785914880.0, "trial_name": null, "trial_params": null }