{ "best_metric": null, "best_model_checkpoint": null, "epoch": 5.0, "global_step": 5860, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.43, "learning_rate": 4.573378839590444e-05, "loss": 0.1236, "step": 500 }, { "epoch": 0.85, "learning_rate": 4.1467576791808876e-05, "loss": 0.0826, "step": 1000 }, { "epoch": 1.0, "eval_accuracy": 0.9701500564728661, "eval_f1": 0.8742703188145488, "eval_loss": 0.07586850225925446, "eval_precision": 0.9289122137404581, "eval_recall": 0.8256997455470738, "eval_runtime": 3.6496, "eval_samples_per_second": 285.24, "eval_steps_per_second": 35.895, "step": 1172 }, { "epoch": 1.28, "learning_rate": 3.720136518771331e-05, "loss": 0.0549, "step": 1500 }, { "epoch": 1.71, "learning_rate": 3.293515358361775e-05, "loss": 0.0457, "step": 2000 }, { "epoch": 2.0, "eval_accuracy": 0.9726241058462862, "eval_f1": 0.8871037776812852, "eval_loss": 0.09076694399118423, "eval_precision": 0.9088078291814946, "eval_recall": 0.8664122137404581, "eval_runtime": 3.5668, "eval_samples_per_second": 291.861, "eval_steps_per_second": 36.728, "step": 2344 }, { "epoch": 2.13, "learning_rate": 2.8668941979522183e-05, "loss": 0.0377, "step": 2500 }, { "epoch": 2.56, "learning_rate": 2.4402730375426623e-05, "loss": 0.0204, "step": 3000 }, { "epoch": 2.99, "learning_rate": 2.013651877133106e-05, "loss": 0.0198, "step": 3500 }, { "epoch": 3.0, "eval_accuracy": 0.9724089711181627, "eval_f1": 0.8868527594289368, "eval_loss": 0.11024652421474457, "eval_precision": 0.891220556745182, "eval_recall": 0.8825275657336726, "eval_runtime": 3.591, "eval_samples_per_second": 289.895, "eval_steps_per_second": 36.481, "step": 3516 }, { "epoch": 3.41, "learning_rate": 1.5870307167235497e-05, "loss": 0.0097, "step": 4000 }, { "epoch": 3.84, "learning_rate": 1.1604095563139932e-05, "loss": 0.0092, "step": 4500 }, { "epoch": 4.0, "eval_accuracy": 0.9726241058462862, "eval_f1": 0.8877923192447972, "eval_loss": 0.13143494725227356, "eval_precision": 0.8983933999131567, "eval_recall": 0.8774385072094996, "eval_runtime": 3.6011, "eval_samples_per_second": 289.076, "eval_steps_per_second": 36.377, "step": 4688 }, { "epoch": 4.27, "learning_rate": 7.337883959044369e-06, "loss": 0.0065, "step": 5000 }, { "epoch": 4.69, "learning_rate": 3.0716723549488057e-06, "loss": 0.0038, "step": 5500 }, { "epoch": 5.0, "eval_accuracy": 0.9724089711181627, "eval_f1": 0.8878464818763325, "eval_loss": 0.1649477779865265, "eval_precision": 0.8927958833619211, "eval_recall": 0.8829516539440203, "eval_runtime": 3.5283, "eval_samples_per_second": 295.043, "eval_steps_per_second": 37.128, "step": 5860 }, { "epoch": 5.0, "step": 5860, "total_flos": 1012549907373102.0, "train_loss": 0.03548831426039491, "train_runtime": 710.9927, "train_samples_per_second": 65.901, "train_steps_per_second": 8.242 } ], "max_steps": 5860, "num_train_epochs": 5, "total_flos": 1012549907373102.0, "trial_name": null, "trial_params": null }