{ "best_metric": 0.5371652447937805, "best_model_checkpoint": "../output/roberta-base-sst/checkpoint-900", "epoch": 3.370786516853933, "global_step": 900, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.37, "eval_accuracy": 0.44868301544050865, "eval_f1": 0.40183269902596275, "eval_loss": 1.2189757823944092, "eval_precision": 0.45215636701421513, "eval_recall": 0.4461052071145046, "eval_runtime": 5.4464, "eval_samples_per_second": 202.152, "step": 100 }, { "epoch": 0.75, "eval_accuracy": 0.4713896457765668, "eval_f1": 0.45576264052480686, "eval_loss": 1.1674168109893799, "eval_precision": 0.47342618027935013, "eval_recall": 0.4617929878424363, "eval_runtime": 5.5186, "eval_samples_per_second": 199.508, "step": 200 }, { "epoch": 1.12, "eval_accuracy": 0.48047229791099, "eval_f1": 0.4608418062575635, "eval_loss": 1.208803415298462, "eval_precision": 0.47412277926758095, "eval_recall": 0.49066121993560535, "eval_runtime": 5.5423, "eval_samples_per_second": 198.655, "step": 300 }, { "epoch": 1.5, "eval_accuracy": 0.49954586739327883, "eval_f1": 0.45326478521487196, "eval_loss": 1.203087329864502, "eval_precision": 0.5081235548351334, "eval_recall": 0.48943672347517797, "eval_runtime": 5.5675, "eval_samples_per_second": 197.754, "step": 400 }, { "epoch": 1.87, "learning_rate": 1.250936329588015e-05, "loss": 1.1064, "step": 500 }, { "epoch": 1.87, "eval_accuracy": 0.5313351498637602, "eval_f1": 0.4925849403824431, "eval_loss": 1.1195186376571655, "eval_precision": 0.5255318894371125, "eval_recall": 0.5062241091371705, "eval_runtime": 5.5664, "eval_samples_per_second": 197.795, "step": 500 }, { "epoch": 2.25, "eval_accuracy": 0.5277020890099909, "eval_f1": 0.5219048999186475, "eval_loss": 1.1405118703842163, "eval_precision": 0.5220602599838614, "eval_recall": 0.5368465194722578, "eval_runtime": 5.5771, "eval_samples_per_second": 197.414, "step": 600 }, { "epoch": 2.62, "eval_accuracy": 0.5267938237965486, "eval_f1": 0.513698109548222, "eval_loss": 1.1393935680389404, "eval_precision": 0.519160589267, "eval_recall": 0.5237418576297002, "eval_runtime": 5.5559, "eval_samples_per_second": 198.168, "step": 700 }, { "epoch": 3.0, "eval_accuracy": 0.5413260672116258, "eval_f1": 0.5350818496505353, "eval_loss": 1.1169188022613525, "eval_precision": 0.545000483462316, "eval_recall": 0.5401851524056742, "eval_runtime": 5.5649, "eval_samples_per_second": 197.849, "step": 800 }, { "epoch": 3.37, "eval_accuracy": 0.5504087193460491, "eval_f1": 0.5371652447937805, "eval_loss": 1.1948559284210205, "eval_precision": 0.5461602569131191, "eval_recall": 0.5513573384419186, "eval_runtime": 5.7609, "eval_samples_per_second": 191.116, "step": 900 } ], "max_steps": 1335, "num_train_epochs": 5, "total_flos": 2757046992076800, "trial_name": null, "trial_params": null }