| { |
| "best_metric": 0.5371652447937805, |
| "best_model_checkpoint": "../output/roberta-base-sst/checkpoint-900", |
| "epoch": 3.370786516853933, |
| "global_step": 900, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.37, |
| "eval_accuracy": 0.44868301544050865, |
| "eval_f1": 0.40183269902596275, |
| "eval_loss": 1.2189757823944092, |
| "eval_precision": 0.45215636701421513, |
| "eval_recall": 0.4461052071145046, |
| "eval_runtime": 5.4464, |
| "eval_samples_per_second": 202.152, |
| "step": 100 |
| }, |
| { |
| "epoch": 0.75, |
| "eval_accuracy": 0.4713896457765668, |
| "eval_f1": 0.45576264052480686, |
| "eval_loss": 1.1674168109893799, |
| "eval_precision": 0.47342618027935013, |
| "eval_recall": 0.4617929878424363, |
| "eval_runtime": 5.5186, |
| "eval_samples_per_second": 199.508, |
| "step": 200 |
| }, |
| { |
| "epoch": 1.12, |
| "eval_accuracy": 0.48047229791099, |
| "eval_f1": 0.4608418062575635, |
| "eval_loss": 1.208803415298462, |
| "eval_precision": 0.47412277926758095, |
| "eval_recall": 0.49066121993560535, |
| "eval_runtime": 5.5423, |
| "eval_samples_per_second": 198.655, |
| "step": 300 |
| }, |
| { |
| "epoch": 1.5, |
| "eval_accuracy": 0.49954586739327883, |
| "eval_f1": 0.45326478521487196, |
| "eval_loss": 1.203087329864502, |
| "eval_precision": 0.5081235548351334, |
| "eval_recall": 0.48943672347517797, |
| "eval_runtime": 5.5675, |
| "eval_samples_per_second": 197.754, |
| "step": 400 |
| }, |
| { |
| "epoch": 1.87, |
| "learning_rate": 1.250936329588015e-05, |
| "loss": 1.1064, |
| "step": 500 |
| }, |
| { |
| "epoch": 1.87, |
| "eval_accuracy": 0.5313351498637602, |
| "eval_f1": 0.4925849403824431, |
| "eval_loss": 1.1195186376571655, |
| "eval_precision": 0.5255318894371125, |
| "eval_recall": 0.5062241091371705, |
| "eval_runtime": 5.5664, |
| "eval_samples_per_second": 197.795, |
| "step": 500 |
| }, |
| { |
| "epoch": 2.25, |
| "eval_accuracy": 0.5277020890099909, |
| "eval_f1": 0.5219048999186475, |
| "eval_loss": 1.1405118703842163, |
| "eval_precision": 0.5220602599838614, |
| "eval_recall": 0.5368465194722578, |
| "eval_runtime": 5.5771, |
| "eval_samples_per_second": 197.414, |
| "step": 600 |
| }, |
| { |
| "epoch": 2.62, |
| "eval_accuracy": 0.5267938237965486, |
| "eval_f1": 0.513698109548222, |
| "eval_loss": 1.1393935680389404, |
| "eval_precision": 0.519160589267, |
| "eval_recall": 0.5237418576297002, |
| "eval_runtime": 5.5559, |
| "eval_samples_per_second": 198.168, |
| "step": 700 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_accuracy": 0.5413260672116258, |
| "eval_f1": 0.5350818496505353, |
| "eval_loss": 1.1169188022613525, |
| "eval_precision": 0.545000483462316, |
| "eval_recall": 0.5401851524056742, |
| "eval_runtime": 5.5649, |
| "eval_samples_per_second": 197.849, |
| "step": 800 |
| }, |
| { |
| "epoch": 3.37, |
| "eval_accuracy": 0.5504087193460491, |
| "eval_f1": 0.5371652447937805, |
| "eval_loss": 1.1948559284210205, |
| "eval_precision": 0.5461602569131191, |
| "eval_recall": 0.5513573384419186, |
| "eval_runtime": 5.7609, |
| "eval_samples_per_second": 191.116, |
| "step": 900 |
| } |
| ], |
| "max_steps": 1335, |
| "num_train_epochs": 5, |
| "total_flos": 2757046992076800, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|