| { |
| "best_metric": 0.24747222661972046, |
| "best_model_checkpoint": "/home/jcanete/ft-data/all_results/ner/roberta_large_bne/epochs_2_bs_16_lr_5e-5/checkpoint-1000", |
| "epoch": 2.0, |
| "global_step": 1042, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.19, |
| "eval_accuracy": 0.8513695074658768, |
| "eval_f1": 0.1648726699921239, |
| "eval_loss": 0.5836164951324463, |
| "eval_precision": 0.4988085782366958, |
| "eval_recall": 0.09875766629973266, |
| "eval_runtime": 3.7205, |
| "eval_samples_per_second": 514.978, |
| "eval_steps_per_second": 32.253, |
| "step": 100 |
| }, |
| { |
| "epoch": 0.38, |
| "eval_accuracy": 0.8838590491312712, |
| "eval_f1": 0.3543647363872084, |
| "eval_loss": 0.40415123105049133, |
| "eval_precision": 0.45510606808090776, |
| "eval_recall": 0.2901399591130681, |
| "eval_runtime": 3.5735, |
| "eval_samples_per_second": 536.167, |
| "eval_steps_per_second": 33.58, |
| "step": 200 |
| }, |
| { |
| "epoch": 0.58, |
| "eval_accuracy": 0.8917982228464991, |
| "eval_f1": 0.4051617172636281, |
| "eval_loss": 0.37282565236091614, |
| "eval_precision": 0.4273996509598604, |
| "eval_recall": 0.38512344708287466, |
| "eval_runtime": 3.5615, |
| "eval_samples_per_second": 537.975, |
| "eval_steps_per_second": 33.694, |
| "step": 300 |
| }, |
| { |
| "epoch": 0.77, |
| "eval_accuracy": 0.9021496839598155, |
| "eval_f1": 0.441752880814198, |
| "eval_loss": 0.3306070864200592, |
| "eval_precision": 0.47486437613019894, |
| "eval_recall": 0.4129580122660796, |
| "eval_runtime": 3.5725, |
| "eval_samples_per_second": 536.317, |
| "eval_steps_per_second": 33.59, |
| "step": 400 |
| }, |
| { |
| "epoch": 0.96, |
| "learning_rate": 2.6199616122840692e-05, |
| "loss": 0.3639, |
| "step": 500 |
| }, |
| { |
| "epoch": 0.96, |
| "eval_accuracy": 0.9098293077651226, |
| "eval_f1": 0.4915268248326031, |
| "eval_loss": 0.3107258975505829, |
| "eval_precision": 0.5181247821540607, |
| "eval_recall": 0.46752634061959425, |
| "eval_runtime": 3.5465, |
| "eval_samples_per_second": 540.25, |
| "eval_steps_per_second": 33.836, |
| "step": 500 |
| }, |
| { |
| "epoch": 1.15, |
| "eval_accuracy": 0.9191425692387554, |
| "eval_f1": 0.5334455195624738, |
| "eval_loss": 0.28400444984436035, |
| "eval_precision": 0.573651827723489, |
| "eval_recall": 0.49850605441107093, |
| "eval_runtime": 3.6566, |
| "eval_samples_per_second": 523.984, |
| "eval_steps_per_second": 32.817, |
| "step": 600 |
| }, |
| { |
| "epoch": 1.34, |
| "eval_accuracy": 0.9191273015969953, |
| "eval_f1": 0.5345680983554207, |
| "eval_loss": 0.27888885140419006, |
| "eval_precision": 0.5428895735365656, |
| "eval_recall": 0.5264978770246894, |
| "eval_runtime": 3.5531, |
| "eval_samples_per_second": 539.251, |
| "eval_steps_per_second": 33.774, |
| "step": 700 |
| }, |
| { |
| "epoch": 1.54, |
| "eval_accuracy": 0.9216464624874042, |
| "eval_f1": 0.5420696324951644, |
| "eval_loss": 0.27768683433532715, |
| "eval_precision": 0.5559596627541742, |
| "eval_recall": 0.5288567384808932, |
| "eval_runtime": 3.6668, |
| "eval_samples_per_second": 522.526, |
| "eval_steps_per_second": 32.726, |
| "step": 800 |
| }, |
| { |
| "epoch": 1.73, |
| "eval_accuracy": 0.9239213411096522, |
| "eval_f1": 0.5558622929522572, |
| "eval_loss": 0.2659355401992798, |
| "eval_precision": 0.5746180963572268, |
| "eval_recall": 0.5382921843057085, |
| "eval_runtime": 3.5615, |
| "eval_samples_per_second": 537.969, |
| "eval_steps_per_second": 33.693, |
| "step": 900 |
| }, |
| { |
| "epoch": 1.92, |
| "learning_rate": 2.2072936660268714e-06, |
| "loss": 0.1284, |
| "step": 1000 |
| }, |
| { |
| "epoch": 1.92, |
| "eval_accuracy": 0.9300131301719137, |
| "eval_f1": 0.5886271324126726, |
| "eval_loss": 0.24747222661972046, |
| "eval_precision": 0.6088052428163334, |
| "eval_recall": 0.5697436703884259, |
| "eval_runtime": 3.5563, |
| "eval_samples_per_second": 538.768, |
| "eval_steps_per_second": 33.743, |
| "step": 1000 |
| }, |
| { |
| "epoch": 2.0, |
| "step": 1042, |
| "total_flos": 2679034988917632.0, |
| "train_loss": 0.2408974696944634, |
| "train_runtime": 222.5517, |
| "train_samples_per_second": 74.805, |
| "train_steps_per_second": 4.682 |
| } |
| ], |
| "max_steps": 1042, |
| "num_train_epochs": 2, |
| "total_flos": 2679034988917632.0, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|