| { | |
| "best_global_step": 1092, | |
| "best_metric": 0.7072933549432739, | |
| "best_model_checkpoint": "projects/PetBERT_disease/model/checkpoint-1092", | |
| "epoch": 12.0, | |
| "eval_steps": 500, | |
| "global_step": 1092, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_f1": 0.6436176302232398, | |
| "eval_loss": 0.042807724326848984, | |
| "eval_precision": 0.720030737704918, | |
| "eval_recall": 0.5818671082591595, | |
| "eval_runtime": 28.0832, | |
| "eval_samples_per_second": 178.007, | |
| "eval_steps_per_second": 5.591, | |
| "step": 91 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_f1": 0.6762402088772846, | |
| "eval_loss": 0.03623269498348236, | |
| "eval_precision": 0.7126805778491172, | |
| "eval_recall": 0.6433450631339267, | |
| "eval_runtime": 28.7199, | |
| "eval_samples_per_second": 174.061, | |
| "eval_steps_per_second": 5.467, | |
| "step": 182 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_f1": 0.6854706461134799, | |
| "eval_loss": 0.04084809869527817, | |
| "eval_precision": 0.7263670064874884, | |
| "eval_recall": 0.6489339681225419, | |
| "eval_runtime": 28.935, | |
| "eval_samples_per_second": 172.766, | |
| "eval_steps_per_second": 5.426, | |
| "step": 273 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_f1": 0.6827867947443966, | |
| "eval_loss": 0.04500150680541992, | |
| "eval_precision": 0.7316611452910554, | |
| "eval_recall": 0.6400331194369696, | |
| "eval_runtime": 29.0241, | |
| "eval_samples_per_second": 172.236, | |
| "eval_steps_per_second": 5.409, | |
| "step": 364 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_f1": 0.684967037717497, | |
| "eval_loss": 0.058024812489748, | |
| "eval_precision": 0.716644052464948, | |
| "eval_recall": 0.6559718484785758, | |
| "eval_runtime": 29.1182, | |
| "eval_samples_per_second": 171.68, | |
| "eval_steps_per_second": 5.392, | |
| "step": 455 | |
| }, | |
| { | |
| "epoch": 5.4945054945054945, | |
| "grad_norm": 0.24326272308826447, | |
| "learning_rate": 4.9725824175824175e-05, | |
| "loss": 0.0324, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_f1": 0.6974244120940649, | |
| "eval_loss": 0.06078333407640457, | |
| "eval_precision": 0.759697487191998, | |
| "eval_recall": 0.6445870420202856, | |
| "eval_runtime": 29.0499, | |
| "eval_samples_per_second": 172.083, | |
| "eval_steps_per_second": 5.404, | |
| "step": 546 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_f1": 0.699815837937385, | |
| "eval_loss": 0.06435026973485947, | |
| "eval_precision": 0.7340909090909091, | |
| "eval_recall": 0.668598633823225, | |
| "eval_runtime": 29.1958, | |
| "eval_samples_per_second": 171.223, | |
| "eval_steps_per_second": 5.377, | |
| "step": 637 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_f1": 0.6904121863799283, | |
| "eval_loss": 0.06762922555208206, | |
| "eval_precision": 0.7522577495728582, | |
| "eval_recall": 0.6379631546263713, | |
| "eval_runtime": 29.1932, | |
| "eval_samples_per_second": 171.238, | |
| "eval_steps_per_second": 5.378, | |
| "step": 728 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_f1": 0.6979665708506334, | |
| "eval_loss": 0.07541821897029877, | |
| "eval_precision": 0.718544498027181, | |
| "eval_recall": 0.6785344649140964, | |
| "eval_runtime": 29.3157, | |
| "eval_samples_per_second": 170.523, | |
| "eval_steps_per_second": 5.355, | |
| "step": 819 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_f1": 0.7055853581571474, | |
| "eval_loss": 0.06385636329650879, | |
| "eval_precision": 0.7172797262617622, | |
| "eval_recall": 0.6942661974746429, | |
| "eval_runtime": 29.2092, | |
| "eval_samples_per_second": 171.144, | |
| "eval_steps_per_second": 5.375, | |
| "step": 910 | |
| }, | |
| { | |
| "epoch": 10.989010989010989, | |
| "grad_norm": 0.7826827168464661, | |
| "learning_rate": 4.9451098901098904e-05, | |
| "loss": 0.0035, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_f1": 0.7059959240587794, | |
| "eval_loss": 0.07221361249685287, | |
| "eval_precision": 0.7326357969723953, | |
| "eval_recall": 0.6812254191678742, | |
| "eval_runtime": 29.1291, | |
| "eval_samples_per_second": 171.615, | |
| "eval_steps_per_second": 5.39, | |
| "step": 1001 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_f1": 0.7072933549432739, | |
| "eval_loss": 0.06996828317642212, | |
| "eval_precision": 0.7398282097649186, | |
| "eval_recall": 0.6774994825087973, | |
| "eval_runtime": 29.1242, | |
| "eval_samples_per_second": 171.644, | |
| "eval_steps_per_second": 5.391, | |
| "step": 1092 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 91000, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 1000, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "EarlyStoppingCallback": { | |
| "args": { | |
| "early_stopping_patience": 3, | |
| "early_stopping_threshold": 0.0 | |
| }, | |
| "attributes": { | |
| "early_stopping_patience_counter": 0 | |
| } | |
| }, | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": false | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 9096344934248448.0, | |
| "train_batch_size": 32, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |