{ "best_global_step": 1092, "best_metric": 0.7072933549432739, "best_model_checkpoint": "projects/PetBERT_disease/model/checkpoint-1092", "epoch": 12.0, "eval_steps": 500, "global_step": 1092, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_f1": 0.6436176302232398, "eval_loss": 0.042807724326848984, "eval_precision": 0.720030737704918, "eval_recall": 0.5818671082591595, "eval_runtime": 28.0832, "eval_samples_per_second": 178.007, "eval_steps_per_second": 5.591, "step": 91 }, { "epoch": 2.0, "eval_f1": 0.6762402088772846, "eval_loss": 0.03623269498348236, "eval_precision": 0.7126805778491172, "eval_recall": 0.6433450631339267, "eval_runtime": 28.7199, "eval_samples_per_second": 174.061, "eval_steps_per_second": 5.467, "step": 182 }, { "epoch": 3.0, "eval_f1": 0.6854706461134799, "eval_loss": 0.04084809869527817, "eval_precision": 0.7263670064874884, "eval_recall": 0.6489339681225419, "eval_runtime": 28.935, "eval_samples_per_second": 172.766, "eval_steps_per_second": 5.426, "step": 273 }, { "epoch": 4.0, "eval_f1": 0.6827867947443966, "eval_loss": 0.04500150680541992, "eval_precision": 0.7316611452910554, "eval_recall": 0.6400331194369696, "eval_runtime": 29.0241, "eval_samples_per_second": 172.236, "eval_steps_per_second": 5.409, "step": 364 }, { "epoch": 5.0, "eval_f1": 0.684967037717497, "eval_loss": 0.058024812489748, "eval_precision": 0.716644052464948, "eval_recall": 0.6559718484785758, "eval_runtime": 29.1182, "eval_samples_per_second": 171.68, "eval_steps_per_second": 5.392, "step": 455 }, { "epoch": 5.4945054945054945, "grad_norm": 0.24326272308826447, "learning_rate": 4.9725824175824175e-05, "loss": 0.0324, "step": 500 }, { "epoch": 6.0, "eval_f1": 0.6974244120940649, "eval_loss": 0.06078333407640457, "eval_precision": 0.759697487191998, "eval_recall": 0.6445870420202856, "eval_runtime": 29.0499, "eval_samples_per_second": 172.083, "eval_steps_per_second": 5.404, "step": 546 }, { "epoch": 7.0, "eval_f1": 0.699815837937385, "eval_loss": 0.06435026973485947, "eval_precision": 0.7340909090909091, "eval_recall": 0.668598633823225, "eval_runtime": 29.1958, "eval_samples_per_second": 171.223, "eval_steps_per_second": 5.377, "step": 637 }, { "epoch": 8.0, "eval_f1": 0.6904121863799283, "eval_loss": 0.06762922555208206, "eval_precision": 0.7522577495728582, "eval_recall": 0.6379631546263713, "eval_runtime": 29.1932, "eval_samples_per_second": 171.238, "eval_steps_per_second": 5.378, "step": 728 }, { "epoch": 9.0, "eval_f1": 0.6979665708506334, "eval_loss": 0.07541821897029877, "eval_precision": 0.718544498027181, "eval_recall": 0.6785344649140964, "eval_runtime": 29.3157, "eval_samples_per_second": 170.523, "eval_steps_per_second": 5.355, "step": 819 }, { "epoch": 10.0, "eval_f1": 0.7055853581571474, "eval_loss": 0.06385636329650879, "eval_precision": 0.7172797262617622, "eval_recall": 0.6942661974746429, "eval_runtime": 29.2092, "eval_samples_per_second": 171.144, "eval_steps_per_second": 5.375, "step": 910 }, { "epoch": 10.989010989010989, "grad_norm": 0.7826827168464661, "learning_rate": 4.9451098901098904e-05, "loss": 0.0035, "step": 1000 }, { "epoch": 11.0, "eval_f1": 0.7059959240587794, "eval_loss": 0.07221361249685287, "eval_precision": 0.7326357969723953, "eval_recall": 0.6812254191678742, "eval_runtime": 29.1291, "eval_samples_per_second": 171.615, "eval_steps_per_second": 5.39, "step": 1001 }, { "epoch": 12.0, "eval_f1": 0.7072933549432739, "eval_loss": 0.06996828317642212, "eval_precision": 0.7398282097649186, "eval_recall": 0.6774994825087973, "eval_runtime": 29.1242, "eval_samples_per_second": 171.644, "eval_steps_per_second": 5.391, "step": 1092 } ], "logging_steps": 500, "max_steps": 91000, "num_input_tokens_seen": 0, "num_train_epochs": 1000, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 3, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 0 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 9096344934248448.0, "train_batch_size": 32, "trial_name": null, "trial_params": null }