| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 5.0, | |
| "global_step": 36725, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "learning_rate": 1.8e-05, | |
| "loss": 0.0085, | |
| "step": 7345 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_EG_f1": 0.9962079135863944, | |
| "eval_ET_f1": 0.9989276960784315, | |
| "eval_TE_f1": 0.9956351941189985, | |
| "eval_loss": 0.002211587270721793, | |
| "eval_overall_accuracy": 0.9995236481225324, | |
| "eval_overall_f1": 0.9969235482594433, | |
| "eval_overall_precision": 0.9969871827605576, | |
| "eval_overall_recall": 0.9968599218809834, | |
| "eval_runtime": 329.5116, | |
| "eval_samples_per_second": 39.625, | |
| "eval_steps_per_second": 2.479, | |
| "step": 7345 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "learning_rate": 1.6000000000000003e-05, | |
| "loss": 0.0014, | |
| "step": 14690 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_EG_f1": 0.9987363584147042, | |
| "eval_ET_f1": 0.9995787861382348, | |
| "eval_TE_f1": 0.9985064910197986, | |
| "eval_loss": 0.0008891239413060248, | |
| "eval_overall_accuracy": 0.9998259483524637, | |
| "eval_overall_f1": 0.9989405562717792, | |
| "eval_overall_precision": 0.998927805575411, | |
| "eval_overall_recall": 0.9989533072936612, | |
| "eval_runtime": 314.9732, | |
| "eval_samples_per_second": 41.454, | |
| "eval_steps_per_second": 2.594, | |
| "step": 14690 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "learning_rate": 1.4e-05, | |
| "loss": 0.0008, | |
| "step": 22035 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_EG_f1": 0.9983534367221903, | |
| "eval_ET_f1": 0.9996170636440224, | |
| "eval_TE_f1": 0.9983917904732731, | |
| "eval_loss": 0.0008875366183929145, | |
| "eval_overall_accuracy": 0.999835108965492, | |
| "eval_overall_f1": 0.9987874146403727, | |
| "eval_overall_precision": 0.9987491703681013, | |
| "eval_overall_recall": 0.9988256618416685, | |
| "eval_runtime": 316.3291, | |
| "eval_samples_per_second": 41.277, | |
| "eval_steps_per_second": 2.583, | |
| "step": 22035 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "learning_rate": 1.2e-05, | |
| "loss": 0.0005, | |
| "step": 29380 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_EG_f1": 0.9991574754901962, | |
| "eval_ET_f1": 0.9996553968679404, | |
| "eval_TE_f1": 0.9989277782032626, | |
| "eval_loss": 0.000532182864844799, | |
| "eval_overall_accuracy": 0.9998717514176049, | |
| "eval_overall_f1": 0.9992469014462045, | |
| "eval_overall_precision": 0.9992341468395793, | |
| "eval_overall_recall": 0.9992596563784433, | |
| "eval_runtime": 328.7608, | |
| "eval_samples_per_second": 39.716, | |
| "eval_steps_per_second": 2.485, | |
| "step": 29380 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "learning_rate": 1e-05, | |
| "loss": 0.0003, | |
| "step": 36725 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_EG_f1": 0.9992341272880447, | |
| "eval_ET_f1": 0.999846825457609, | |
| "eval_TE_f1": 0.9992724487842237, | |
| "eval_loss": 0.00026392185827717185, | |
| "eval_overall_accuracy": 0.9999404560153166, | |
| "eval_overall_f1": 0.999451131562488, | |
| "eval_overall_precision": 0.9994383743490248, | |
| "eval_overall_recall": 0.9994638891016313, | |
| "eval_runtime": 321.322, | |
| "eval_samples_per_second": 40.635, | |
| "eval_steps_per_second": 2.543, | |
| "step": 36725 | |
| } | |
| ], | |
| "max_steps": 73450, | |
| "num_train_epochs": 10, | |
| "total_flos": 8945844807242016.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |