| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 10.0, | |
| "global_step": 910, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.9533894011551323, | |
| "eval_f1": 0.6969990319457888, | |
| "eval_loss": 0.20486080646514893, | |
| "eval_precision": 0.6617647058823529, | |
| "eval_recall": 0.7361963190184049, | |
| "eval_runtime": 1.2373, | |
| "eval_samples_per_second": 130.123, | |
| "eval_steps_per_second": 33.137, | |
| "step": 91 | |
| }, | |
| { | |
| "epoch": 1.1, | |
| "learning_rate": 4.4505494505494504e-05, | |
| "loss": 0.5036, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.9722362954706657, | |
| "eval_f1": 0.8234146341463414, | |
| "eval_loss": 0.11564752459526062, | |
| "eval_precision": 0.7873134328358209, | |
| "eval_recall": 0.8629856850715747, | |
| "eval_runtime": 1.2367, | |
| "eval_samples_per_second": 130.181, | |
| "eval_steps_per_second": 33.152, | |
| "step": 182 | |
| }, | |
| { | |
| "epoch": 2.2, | |
| "learning_rate": 3.901098901098901e-05, | |
| "loss": 0.1442, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.9771000101327388, | |
| "eval_f1": 0.8632812499999999, | |
| "eval_loss": 0.10779214650392532, | |
| "eval_precision": 0.8261682242990654, | |
| "eval_recall": 0.9038854805725971, | |
| "eval_runtime": 1.2508, | |
| "eval_samples_per_second": 128.715, | |
| "eval_steps_per_second": 32.778, | |
| "step": 273 | |
| }, | |
| { | |
| "epoch": 3.3, | |
| "learning_rate": 3.3516483516483513e-05, | |
| "loss": 0.0757, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.9780119566318776, | |
| "eval_f1": 0.8851148851148851, | |
| "eval_loss": 0.1178947389125824, | |
| "eval_precision": 0.865234375, | |
| "eval_recall": 0.9059304703476483, | |
| "eval_runtime": 1.2453, | |
| "eval_samples_per_second": 129.288, | |
| "eval_steps_per_second": 32.924, | |
| "step": 364 | |
| }, | |
| { | |
| "epoch": 4.4, | |
| "learning_rate": 2.8021978021978025e-05, | |
| "loss": 0.0526, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.9836862904042962, | |
| "eval_f1": 0.897876643073812, | |
| "eval_loss": 0.0906740128993988, | |
| "eval_precision": 0.888, | |
| "eval_recall": 0.9079754601226994, | |
| "eval_runtime": 1.2584, | |
| "eval_samples_per_second": 127.94, | |
| "eval_steps_per_second": 32.581, | |
| "step": 455 | |
| }, | |
| { | |
| "epoch": 5.49, | |
| "learning_rate": 2.252747252747253e-05, | |
| "loss": 0.0342, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.9831796534603303, | |
| "eval_f1": 0.9130869130869131, | |
| "eval_loss": 0.0972292423248291, | |
| "eval_precision": 0.892578125, | |
| "eval_recall": 0.934560327198364, | |
| "eval_runtime": 1.2748, | |
| "eval_samples_per_second": 126.296, | |
| "eval_steps_per_second": 32.162, | |
| "step": 546 | |
| }, | |
| { | |
| "epoch": 6.59, | |
| "learning_rate": 1.7032967032967035e-05, | |
| "loss": 0.0245, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.9833823082379167, | |
| "eval_f1": 0.9107321965897693, | |
| "eval_loss": 0.10643576085567474, | |
| "eval_precision": 0.8937007874015748, | |
| "eval_recall": 0.9284253578732107, | |
| "eval_runtime": 1.2478, | |
| "eval_samples_per_second": 129.031, | |
| "eval_steps_per_second": 32.859, | |
| "step": 637 | |
| }, | |
| { | |
| "epoch": 7.69, | |
| "learning_rate": 1.153846153846154e-05, | |
| "loss": 0.0188, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.9850035464586078, | |
| "eval_f1": 0.9169169169169169, | |
| "eval_loss": 0.09653466939926147, | |
| "eval_precision": 0.8980392156862745, | |
| "eval_recall": 0.9366053169734151, | |
| "eval_runtime": 1.2451, | |
| "eval_samples_per_second": 129.306, | |
| "eval_steps_per_second": 32.929, | |
| "step": 728 | |
| }, | |
| { | |
| "epoch": 8.79, | |
| "learning_rate": 6.043956043956044e-06, | |
| "loss": 0.0159, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.984598236903435, | |
| "eval_f1": 0.9201213346814965, | |
| "eval_loss": 0.09986742585897446, | |
| "eval_precision": 0.91, | |
| "eval_recall": 0.9304703476482618, | |
| "eval_runtime": 1.2461, | |
| "eval_samples_per_second": 129.208, | |
| "eval_steps_per_second": 32.904, | |
| "step": 819 | |
| }, | |
| { | |
| "epoch": 9.89, | |
| "learning_rate": 5.494505494505495e-07, | |
| "loss": 0.0141, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.985104873847401, | |
| "eval_f1": 0.911088911088911, | |
| "eval_loss": 0.09563781321048737, | |
| "eval_precision": 0.890625, | |
| "eval_recall": 0.9325153374233128, | |
| "eval_runtime": 1.2493, | |
| "eval_samples_per_second": 128.877, | |
| "eval_steps_per_second": 32.819, | |
| "step": 910 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "step": 910, | |
| "total_flos": 1883034567828480.0, | |
| "train_loss": 0.09724931471295409, | |
| "train_runtime": 322.9196, | |
| "train_samples_per_second": 44.624, | |
| "train_steps_per_second": 2.818 | |
| } | |
| ], | |
| "max_steps": 910, | |
| "num_train_epochs": 10, | |
| "total_flos": 1883034567828480.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |