| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 10.0, | |
| "global_step": 220, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "learning_rate": 9.090909090909092e-05, | |
| "loss": 0.6837, | |
| "step": 22 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.5897435897435898, | |
| "eval_f1": 0.6666666666666666, | |
| "eval_loss": 0.6039571166038513, | |
| "eval_precision": 0.5161290322580645, | |
| "eval_recall": 0.9411764705882353, | |
| "eval_roc_auc": 0.6296791443850267, | |
| "eval_runtime": 0.069, | |
| "eval_samples_per_second": 565.227, | |
| "eval_steps_per_second": 43.479, | |
| "step": 22 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "learning_rate": 8.090909090909092e-05, | |
| "loss": 0.3852, | |
| "step": 44 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.9230769230769231, | |
| "eval_f1": 0.9189189189189189, | |
| "eval_loss": 0.28810474276542664, | |
| "eval_precision": 0.85, | |
| "eval_recall": 1.0, | |
| "eval_roc_auc": 0.9318181818181819, | |
| "eval_runtime": 0.064, | |
| "eval_samples_per_second": 609.374, | |
| "eval_steps_per_second": 46.875, | |
| "step": 44 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "learning_rate": 7.090909090909092e-05, | |
| "loss": 0.2148, | |
| "step": 66 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.9230769230769231, | |
| "eval_f1": 0.9189189189189189, | |
| "eval_loss": 0.38069406151771545, | |
| "eval_precision": 0.85, | |
| "eval_recall": 1.0, | |
| "eval_roc_auc": 0.9318181818181819, | |
| "eval_runtime": 0.065, | |
| "eval_samples_per_second": 600.004, | |
| "eval_steps_per_second": 46.154, | |
| "step": 66 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "learning_rate": 6.090909090909091e-05, | |
| "loss": 0.0701, | |
| "step": 88 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.8717948717948718, | |
| "eval_f1": 0.8717948717948718, | |
| "eval_loss": 0.4933823347091675, | |
| "eval_precision": 0.7727272727272727, | |
| "eval_recall": 1.0, | |
| "eval_roc_auc": 0.8863636363636364, | |
| "eval_runtime": 0.071, | |
| "eval_samples_per_second": 549.297, | |
| "eval_steps_per_second": 42.254, | |
| "step": 88 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "learning_rate": 5.090909090909091e-05, | |
| "loss": 0.0164, | |
| "step": 110 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.8974358974358975, | |
| "eval_f1": 0.8947368421052632, | |
| "eval_loss": 0.4892081320285797, | |
| "eval_precision": 0.8095238095238095, | |
| "eval_recall": 1.0, | |
| "eval_roc_auc": 0.9090909090909091, | |
| "eval_runtime": 0.064, | |
| "eval_samples_per_second": 609.381, | |
| "eval_steps_per_second": 46.875, | |
| "step": 110 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "learning_rate": 4.0909090909090915e-05, | |
| "loss": 0.0039, | |
| "step": 132 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.8974358974358975, | |
| "eval_f1": 0.8947368421052632, | |
| "eval_loss": 0.49288177490234375, | |
| "eval_precision": 0.8095238095238095, | |
| "eval_recall": 1.0, | |
| "eval_roc_auc": 0.9090909090909091, | |
| "eval_runtime": 0.058, | |
| "eval_samples_per_second": 672.418, | |
| "eval_steps_per_second": 51.724, | |
| "step": 132 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "learning_rate": 3.090909090909091e-05, | |
| "loss": 0.0012, | |
| "step": 154 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.9230769230769231, | |
| "eval_f1": 0.9189189189189189, | |
| "eval_loss": 0.4065372943878174, | |
| "eval_precision": 0.85, | |
| "eval_recall": 1.0, | |
| "eval_roc_auc": 0.9318181818181819, | |
| "eval_runtime": 0.063, | |
| "eval_samples_per_second": 619.043, | |
| "eval_steps_per_second": 47.619, | |
| "step": 154 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "learning_rate": 2.090909090909091e-05, | |
| "loss": 0.0008, | |
| "step": 176 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.9230769230769231, | |
| "eval_f1": 0.9189189189189189, | |
| "eval_loss": 0.48369330167770386, | |
| "eval_precision": 0.85, | |
| "eval_recall": 1.0, | |
| "eval_roc_auc": 0.9318181818181819, | |
| "eval_runtime": 0.059, | |
| "eval_samples_per_second": 661.03, | |
| "eval_steps_per_second": 50.848, | |
| "step": 176 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "learning_rate": 1.0909090909090909e-05, | |
| "loss": 0.0007, | |
| "step": 198 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.9230769230769231, | |
| "eval_f1": 0.9189189189189189, | |
| "eval_loss": 0.4999829828739166, | |
| "eval_precision": 0.85, | |
| "eval_recall": 1.0, | |
| "eval_roc_auc": 0.9318181818181819, | |
| "eval_runtime": 0.061, | |
| "eval_samples_per_second": 639.321, | |
| "eval_steps_per_second": 49.179, | |
| "step": 198 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "learning_rate": 9.09090909090909e-07, | |
| "loss": 0.0006, | |
| "step": 220 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.9230769230769231, | |
| "eval_f1": 0.9189189189189189, | |
| "eval_loss": 0.5037449598312378, | |
| "eval_precision": 0.85, | |
| "eval_recall": 1.0, | |
| "eval_roc_auc": 0.9318181818181819, | |
| "eval_runtime": 0.058, | |
| "eval_samples_per_second": 672.418, | |
| "eval_steps_per_second": 51.724, | |
| "step": 220 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "step": 220, | |
| "total_flos": 197738122089864.0, | |
| "train_loss": 0.1377350079192018, | |
| "train_runtime": 17.676, | |
| "train_samples_per_second": 194.048, | |
| "train_steps_per_second": 12.446 | |
| } | |
| ], | |
| "max_steps": 220, | |
| "num_train_epochs": 10, | |
| "total_flos": 197738122089864.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |