| { |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 10.0, |
| "global_step": 220, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.0, |
| "learning_rate": 9.090909090909092e-05, |
| "loss": 0.6837, |
| "step": 22 |
| }, |
| { |
| "epoch": 1.0, |
| "eval_accuracy": 0.5897435897435898, |
| "eval_f1": 0.6666666666666666, |
| "eval_loss": 0.6039571166038513, |
| "eval_precision": 0.5161290322580645, |
| "eval_recall": 0.9411764705882353, |
| "eval_roc_auc": 0.6296791443850267, |
| "eval_runtime": 0.069, |
| "eval_samples_per_second": 565.227, |
| "eval_steps_per_second": 43.479, |
| "step": 22 |
| }, |
| { |
| "epoch": 2.0, |
| "learning_rate": 8.090909090909092e-05, |
| "loss": 0.3852, |
| "step": 44 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_accuracy": 0.9230769230769231, |
| "eval_f1": 0.9189189189189189, |
| "eval_loss": 0.28810474276542664, |
| "eval_precision": 0.85, |
| "eval_recall": 1.0, |
| "eval_roc_auc": 0.9318181818181819, |
| "eval_runtime": 0.064, |
| "eval_samples_per_second": 609.374, |
| "eval_steps_per_second": 46.875, |
| "step": 44 |
| }, |
| { |
| "epoch": 3.0, |
| "learning_rate": 7.090909090909092e-05, |
| "loss": 0.2148, |
| "step": 66 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_accuracy": 0.9230769230769231, |
| "eval_f1": 0.9189189189189189, |
| "eval_loss": 0.38069406151771545, |
| "eval_precision": 0.85, |
| "eval_recall": 1.0, |
| "eval_roc_auc": 0.9318181818181819, |
| "eval_runtime": 0.065, |
| "eval_samples_per_second": 600.004, |
| "eval_steps_per_second": 46.154, |
| "step": 66 |
| }, |
| { |
| "epoch": 4.0, |
| "learning_rate": 6.090909090909091e-05, |
| "loss": 0.0701, |
| "step": 88 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_accuracy": 0.8717948717948718, |
| "eval_f1": 0.8717948717948718, |
| "eval_loss": 0.4933823347091675, |
| "eval_precision": 0.7727272727272727, |
| "eval_recall": 1.0, |
| "eval_roc_auc": 0.8863636363636364, |
| "eval_runtime": 0.071, |
| "eval_samples_per_second": 549.297, |
| "eval_steps_per_second": 42.254, |
| "step": 88 |
| }, |
| { |
| "epoch": 5.0, |
| "learning_rate": 5.090909090909091e-05, |
| "loss": 0.0164, |
| "step": 110 |
| }, |
| { |
| "epoch": 5.0, |
| "eval_accuracy": 0.8974358974358975, |
| "eval_f1": 0.8947368421052632, |
| "eval_loss": 0.4892081320285797, |
| "eval_precision": 0.8095238095238095, |
| "eval_recall": 1.0, |
| "eval_roc_auc": 0.9090909090909091, |
| "eval_runtime": 0.064, |
| "eval_samples_per_second": 609.381, |
| "eval_steps_per_second": 46.875, |
| "step": 110 |
| }, |
| { |
| "epoch": 6.0, |
| "learning_rate": 4.0909090909090915e-05, |
| "loss": 0.0039, |
| "step": 132 |
| }, |
| { |
| "epoch": 6.0, |
| "eval_accuracy": 0.8974358974358975, |
| "eval_f1": 0.8947368421052632, |
| "eval_loss": 0.49288177490234375, |
| "eval_precision": 0.8095238095238095, |
| "eval_recall": 1.0, |
| "eval_roc_auc": 0.9090909090909091, |
| "eval_runtime": 0.058, |
| "eval_samples_per_second": 672.418, |
| "eval_steps_per_second": 51.724, |
| "step": 132 |
| }, |
| { |
| "epoch": 7.0, |
| "learning_rate": 3.090909090909091e-05, |
| "loss": 0.0012, |
| "step": 154 |
| }, |
| { |
| "epoch": 7.0, |
| "eval_accuracy": 0.9230769230769231, |
| "eval_f1": 0.9189189189189189, |
| "eval_loss": 0.4065372943878174, |
| "eval_precision": 0.85, |
| "eval_recall": 1.0, |
| "eval_roc_auc": 0.9318181818181819, |
| "eval_runtime": 0.063, |
| "eval_samples_per_second": 619.043, |
| "eval_steps_per_second": 47.619, |
| "step": 154 |
| }, |
| { |
| "epoch": 8.0, |
| "learning_rate": 2.090909090909091e-05, |
| "loss": 0.0008, |
| "step": 176 |
| }, |
| { |
| "epoch": 8.0, |
| "eval_accuracy": 0.9230769230769231, |
| "eval_f1": 0.9189189189189189, |
| "eval_loss": 0.48369330167770386, |
| "eval_precision": 0.85, |
| "eval_recall": 1.0, |
| "eval_roc_auc": 0.9318181818181819, |
| "eval_runtime": 0.059, |
| "eval_samples_per_second": 661.03, |
| "eval_steps_per_second": 50.848, |
| "step": 176 |
| }, |
| { |
| "epoch": 9.0, |
| "learning_rate": 1.0909090909090909e-05, |
| "loss": 0.0007, |
| "step": 198 |
| }, |
| { |
| "epoch": 9.0, |
| "eval_accuracy": 0.9230769230769231, |
| "eval_f1": 0.9189189189189189, |
| "eval_loss": 0.4999829828739166, |
| "eval_precision": 0.85, |
| "eval_recall": 1.0, |
| "eval_roc_auc": 0.9318181818181819, |
| "eval_runtime": 0.061, |
| "eval_samples_per_second": 639.321, |
| "eval_steps_per_second": 49.179, |
| "step": 198 |
| }, |
| { |
| "epoch": 10.0, |
| "learning_rate": 9.09090909090909e-07, |
| "loss": 0.0006, |
| "step": 220 |
| }, |
| { |
| "epoch": 10.0, |
| "eval_accuracy": 0.9230769230769231, |
| "eval_f1": 0.9189189189189189, |
| "eval_loss": 0.5037449598312378, |
| "eval_precision": 0.85, |
| "eval_recall": 1.0, |
| "eval_roc_auc": 0.9318181818181819, |
| "eval_runtime": 0.058, |
| "eval_samples_per_second": 672.418, |
| "eval_steps_per_second": 51.724, |
| "step": 220 |
| }, |
| { |
| "epoch": 10.0, |
| "step": 220, |
| "total_flos": 197738122089864.0, |
| "train_loss": 0.1377350079192018, |
| "train_runtime": 17.676, |
| "train_samples_per_second": 194.048, |
| "train_steps_per_second": 12.446 |
| } |
| ], |
| "max_steps": 220, |
| "num_train_epochs": 10, |
| "total_flos": 197738122089864.0, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|