| { |
| "best_metric": 0.8975609756097561, |
| "best_model_checkpoint": "HRAF_Model_MultiLabel_ThreeLargeClasses/checkpoint-700", |
| "epoch": 4.0, |
| "global_step": 700, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.0, |
| "eval_accuracy": 0.5085714285714286, |
| "eval_f1": 0.8645660585959093, |
| "eval_loss": 0.4566337466239929, |
| "eval_roc_auc": 0.5400860231720076, |
| "eval_runtime": 93.095, |
| "eval_samples_per_second": 3.76, |
| "eval_steps_per_second": 0.473, |
| "step": 175 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_accuracy": 0.5514285714285714, |
| "eval_f1": 0.8843069873997709, |
| "eval_loss": 0.42618608474731445, |
| "eval_roc_auc": 0.634885883674972, |
| "eval_runtime": 93.2549, |
| "eval_samples_per_second": 3.753, |
| "eval_steps_per_second": 0.472, |
| "step": 350 |
| }, |
| { |
| "epoch": 2.86, |
| "learning_rate": 8.571428571428571e-06, |
| "loss": 0.425, |
| "step": 500 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_accuracy": 0.6, |
| "eval_f1": 0.8968824940047961, |
| "eval_loss": 0.39434972405433655, |
| "eval_roc_auc": 0.7227108923935367, |
| "eval_runtime": 92.9075, |
| "eval_samples_per_second": 3.767, |
| "eval_steps_per_second": 0.474, |
| "step": 525 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_accuracy": 0.6142857142857143, |
| "eval_f1": 0.8975609756097561, |
| "eval_loss": 0.3901987075805664, |
| "eval_roc_auc": 0.7456310303406052, |
| "eval_runtime": 93.1306, |
| "eval_samples_per_second": 3.758, |
| "eval_steps_per_second": 0.472, |
| "step": 700 |
| } |
| ], |
| "max_steps": 875, |
| "num_train_epochs": 5, |
| "total_flos": 624899189710512.0, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|