| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 10.0, | |
| "global_step": 320, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.8748680042238648, | |
| "eval_f1": 0.0, | |
| "eval_loss": 0.616299569606781, | |
| "eval_precision": 0.0, | |
| "eval_recall": 0.0, | |
| "eval_runtime": 0.1116, | |
| "eval_samples_per_second": 815.287, | |
| "step": 32 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.8785638859556494, | |
| "eval_f1": 0.0, | |
| "eval_loss": 0.4105246365070343, | |
| "eval_precision": 0.0, | |
| "eval_recall": 0.0, | |
| "eval_runtime": 0.1118, | |
| "eval_samples_per_second": 814.082, | |
| "step": 64 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.883843717001056, | |
| "eval_f1": 0.3583333333333333, | |
| "eval_loss": 0.328654408454895, | |
| "eval_precision": 0.4387755102040816, | |
| "eval_recall": 0.3028169014084507, | |
| "eval_runtime": 0.1118, | |
| "eval_samples_per_second": 814.03, | |
| "step": 96 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.8912354804646251, | |
| "eval_f1": 0.36909871244635195, | |
| "eval_loss": 0.31546750664711, | |
| "eval_precision": 0.4725274725274725, | |
| "eval_recall": 0.3028169014084507, | |
| "eval_runtime": 0.1118, | |
| "eval_samples_per_second": 813.707, | |
| "step": 128 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.8933474128827877, | |
| "eval_f1": 0.41538461538461535, | |
| "eval_loss": 0.3068830370903015, | |
| "eval_precision": 0.4576271186440678, | |
| "eval_recall": 0.38028169014084506, | |
| "eval_runtime": 0.1247, | |
| "eval_samples_per_second": 730.008, | |
| "step": 160 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.8912354804646251, | |
| "eval_f1": 0.48135593220338985, | |
| "eval_loss": 0.330695241689682, | |
| "eval_precision": 0.46405228758169936, | |
| "eval_recall": 0.5, | |
| "eval_runtime": 0.1127, | |
| "eval_samples_per_second": 807.78, | |
| "step": 192 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.895987328405491, | |
| "eval_f1": 0.4470588235294118, | |
| "eval_loss": 0.3800097107887268, | |
| "eval_precision": 0.504424778761062, | |
| "eval_recall": 0.4014084507042254, | |
| "eval_runtime": 0.1125, | |
| "eval_samples_per_second": 808.798, | |
| "step": 224 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.899155227032735, | |
| "eval_f1": 0.49295774647887325, | |
| "eval_loss": 0.4225572347640991, | |
| "eval_precision": 0.49295774647887325, | |
| "eval_recall": 0.49295774647887325, | |
| "eval_runtime": 0.1126, | |
| "eval_samples_per_second": 808.356, | |
| "step": 256 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.8922914466737064, | |
| "eval_f1": 0.4901960784313726, | |
| "eval_loss": 0.4346790611743927, | |
| "eval_precision": 0.4573170731707317, | |
| "eval_recall": 0.528169014084507, | |
| "eval_runtime": 0.1123, | |
| "eval_samples_per_second": 810.599, | |
| "step": 288 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.8870116156282999, | |
| "eval_f1": 0.47647058823529415, | |
| "eval_loss": 0.48350322246551514, | |
| "eval_precision": 0.4090909090909091, | |
| "eval_recall": 0.5704225352112676, | |
| "eval_runtime": 0.1129, | |
| "eval_samples_per_second": 805.916, | |
| "step": 320 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "step": 320, | |
| "total_flos": 201896658999468.0, | |
| "train_runtime": 25.0952, | |
| "train_samples_per_second": 12.751 | |
| } | |
| ], | |
| "max_steps": 320, | |
| "num_train_epochs": 10, | |
| "total_flos": 201896658999468.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |