| { | |
| "best_metric": 0.27679798007011414, | |
| "best_model_checkpoint": "spa_en_mBERT/checkpoint-4480", | |
| "epoch": 6.0, | |
| "global_step": 5376, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.56, | |
| "learning_rate": 1.988839285714286e-05, | |
| "loss": 1.015, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.8975234842015372, | |
| "eval_f1": 0.7030225599300675, | |
| "eval_loss": 0.40301570296287537, | |
| "eval_precision": 0.7149695684879983, | |
| "eval_recall": 0.691468253968254, | |
| "eval_runtime": 5.8245, | |
| "eval_samples_per_second": 283.973, | |
| "eval_steps_per_second": 17.856, | |
| "step": 896 | |
| }, | |
| { | |
| "epoch": 1.12, | |
| "learning_rate": 1.9776785714285716e-05, | |
| "loss": 0.466, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 1.67, | |
| "learning_rate": 1.9665178571428575e-05, | |
| "loss": 0.3444, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.9197465890810875, | |
| "eval_f1": 0.772121694173792, | |
| "eval_loss": 0.30006563663482666, | |
| "eval_precision": 0.7738142686329215, | |
| "eval_recall": 0.770436507936508, | |
| "eval_runtime": 5.9225, | |
| "eval_samples_per_second": 279.276, | |
| "eval_steps_per_second": 17.56, | |
| "step": 1792 | |
| }, | |
| { | |
| "epoch": 2.23, | |
| "learning_rate": 1.955357142857143e-05, | |
| "loss": 0.2916, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 2.79, | |
| "learning_rate": 1.944196428571429e-05, | |
| "loss": 0.2491, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.9214545310110619, | |
| "eval_f1": 0.7768938768773725, | |
| "eval_loss": 0.2882336974143982, | |
| "eval_precision": 0.7754859967051071, | |
| "eval_recall": 0.7783068783068783, | |
| "eval_runtime": 5.8599, | |
| "eval_samples_per_second": 282.259, | |
| "eval_steps_per_second": 17.748, | |
| "step": 2688 | |
| }, | |
| { | |
| "epoch": 3.35, | |
| "learning_rate": 1.9330357142857144e-05, | |
| "loss": 0.2111, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 3.91, | |
| "learning_rate": 1.9218750000000003e-05, | |
| "loss": 0.1889, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.9311659682640557, | |
| "eval_f1": 0.8087478559176673, | |
| "eval_loss": 0.279913067817688, | |
| "eval_precision": 0.8067254540668597, | |
| "eval_recall": 0.8107804232804233, | |
| "eval_runtime": 5.8665, | |
| "eval_samples_per_second": 281.939, | |
| "eval_steps_per_second": 17.728, | |
| "step": 3584 | |
| }, | |
| { | |
| "epoch": 4.46, | |
| "learning_rate": 1.910714285714286e-05, | |
| "loss": 0.1683, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.9332115266220483, | |
| "eval_f1": 0.8155864706270193, | |
| "eval_loss": 0.27679798007011414, | |
| "eval_precision": 0.8130669120546865, | |
| "eval_recall": 0.8181216931216931, | |
| "eval_runtime": 6.0326, | |
| "eval_samples_per_second": 274.178, | |
| "eval_steps_per_second": 17.24, | |
| "step": 4480 | |
| }, | |
| { | |
| "epoch": 5.02, | |
| "learning_rate": 1.8995535714285717e-05, | |
| "loss": 0.1568, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 5.58, | |
| "learning_rate": 1.8883928571428573e-05, | |
| "loss": 0.1313, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.9282068595714257, | |
| "eval_f1": 0.7986634908032288, | |
| "eval_loss": 0.30244389176368713, | |
| "eval_precision": 0.7989806724913953, | |
| "eval_recall": 0.7983465608465609, | |
| "eval_runtime": 5.8739, | |
| "eval_samples_per_second": 281.583, | |
| "eval_steps_per_second": 17.705, | |
| "step": 5376 | |
| } | |
| ], | |
| "max_steps": 89600, | |
| "num_train_epochs": 100, | |
| "total_flos": 3919265715030336.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |