| { | |
| "best_metric": 0.3130991458892822, | |
| "best_model_checkpoint": "/gdrive/MyDrive/Marefa/Tebyan/models/huggingface/model-xlm-roberta-large/checkpoint-13000", | |
| "epoch": 9.0, | |
| "global_step": 58500, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "learning_rate": 1.8e-05, | |
| "loss": 0.4403, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.900120719929763, | |
| "eval_f1": 0.7773765268189059, | |
| "eval_loss": 0.3497047424316406, | |
| "eval_precision": 0.7735151130839146, | |
| "eval_recall": 0.7812766865926558, | |
| "eval_runtime": 26.5811, | |
| "eval_samples_per_second": 70.99, | |
| "eval_steps_per_second": 35.514, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "learning_rate": 1.6000000000000003e-05, | |
| "loss": 0.307, | |
| "step": 13000 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.904587357330992, | |
| "eval_f1": 0.7846807172066689, | |
| "eval_loss": 0.3130991458892822, | |
| "eval_precision": 0.7710179270554296, | |
| "eval_recall": 0.798836464560205, | |
| "eval_runtime": 26.8623, | |
| "eval_samples_per_second": 70.247, | |
| "eval_steps_per_second": 35.142, | |
| "step": 13000 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "learning_rate": 1.4e-05, | |
| "loss": 0.2386, | |
| "step": 19500 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.9074187884108867, | |
| "eval_f1": 0.7895801055644548, | |
| "eval_loss": 0.348012775182724, | |
| "eval_precision": 0.7771517187903851, | |
| "eval_recall": 0.8024124679760888, | |
| "eval_runtime": 26.5101, | |
| "eval_samples_per_second": 71.18, | |
| "eval_steps_per_second": 35.609, | |
| "step": 19500 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "learning_rate": 1.2e-05, | |
| "loss": 0.1883, | |
| "step": 26000 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.9088235294117647, | |
| "eval_f1": 0.7946725265301746, | |
| "eval_loss": 0.3668019771575928, | |
| "eval_precision": 0.7980086114101184, | |
| "eval_recall": 0.791364218616567, | |
| "eval_runtime": 26.9144, | |
| "eval_samples_per_second": 70.111, | |
| "eval_steps_per_second": 35.074, | |
| "step": 26000 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "learning_rate": 1e-05, | |
| "loss": 0.1439, | |
| "step": 32500 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.9110074626865672, | |
| "eval_f1": 0.801425039215165, | |
| "eval_loss": 0.40606749057769775, | |
| "eval_precision": 0.7984319542300153, | |
| "eval_recall": 0.8044406490179334, | |
| "eval_runtime": 26.8012, | |
| "eval_samples_per_second": 70.407, | |
| "eval_steps_per_second": 35.222, | |
| "step": 32500 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "learning_rate": 8.000000000000001e-06, | |
| "loss": 0.1108, | |
| "step": 39000 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.9115561896400352, | |
| "eval_f1": 0.8033741926980361, | |
| "eval_loss": 0.46604597568511963, | |
| "eval_precision": 0.7936871712068337, | |
| "eval_recall": 0.8133005977796754, | |
| "eval_runtime": 26.6526, | |
| "eval_samples_per_second": 70.8, | |
| "eval_steps_per_second": 35.419, | |
| "step": 39000 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "learning_rate": 6e-06, | |
| "loss": 0.0825, | |
| "step": 45500 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.9102502194907814, | |
| "eval_f1": 0.8003274619061452, | |
| "eval_loss": 0.5183274149894714, | |
| "eval_precision": 0.7920652344362553, | |
| "eval_recall": 0.8087638770281811, | |
| "eval_runtime": 26.7116, | |
| "eval_samples_per_second": 70.643, | |
| "eval_steps_per_second": 35.34, | |
| "step": 45500 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "learning_rate": 4.000000000000001e-06, | |
| "loss": 0.0601, | |
| "step": 52000 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.9106014047410009, | |
| "eval_f1": 0.8013862969874699, | |
| "eval_loss": 0.5683603882789612, | |
| "eval_precision": 0.800575263662512, | |
| "eval_recall": 0.802198975234842, | |
| "eval_runtime": 26.5594, | |
| "eval_samples_per_second": 71.048, | |
| "eval_steps_per_second": 35.543, | |
| "step": 52000 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "learning_rate": 2.0000000000000003e-06, | |
| "loss": 0.0431, | |
| "step": 58500 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.91078797190518, | |
| "eval_f1": 0.8022889236230693, | |
| "eval_loss": 0.6140836477279663, | |
| "eval_precision": 0.7964862448056388, | |
| "eval_recall": 0.8081767719897524, | |
| "eval_runtime": 26.6356, | |
| "eval_samples_per_second": 70.845, | |
| "eval_steps_per_second": 35.441, | |
| "step": 58500 | |
| } | |
| ], | |
| "max_steps": 65000, | |
| "num_train_epochs": 10, | |
| "total_flos": 2.5323970171833972e+16, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |