| { | |
| "best_metric": 0.8242820390801596, | |
| "best_model_checkpoint": "turkish_multilabel_intent_bert-base-turkish-128k-uncased/checkpoint-384", | |
| "epoch": 2.887218045112782, | |
| "global_step": 384, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.24, | |
| "learning_rate": 4.7987362585716124e-05, | |
| "loss": 0.0139, | |
| "step": 32 | |
| }, | |
| { | |
| "epoch": 0.24, | |
| "eval_loss": 0.009882427752017975, | |
| "eval_macro f1": 0.3392960248919277, | |
| "eval_micro f1": 0.7193911317008603, | |
| "eval_runtime": 2.3212, | |
| "eval_samples_per_second": 461.408, | |
| "eval_steps_per_second": 7.324, | |
| "step": 32 | |
| }, | |
| { | |
| "epoch": 0.48, | |
| "learning_rate": 4.491617138023029e-05, | |
| "loss": 0.0082, | |
| "step": 64 | |
| }, | |
| { | |
| "epoch": 0.48, | |
| "eval_loss": 0.00571652315557003, | |
| "eval_macro f1": 0.5888766985486856, | |
| "eval_micro f1": 0.8291472868217056, | |
| "eval_runtime": 2.3143, | |
| "eval_samples_per_second": 462.783, | |
| "eval_steps_per_second": 7.346, | |
| "step": 64 | |
| }, | |
| { | |
| "epoch": 0.72, | |
| "learning_rate": 4.184498017474446e-05, | |
| "loss": 0.0062, | |
| "step": 96 | |
| }, | |
| { | |
| "epoch": 0.72, | |
| "eval_loss": 0.004936754237860441, | |
| "eval_macro f1": 0.6479513036422692, | |
| "eval_micro f1": 0.8529040404040404, | |
| "eval_runtime": 2.335, | |
| "eval_samples_per_second": 458.676, | |
| "eval_steps_per_second": 7.281, | |
| "step": 96 | |
| }, | |
| { | |
| "epoch": 0.96, | |
| "learning_rate": 3.877378896925863e-05, | |
| "loss": 0.0046, | |
| "step": 128 | |
| }, | |
| { | |
| "epoch": 0.96, | |
| "eval_loss": 0.0039069755002856255, | |
| "eval_macro f1": 0.7036941962393284, | |
| "eval_micro f1": 0.8735053492762743, | |
| "eval_runtime": 2.3196, | |
| "eval_samples_per_second": 461.727, | |
| "eval_steps_per_second": 7.329, | |
| "step": 128 | |
| }, | |
| { | |
| "epoch": 1.2, | |
| "learning_rate": 3.57025977637728e-05, | |
| "loss": 0.0035, | |
| "step": 160 | |
| }, | |
| { | |
| "epoch": 1.2, | |
| "eval_loss": 0.003501879284158349, | |
| "eval_macro f1": 0.7315796800388726, | |
| "eval_micro f1": 0.8865718799368089, | |
| "eval_runtime": 2.316, | |
| "eval_samples_per_second": 462.435, | |
| "eval_steps_per_second": 7.34, | |
| "step": 160 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "learning_rate": 3.263140655828696e-05, | |
| "loss": 0.0037, | |
| "step": 192 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "eval_loss": 0.0034342026337981224, | |
| "eval_macro f1": 0.7462213705474623, | |
| "eval_micro f1": 0.8902361199744736, | |
| "eval_runtime": 2.392, | |
| "eval_samples_per_second": 447.74, | |
| "eval_steps_per_second": 7.107, | |
| "step": 192 | |
| }, | |
| { | |
| "epoch": 1.68, | |
| "learning_rate": 2.956021535280113e-05, | |
| "loss": 0.0032, | |
| "step": 224 | |
| }, | |
| { | |
| "epoch": 1.68, | |
| "eval_loss": 0.0032742032781243324, | |
| "eval_macro f1": 0.7279673266730304, | |
| "eval_micro f1": 0.8998085513720486, | |
| "eval_runtime": 2.3105, | |
| "eval_samples_per_second": 463.546, | |
| "eval_steps_per_second": 7.358, | |
| "step": 224 | |
| }, | |
| { | |
| "epoch": 1.92, | |
| "learning_rate": 2.64890241473153e-05, | |
| "loss": 0.0033, | |
| "step": 256 | |
| }, | |
| { | |
| "epoch": 1.92, | |
| "eval_loss": 0.003130522323772311, | |
| "eval_macro f1": 0.7717739019762423, | |
| "eval_micro f1": 0.912258064516129, | |
| "eval_runtime": 2.3, | |
| "eval_samples_per_second": 465.662, | |
| "eval_steps_per_second": 7.391, | |
| "step": 256 | |
| }, | |
| { | |
| "epoch": 2.17, | |
| "learning_rate": 2.3417832941829465e-05, | |
| "loss": 0.0025, | |
| "step": 288 | |
| }, | |
| { | |
| "epoch": 2.17, | |
| "eval_loss": 0.0031702849082648754, | |
| "eval_macro f1": 0.7845634595933292, | |
| "eval_micro f1": 0.9168036829990136, | |
| "eval_runtime": 2.3461, | |
| "eval_samples_per_second": 456.499, | |
| "eval_steps_per_second": 7.246, | |
| "step": 288 | |
| }, | |
| { | |
| "epoch": 2.41, | |
| "learning_rate": 2.0346641736343635e-05, | |
| "loss": 0.0022, | |
| "step": 320 | |
| }, | |
| { | |
| "epoch": 2.41, | |
| "eval_loss": 0.0030924060847610235, | |
| "eval_macro f1": 0.7838887334413882, | |
| "eval_micro f1": 0.9131561892417368, | |
| "eval_runtime": 2.2918, | |
| "eval_samples_per_second": 467.308, | |
| "eval_steps_per_second": 7.418, | |
| "step": 320 | |
| }, | |
| { | |
| "epoch": 2.65, | |
| "learning_rate": 1.7275450530857802e-05, | |
| "loss": 0.0022, | |
| "step": 352 | |
| }, | |
| { | |
| "epoch": 2.65, | |
| "eval_loss": 0.0030099288560450077, | |
| "eval_macro f1": 0.7712848231573721, | |
| "eval_micro f1": 0.908565928777671, | |
| "eval_runtime": 2.3124, | |
| "eval_samples_per_second": 463.146, | |
| "eval_steps_per_second": 7.352, | |
| "step": 352 | |
| }, | |
| { | |
| "epoch": 2.89, | |
| "learning_rate": 1.420425932537197e-05, | |
| "loss": 0.0022, | |
| "step": 384 | |
| }, | |
| { | |
| "epoch": 2.89, | |
| "eval_loss": 0.0029520909301936626, | |
| "eval_macro f1": 0.8242820390801596, | |
| "eval_micro f1": 0.913988964621876, | |
| "eval_runtime": 2.3289, | |
| "eval_samples_per_second": 459.872, | |
| "eval_steps_per_second": 7.3, | |
| "step": 384 | |
| } | |
| ], | |
| "max_steps": 532, | |
| "num_train_epochs": 4, | |
| "total_flos": 630598146840000.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |