{ "best_metric": 0.9132375276225795, "best_model_checkpoint": "./save_models/stsb/roberta-base_lr1e-05_run0/checkpoint-2916", "epoch": 10.0, "eval_steps": 500, "global_step": 3240, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_averaged_scores": 0.8719844165680126, "eval_loss": 0.5549536347389221, "eval_pearson": 0.8792634862673233, "eval_runtime": 1.0963, "eval_samples_per_second": 524.504, "eval_spearmanr": 0.8647053468687018, "eval_steps_per_second": 32.838, "step": 324 }, { "epoch": 1.54, "learning_rate": 8.998357963875205e-06, "loss": 1.9846, "step": 500 }, { "epoch": 2.0, "eval_averaged_scores": 0.8945047640614983, "eval_loss": 0.603453516960144, "eval_pearson": 0.9005924807835378, "eval_runtime": 0.704, "eval_samples_per_second": 816.784, "eval_spearmanr": 0.8884170473394587, "eval_steps_per_second": 51.138, "step": 648 }, { "epoch": 3.0, "eval_averaged_scores": 0.9062316400464019, "eval_loss": 0.4641549587249756, "eval_pearson": 0.9128021174279124, "eval_runtime": 0.7081, "eval_samples_per_second": 811.986, "eval_spearmanr": 0.8996611626648913, "eval_steps_per_second": 50.837, "step": 972 }, { "epoch": 3.09, "learning_rate": 7.35632183908046e-06, "loss": 0.3739, "step": 1000 }, { "epoch": 4.0, "eval_averaged_scores": 0.9065076507852758, "eval_loss": 0.4377610683441162, "eval_pearson": 0.9127118914783907, "eval_runtime": 0.6286, "eval_samples_per_second": 914.771, "eval_spearmanr": 0.9003034100921611, "eval_steps_per_second": 57.273, "step": 1296 }, { "epoch": 4.63, "learning_rate": 5.7142857142857145e-06, "loss": 0.2485, "step": 1500 }, { "epoch": 5.0, "eval_averaged_scores": 0.908379700337028, "eval_loss": 0.4117390811443329, "eval_pearson": 0.9141856508223978, "eval_runtime": 0.6332, "eval_samples_per_second": 908.107, "eval_spearmanr": 0.9025737498516583, "eval_steps_per_second": 56.855, "step": 1620 }, { "epoch": 6.0, "eval_averaged_scores": 0.9116822332416219, "eval_loss": 0.4102296233177185, "eval_pearson": 0.9173376535815415, "eval_runtime": 0.617, "eval_samples_per_second": 931.917, "eval_spearmanr": 0.9060268129017023, "eval_steps_per_second": 58.346, "step": 1944 }, { "epoch": 6.17, "learning_rate": 4.072249589490969e-06, "loss": 0.1894, "step": 2000 }, { "epoch": 7.0, "eval_averaged_scores": 0.9117323593371983, "eval_loss": 0.402465283870697, "eval_pearson": 0.9170297139907337, "eval_runtime": 0.6389, "eval_samples_per_second": 899.99, "eval_spearmanr": 0.9064350046836629, "eval_steps_per_second": 56.347, "step": 2268 }, { "epoch": 7.72, "learning_rate": 2.4302134646962236e-06, "loss": 0.1519, "step": 2500 }, { "epoch": 8.0, "eval_averaged_scores": 0.9119600828390606, "eval_loss": 0.4155682921409607, "eval_pearson": 0.9177323566058198, "eval_runtime": 0.6403, "eval_samples_per_second": 898.065, "eval_spearmanr": 0.9061878090723013, "eval_steps_per_second": 56.227, "step": 2592 }, { "epoch": 9.0, "eval_averaged_scores": 0.9132375276225795, "eval_loss": 0.39730867743492126, "eval_pearson": 0.9183296123362426, "eval_runtime": 0.6124, "eval_samples_per_second": 938.861, "eval_spearmanr": 0.9081454429089164, "eval_steps_per_second": 58.781, "step": 2916 }, { "epoch": 9.26, "learning_rate": 7.881773399014779e-07, "loss": 0.1262, "step": 3000 }, { "epoch": 10.0, "eval_averaged_scores": 0.9126844528170279, "eval_loss": 0.41949743032455444, "eval_pearson": 0.9177749306754028, "eval_runtime": 0.6141, "eval_samples_per_second": 936.342, "eval_spearmanr": 0.907593974958653, "eval_steps_per_second": 58.623, "step": 3240 }, { "epoch": 10.0, "step": 3240, "total_flos": 1693845460370892.0, "train_loss": 0.4830472233854694, "train_runtime": 291.8592, "train_samples_per_second": 177.277, "train_steps_per_second": 11.101 } ], "logging_steps": 500, "max_steps": 3240, "num_train_epochs": 10, "save_steps": 500, "total_flos": 1693845460370892.0, "trial_name": null, "trial_params": null }