| { | |
| "best_metric": 0.8548645464866416, | |
| "best_model_checkpoint": "result/InfoCSE-bert-base", | |
| "epoch": 2.0, | |
| "global_step": 31252, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.01, | |
| "eval_avg_sts": 0.645032772395593, | |
| "eval_sickr_spearman": 0.6463705264094609, | |
| "eval_stsb_spearman": 0.643695018381725, | |
| "step": 125 | |
| }, | |
| { | |
| "epoch": 0.02, | |
| "eval_avg_sts": 0.685240727331801, | |
| "eval_sickr_spearman": 0.669725073110526, | |
| "eval_stsb_spearman": 0.700756381553076, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 0.02, | |
| "eval_avg_sts": 0.7027556246143734, | |
| "eval_sickr_spearman": 0.6818145493736003, | |
| "eval_stsb_spearman": 0.7236966998551464, | |
| "step": 375 | |
| }, | |
| { | |
| "epoch": 0.03, | |
| "learning_rate": 6.888007167541277e-06, | |
| "loss": 0.0008, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.03, | |
| "eval_avg_sts": 0.7085517582757557, | |
| "eval_sickr_spearman": 0.6868034438177743, | |
| "eval_stsb_spearman": 0.730300072733737, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.04, | |
| "eval_avg_sts": 0.7152446421256347, | |
| "eval_sickr_spearman": 0.6908805158322469, | |
| "eval_stsb_spearman": 0.7396087684190223, | |
| "step": 625 | |
| }, | |
| { | |
| "epoch": 0.05, | |
| "eval_avg_sts": 0.744333698385975, | |
| "eval_sickr_spearman": 0.7107611650906991, | |
| "eval_stsb_spearman": 0.7779062316812507, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 0.06, | |
| "eval_avg_sts": 0.749906268768782, | |
| "eval_sickr_spearman": 0.7164115438638786, | |
| "eval_stsb_spearman": 0.7834009936736853, | |
| "step": 875 | |
| }, | |
| { | |
| "epoch": 0.06, | |
| "learning_rate": 6.776014335082554e-06, | |
| "loss": 0.0003, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.06, | |
| "eval_avg_sts": 0.7527465185576756, | |
| "eval_sickr_spearman": 0.7194187230938174, | |
| "eval_stsb_spearman": 0.7860743140215339, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.07, | |
| "eval_avg_sts": 0.7563795190354858, | |
| "eval_sickr_spearman": 0.7197145466475747, | |
| "eval_stsb_spearman": 0.793044491423397, | |
| "step": 1125 | |
| }, | |
| { | |
| "epoch": 0.08, | |
| "eval_avg_sts": 0.7577088125126856, | |
| "eval_sickr_spearman": 0.7209790134240346, | |
| "eval_stsb_spearman": 0.7944386116013368, | |
| "step": 1250 | |
| }, | |
| { | |
| "epoch": 0.09, | |
| "eval_avg_sts": 0.7618327362445115, | |
| "eval_sickr_spearman": 0.7205304029366025, | |
| "eval_stsb_spearman": 0.8031350695524205, | |
| "step": 1375 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "learning_rate": 6.6640215026238325e-06, | |
| "loss": 0.0004, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "eval_avg_sts": 0.7526454517508075, | |
| "eval_sickr_spearman": 0.7131317881332785, | |
| "eval_stsb_spearman": 0.7921591153683366, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "eval_avg_sts": 0.7584465941723788, | |
| "eval_sickr_spearman": 0.7183862465373038, | |
| "eval_stsb_spearman": 0.798506941807454, | |
| "step": 1625 | |
| }, | |
| { | |
| "epoch": 0.11, | |
| "eval_avg_sts": 0.7600830398569421, | |
| "eval_sickr_spearman": 0.7199089285150947, | |
| "eval_stsb_spearman": 0.8002571511987896, | |
| "step": 1750 | |
| }, | |
| { | |
| "epoch": 0.12, | |
| "eval_avg_sts": 0.753643480678329, | |
| "eval_sickr_spearman": 0.7154178764373269, | |
| "eval_stsb_spearman": 0.7918690849193311, | |
| "step": 1875 | |
| }, | |
| { | |
| "epoch": 0.13, | |
| "learning_rate": 6.55202867016511e-06, | |
| "loss": 0.0002, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 0.13, | |
| "eval_avg_sts": 0.7563852037282979, | |
| "eval_sickr_spearman": 0.7193429780468495, | |
| "eval_stsb_spearman": 0.7934274294097461, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 0.14, | |
| "eval_avg_sts": 0.7664707372188553, | |
| "eval_sickr_spearman": 0.7240147231282276, | |
| "eval_stsb_spearman": 0.8089267513094829, | |
| "step": 2125 | |
| }, | |
| { | |
| "epoch": 0.14, | |
| "eval_avg_sts": 0.7706419135337745, | |
| "eval_sickr_spearman": 0.7288192261739805, | |
| "eval_stsb_spearman": 0.8124646008935686, | |
| "step": 2250 | |
| }, | |
| { | |
| "epoch": 0.15, | |
| "eval_avg_sts": 0.7712663844837009, | |
| "eval_sickr_spearman": 0.7299219242007967, | |
| "eval_stsb_spearman": 0.8126108447666052, | |
| "step": 2375 | |
| }, | |
| { | |
| "epoch": 0.16, | |
| "learning_rate": 6.440035837706387e-06, | |
| "loss": 0.0002, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 0.16, | |
| "eval_avg_sts": 0.7728606127631258, | |
| "eval_sickr_spearman": 0.7312590620337324, | |
| "eval_stsb_spearman": 0.8144621634925192, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 0.17, | |
| "eval_avg_sts": 0.7729813550763709, | |
| "eval_sickr_spearman": 0.7313422519014231, | |
| "eval_stsb_spearman": 0.8146204582513188, | |
| "step": 2625 | |
| }, | |
| { | |
| "epoch": 0.18, | |
| "eval_avg_sts": 0.7754932728462534, | |
| "eval_sickr_spearman": 0.7312568526030662, | |
| "eval_stsb_spearman": 0.8197296930894405, | |
| "step": 2750 | |
| }, | |
| { | |
| "epoch": 0.18, | |
| "eval_avg_sts": 0.7712885427125948, | |
| "eval_sickr_spearman": 0.7266254056157947, | |
| "eval_stsb_spearman": 0.8159516798093949, | |
| "step": 2875 | |
| }, | |
| { | |
| "epoch": 0.19, | |
| "learning_rate": 6.328043005247664e-06, | |
| "loss": 0.0002, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 0.19, | |
| "eval_avg_sts": 0.7716849957034901, | |
| "eval_sickr_spearman": 0.7262548936993011, | |
| "eval_stsb_spearman": 0.8171150977076791, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 0.2, | |
| "eval_avg_sts": 0.7711561198226983, | |
| "eval_sickr_spearman": 0.7262503241591916, | |
| "eval_stsb_spearman": 0.816061915486205, | |
| "step": 3125 | |
| }, | |
| { | |
| "epoch": 0.21, | |
| "eval_avg_sts": 0.7783568816799603, | |
| "eval_sickr_spearman": 0.7303159233258935, | |
| "eval_stsb_spearman": 0.8263978400340272, | |
| "step": 3250 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "eval_avg_sts": 0.7809228297940308, | |
| "eval_sickr_spearman": 0.7337628272894983, | |
| "eval_stsb_spearman": 0.8280828322985634, | |
| "step": 3375 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "learning_rate": 6.2160501727889415e-06, | |
| "loss": 0.0001, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "eval_avg_sts": 0.7797812899347809, | |
| "eval_sickr_spearman": 0.7324181485736369, | |
| "eval_stsb_spearman": 0.8271444312959251, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 0.23, | |
| "eval_avg_sts": 0.780044187865891, | |
| "eval_sickr_spearman": 0.7338939041653229, | |
| "eval_stsb_spearman": 0.8261944715664592, | |
| "step": 3625 | |
| }, | |
| { | |
| "epoch": 0.24, | |
| "eval_avg_sts": 0.7787673562775448, | |
| "eval_sickr_spearman": 0.7328702653314738, | |
| "eval_stsb_spearman": 0.8246644472236156, | |
| "step": 3750 | |
| }, | |
| { | |
| "epoch": 0.25, | |
| "eval_avg_sts": 0.779541327716536, | |
| "eval_sickr_spearman": 0.7329598913667574, | |
| "eval_stsb_spearman": 0.8261227640663145, | |
| "step": 3875 | |
| }, | |
| { | |
| "epoch": 0.26, | |
| "learning_rate": 6.104057340330219e-06, | |
| "loss": 0.0003, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 0.26, | |
| "eval_avg_sts": 0.7747719384340315, | |
| "eval_sickr_spearman": 0.7285930957484098, | |
| "eval_stsb_spearman": 0.8209507811196531, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 0.26, | |
| "eval_avg_sts": 0.7765396311685044, | |
| "eval_sickr_spearman": 0.7301922912707919, | |
| "eval_stsb_spearman": 0.8228869710662171, | |
| "step": 4125 | |
| }, | |
| { | |
| "epoch": 0.27, | |
| "eval_avg_sts": 0.7728155845030844, | |
| "eval_sickr_spearman": 0.7257823156922516, | |
| "eval_stsb_spearman": 0.8198488533139171, | |
| "step": 4250 | |
| }, | |
| { | |
| "epoch": 0.28, | |
| "eval_avg_sts": 0.7734186821765212, | |
| "eval_sickr_spearman": 0.7266760303967105, | |
| "eval_stsb_spearman": 0.8201613339563318, | |
| "step": 4375 | |
| }, | |
| { | |
| "epoch": 0.29, | |
| "learning_rate": 5.992064507871497e-06, | |
| "loss": 0.0004, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 0.29, | |
| "eval_avg_sts": 0.7731296739509669, | |
| "eval_sickr_spearman": 0.7214541370794603, | |
| "eval_stsb_spearman": 0.8248052108224735, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 0.3, | |
| "eval_avg_sts": 0.7728203601265164, | |
| "eval_sickr_spearman": 0.7219969845879138, | |
| "eval_stsb_spearman": 0.8236437356651191, | |
| "step": 4625 | |
| }, | |
| { | |
| "epoch": 0.3, | |
| "eval_avg_sts": 0.773140320693449, | |
| "eval_sickr_spearman": 0.7226297943493609, | |
| "eval_stsb_spearman": 0.823650847037537, | |
| "step": 4750 | |
| }, | |
| { | |
| "epoch": 0.31, | |
| "eval_avg_sts": 0.7776841987101548, | |
| "eval_sickr_spearman": 0.7260857761911376, | |
| "eval_stsb_spearman": 0.8292826212291721, | |
| "step": 4875 | |
| }, | |
| { | |
| "epoch": 0.32, | |
| "learning_rate": 5.880071675412773e-06, | |
| "loss": 0.0001, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 0.32, | |
| "eval_avg_sts": 0.7787697170418183, | |
| "eval_sickr_spearman": 0.7268813633553585, | |
| "eval_stsb_spearman": 0.8306580707282781, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 0.33, | |
| "eval_avg_sts": 0.7794054673251014, | |
| "eval_sickr_spearman": 0.727022190544775, | |
| "eval_stsb_spearman": 0.8317887441054277, | |
| "step": 5125 | |
| }, | |
| { | |
| "epoch": 0.34, | |
| "eval_avg_sts": 0.7794784586068343, | |
| "eval_sickr_spearman": 0.7302013691489637, | |
| "eval_stsb_spearman": 0.8287555480647049, | |
| "step": 5250 | |
| }, | |
| { | |
| "epoch": 0.34, | |
| "eval_avg_sts": 0.7771717407788259, | |
| "eval_sickr_spearman": 0.7244288472848269, | |
| "eval_stsb_spearman": 0.829914634272825, | |
| "step": 5375 | |
| }, | |
| { | |
| "epoch": 0.35, | |
| "learning_rate": 5.7680788429540505e-06, | |
| "loss": 0.0003, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 0.35, | |
| "eval_avg_sts": 0.778478777290903, | |
| "eval_sickr_spearman": 0.7256252059594475, | |
| "eval_stsb_spearman": 0.8313323486223586, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 0.36, | |
| "eval_avg_sts": 0.7793214110914728, | |
| "eval_sickr_spearman": 0.726303453142855, | |
| "eval_stsb_spearman": 0.8323393690400904, | |
| "step": 5625 | |
| }, | |
| { | |
| "epoch": 0.37, | |
| "eval_avg_sts": 0.7791715295390024, | |
| "eval_sickr_spearman": 0.7257507592586067, | |
| "eval_stsb_spearman": 0.8325922998193981, | |
| "step": 5750 | |
| }, | |
| { | |
| "epoch": 0.38, | |
| "eval_avg_sts": 0.7800081020871235, | |
| "eval_sickr_spearman": 0.726603503433539, | |
| "eval_stsb_spearman": 0.8334127007407081, | |
| "step": 5875 | |
| }, | |
| { | |
| "epoch": 0.38, | |
| "learning_rate": 5.656086010495328e-06, | |
| "loss": 0.0001, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 0.38, | |
| "eval_avg_sts": 0.7802662913925068, | |
| "eval_sickr_spearman": 0.7272382344390437, | |
| "eval_stsb_spearman": 0.8332943483459699, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 0.39, | |
| "eval_avg_sts": 0.7788831909074992, | |
| "eval_sickr_spearman": 0.7254892779423776, | |
| "eval_stsb_spearman": 0.8322771038726209, | |
| "step": 6125 | |
| }, | |
| { | |
| "epoch": 0.4, | |
| "eval_avg_sts": 0.7790896526834474, | |
| "eval_sickr_spearman": 0.7246235173389557, | |
| "eval_stsb_spearman": 0.8335557880279391, | |
| "step": 6250 | |
| }, | |
| { | |
| "epoch": 0.41, | |
| "eval_avg_sts": 0.7811606337604482, | |
| "eval_sickr_spearman": 0.7249414832304759, | |
| "eval_stsb_spearman": 0.8373797842904204, | |
| "step": 6375 | |
| }, | |
| { | |
| "epoch": 0.42, | |
| "learning_rate": 5.544093178036605e-06, | |
| "loss": 0.0001, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 0.42, | |
| "eval_avg_sts": 0.7814213566702608, | |
| "eval_sickr_spearman": 0.7254279422258411, | |
| "eval_stsb_spearman": 0.8374147711146805, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 0.42, | |
| "eval_avg_sts": 0.7818500804137162, | |
| "eval_sickr_spearman": 0.726220023119657, | |
| "eval_stsb_spearman": 0.8374801377077753, | |
| "step": 6625 | |
| }, | |
| { | |
| "epoch": 0.43, | |
| "eval_avg_sts": 0.7832040571269738, | |
| "eval_sickr_spearman": 0.7301835015792287, | |
| "eval_stsb_spearman": 0.8362246126747188, | |
| "step": 6750 | |
| }, | |
| { | |
| "epoch": 0.44, | |
| "eval_avg_sts": 0.7841900708722672, | |
| "eval_sickr_spearman": 0.731056755034475, | |
| "eval_stsb_spearman": 0.8373233867100595, | |
| "step": 6875 | |
| }, | |
| { | |
| "epoch": 0.45, | |
| "learning_rate": 5.432100345577883e-06, | |
| "loss": 0.0001, | |
| "step": 7000 | |
| }, | |
| { | |
| "epoch": 0.45, | |
| "eval_avg_sts": 0.7862472754964975, | |
| "eval_sickr_spearman": 0.7333967342343369, | |
| "eval_stsb_spearman": 0.839097816758658, | |
| "step": 7000 | |
| }, | |
| { | |
| "epoch": 0.46, | |
| "eval_avg_sts": 0.7859634761320248, | |
| "eval_sickr_spearman": 0.7330241089493801, | |
| "eval_stsb_spearman": 0.8389028433146695, | |
| "step": 7125 | |
| }, | |
| { | |
| "epoch": 0.46, | |
| "eval_avg_sts": 0.7821803440191185, | |
| "eval_sickr_spearman": 0.7303841755210372, | |
| "eval_stsb_spearman": 0.8339765125171998, | |
| "step": 7250 | |
| }, | |
| { | |
| "epoch": 0.47, | |
| "eval_avg_sts": 0.7825744125697178, | |
| "eval_sickr_spearman": 0.7306357624303699, | |
| "eval_stsb_spearman": 0.8345130627090659, | |
| "step": 7375 | |
| }, | |
| { | |
| "epoch": 0.48, | |
| "learning_rate": 5.32010751311916e-06, | |
| "loss": 0.0001, | |
| "step": 7500 | |
| }, | |
| { | |
| "epoch": 0.48, | |
| "eval_avg_sts": 0.78116110534451, | |
| "eval_sickr_spearman": 0.7276775268927966, | |
| "eval_stsb_spearman": 0.8346446837962234, | |
| "step": 7500 | |
| }, | |
| { | |
| "epoch": 0.49, | |
| "eval_avg_sts": 0.7799908773501631, | |
| "eval_sickr_spearman": 0.7237501678215064, | |
| "eval_stsb_spearman": 0.83623158687882, | |
| "step": 7625 | |
| }, | |
| { | |
| "epoch": 0.5, | |
| "eval_avg_sts": 0.780269211830304, | |
| "eval_sickr_spearman": 0.7244608359983847, | |
| "eval_stsb_spearman": 0.8360775876622232, | |
| "step": 7750 | |
| }, | |
| { | |
| "epoch": 0.5, | |
| "eval_avg_sts": 0.7807594418954099, | |
| "eval_sickr_spearman": 0.7247573319875622, | |
| "eval_stsb_spearman": 0.8367615518032576, | |
| "step": 7875 | |
| }, | |
| { | |
| "epoch": 0.51, | |
| "learning_rate": 5.2081146806604376e-06, | |
| "loss": 0.0001, | |
| "step": 8000 | |
| }, | |
| { | |
| "epoch": 0.51, | |
| "eval_avg_sts": 0.7809657512161441, | |
| "eval_sickr_spearman": 0.7257775125821077, | |
| "eval_stsb_spearman": 0.8361539898501805, | |
| "step": 8000 | |
| }, | |
| { | |
| "epoch": 0.52, | |
| "eval_avg_sts": 0.7808305047079998, | |
| "eval_sickr_spearman": 0.7258256397457487, | |
| "eval_stsb_spearman": 0.8358353696702507, | |
| "step": 8125 | |
| }, | |
| { | |
| "epoch": 0.53, | |
| "eval_avg_sts": 0.7808244974473546, | |
| "eval_sickr_spearman": 0.7260765061885599, | |
| "eval_stsb_spearman": 0.8355724887061494, | |
| "step": 8250 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "eval_avg_sts": 0.7807531331871759, | |
| "eval_sickr_spearman": 0.725998455648723, | |
| "eval_stsb_spearman": 0.8355078107256287, | |
| "step": 8375 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "learning_rate": 5.096121848201715e-06, | |
| "loss": 0.0001, | |
| "step": 8500 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "eval_avg_sts": 0.7805553727181309, | |
| "eval_sickr_spearman": 0.7259074847425994, | |
| "eval_stsb_spearman": 0.8352032606936624, | |
| "step": 8500 | |
| }, | |
| { | |
| "epoch": 0.55, | |
| "eval_avg_sts": 0.7840901636781107, | |
| "eval_sickr_spearman": 0.727197936344937, | |
| "eval_stsb_spearman": 0.8409823910112844, | |
| "step": 8625 | |
| }, | |
| { | |
| "epoch": 0.56, | |
| "eval_avg_sts": 0.7841336470257416, | |
| "eval_sickr_spearman": 0.7241774524998998, | |
| "eval_stsb_spearman": 0.8440898415515834, | |
| "step": 8750 | |
| }, | |
| { | |
| "epoch": 0.57, | |
| "eval_avg_sts": 0.7848770188208263, | |
| "eval_sickr_spearman": 0.7246812987539857, | |
| "eval_stsb_spearman": 0.8450727388876668, | |
| "step": 8875 | |
| }, | |
| { | |
| "epoch": 0.58, | |
| "learning_rate": 4.984129015742992e-06, | |
| "loss": 0.0001, | |
| "step": 9000 | |
| }, | |
| { | |
| "epoch": 0.58, | |
| "eval_avg_sts": 0.7851602291221325, | |
| "eval_sickr_spearman": 0.7257603654788943, | |
| "eval_stsb_spearman": 0.8445600927653706, | |
| "step": 9000 | |
| }, | |
| { | |
| "epoch": 0.58, | |
| "eval_avg_sts": 0.7881113225894085, | |
| "eval_sickr_spearman": 0.7297208179790754, | |
| "eval_stsb_spearman": 0.8465018271997418, | |
| "step": 9125 | |
| }, | |
| { | |
| "epoch": 0.59, | |
| "eval_avg_sts": 0.7883865180777926, | |
| "eval_sickr_spearman": 0.7305029084037921, | |
| "eval_stsb_spearman": 0.8462701277517931, | |
| "step": 9250 | |
| }, | |
| { | |
| "epoch": 0.6, | |
| "eval_avg_sts": 0.7905936766250409, | |
| "eval_sickr_spearman": 0.7318727073857056, | |
| "eval_stsb_spearman": 0.8493146458643761, | |
| "step": 9375 | |
| }, | |
| { | |
| "epoch": 0.61, | |
| "learning_rate": 4.872136183284269e-06, | |
| "loss": 0.0002, | |
| "step": 9500 | |
| }, | |
| { | |
| "epoch": 0.61, | |
| "eval_avg_sts": 0.7894195399749903, | |
| "eval_sickr_spearman": 0.7297918559781024, | |
| "eval_stsb_spearman": 0.8490472239718782, | |
| "step": 9500 | |
| }, | |
| { | |
| "epoch": 0.62, | |
| "eval_avg_sts": 0.7888302258840285, | |
| "eval_sickr_spearman": 0.7290175946229199, | |
| "eval_stsb_spearman": 0.848642857145137, | |
| "step": 9625 | |
| }, | |
| { | |
| "epoch": 0.62, | |
| "eval_avg_sts": 0.7898168606884958, | |
| "eval_sickr_spearman": 0.7311126152054476, | |
| "eval_stsb_spearman": 0.848521106171544, | |
| "step": 9750 | |
| }, | |
| { | |
| "epoch": 0.63, | |
| "eval_avg_sts": 0.7916780015304804, | |
| "eval_sickr_spearman": 0.7336695508905056, | |
| "eval_stsb_spearman": 0.8496864521704552, | |
| "step": 9875 | |
| }, | |
| { | |
| "epoch": 0.64, | |
| "learning_rate": 4.760143350825547e-06, | |
| "loss": 0.0001, | |
| "step": 10000 | |
| }, | |
| { | |
| "epoch": 0.64, | |
| "eval_avg_sts": 0.7916349913886156, | |
| "eval_sickr_spearman": 0.7339293030870828, | |
| "eval_stsb_spearman": 0.8493406796901484, | |
| "step": 10000 | |
| }, | |
| { | |
| "epoch": 0.65, | |
| "eval_avg_sts": 0.791507759549186, | |
| "eval_sickr_spearman": 0.7339989962152694, | |
| "eval_stsb_spearman": 0.8490165228831026, | |
| "step": 10125 | |
| }, | |
| { | |
| "epoch": 0.66, | |
| "eval_avg_sts": 0.789931989918206, | |
| "eval_sickr_spearman": 0.7311775052234905, | |
| "eval_stsb_spearman": 0.8486864746129216, | |
| "step": 10250 | |
| }, | |
| { | |
| "epoch": 0.66, | |
| "eval_avg_sts": 0.7899616736779131, | |
| "eval_sickr_spearman": 0.7317643492208613, | |
| "eval_stsb_spearman": 0.8481589981349649, | |
| "step": 10375 | |
| }, | |
| { | |
| "epoch": 0.67, | |
| "learning_rate": 4.648150518366825e-06, | |
| "loss": 0.0001, | |
| "step": 10500 | |
| }, | |
| { | |
| "epoch": 0.67, | |
| "eval_avg_sts": 0.7926863693434811, | |
| "eval_sickr_spearman": 0.7347004424206716, | |
| "eval_stsb_spearman": 0.8506722962662906, | |
| "step": 10500 | |
| }, | |
| { | |
| "epoch": 0.68, | |
| "eval_avg_sts": 0.7925310701894714, | |
| "eval_sickr_spearman": 0.7345030826248625, | |
| "eval_stsb_spearman": 0.8505590577540805, | |
| "step": 10625 | |
| }, | |
| { | |
| "epoch": 0.69, | |
| "eval_avg_sts": 0.7921847237714013, | |
| "eval_sickr_spearman": 0.734286503995874, | |
| "eval_stsb_spearman": 0.8500829435469286, | |
| "step": 10750 | |
| }, | |
| { | |
| "epoch": 0.7, | |
| "eval_avg_sts": 0.792045037000692, | |
| "eval_sickr_spearman": 0.7345833425953655, | |
| "eval_stsb_spearman": 0.8495067314060183, | |
| "step": 10875 | |
| }, | |
| { | |
| "epoch": 0.7, | |
| "learning_rate": 4.536157685908102e-06, | |
| "loss": 0.0001, | |
| "step": 11000 | |
| }, | |
| { | |
| "epoch": 0.7, | |
| "eval_avg_sts": 0.7924996456713199, | |
| "eval_sickr_spearman": 0.7354074602338407, | |
| "eval_stsb_spearman": 0.8495918311087991, | |
| "step": 11000 | |
| }, | |
| { | |
| "epoch": 0.71, | |
| "eval_avg_sts": 0.7924266596358673, | |
| "eval_sickr_spearman": 0.7356516503535521, | |
| "eval_stsb_spearman": 0.8492016689181826, | |
| "step": 11125 | |
| }, | |
| { | |
| "epoch": 0.72, | |
| "eval_avg_sts": 0.7926706111519558, | |
| "eval_sickr_spearman": 0.7358917097985398, | |
| "eval_stsb_spearman": 0.8494495125053718, | |
| "step": 11250 | |
| }, | |
| { | |
| "epoch": 0.73, | |
| "eval_avg_sts": 0.7930288164708986, | |
| "eval_sickr_spearman": 0.7354914185991545, | |
| "eval_stsb_spearman": 0.8505662143426428, | |
| "step": 11375 | |
| }, | |
| { | |
| "epoch": 0.74, | |
| "learning_rate": 4.424164853449379e-06, | |
| "loss": 0.0002, | |
| "step": 11500 | |
| }, | |
| { | |
| "epoch": 0.74, | |
| "eval_avg_sts": 0.7926251189281965, | |
| "eval_sickr_spearman": 0.7351442017668584, | |
| "eval_stsb_spearman": 0.8501060360895348, | |
| "step": 11500 | |
| }, | |
| { | |
| "epoch": 0.74, | |
| "eval_avg_sts": 0.7932695687388167, | |
| "eval_sickr_spearman": 0.7365684199867013, | |
| "eval_stsb_spearman": 0.8499707174909322, | |
| "step": 11625 | |
| }, | |
| { | |
| "epoch": 0.75, | |
| "eval_avg_sts": 0.7935921856407616, | |
| "eval_sickr_spearman": 0.7367729844477262, | |
| "eval_stsb_spearman": 0.850411386833797, | |
| "step": 11750 | |
| }, | |
| { | |
| "epoch": 0.76, | |
| "eval_avg_sts": 0.794782209944985, | |
| "eval_sickr_spearman": 0.7389587838119719, | |
| "eval_stsb_spearman": 0.8506056360779983, | |
| "step": 11875 | |
| }, | |
| { | |
| "epoch": 0.77, | |
| "learning_rate": 4.312172020990656e-06, | |
| "loss": 0.0002, | |
| "step": 12000 | |
| }, | |
| { | |
| "epoch": 0.77, | |
| "eval_avg_sts": 0.7971707208949131, | |
| "eval_sickr_spearman": 0.7394768953031847, | |
| "eval_stsb_spearman": 0.8548645464866416, | |
| "step": 12000 | |
| }, | |
| { | |
| "epoch": 0.78, | |
| "eval_avg_sts": 0.797638118412404, | |
| "eval_sickr_spearman": 0.7421029957743136, | |
| "eval_stsb_spearman": 0.8531732410504944, | |
| "step": 12125 | |
| }, | |
| { | |
| "epoch": 0.78, | |
| "eval_avg_sts": 0.7969091025343611, | |
| "eval_sickr_spearman": 0.741429359576644, | |
| "eval_stsb_spearman": 0.8523888454920783, | |
| "step": 12250 | |
| }, | |
| { | |
| "epoch": 0.79, | |
| "eval_avg_sts": 0.7919648350492454, | |
| "eval_sickr_spearman": 0.7347034683800623, | |
| "eval_stsb_spearman": 0.8492262017184287, | |
| "step": 12375 | |
| }, | |
| { | |
| "epoch": 0.8, | |
| "learning_rate": 4.2001791885319345e-06, | |
| "loss": 0.0005, | |
| "step": 12500 | |
| }, | |
| { | |
| "epoch": 0.8, | |
| "eval_avg_sts": 0.7921636059370547, | |
| "eval_sickr_spearman": 0.7353516480939697, | |
| "eval_stsb_spearman": 0.8489755637801396, | |
| "step": 12500 | |
| }, | |
| { | |
| "epoch": 0.81, | |
| "eval_avg_sts": 0.7924202367929077, | |
| "eval_sickr_spearman": 0.736975675695795, | |
| "eval_stsb_spearman": 0.8478647978900204, | |
| "step": 12625 | |
| }, | |
| { | |
| "epoch": 0.82, | |
| "eval_avg_sts": 0.7890475112371416, | |
| "eval_sickr_spearman": 0.7355575093947334, | |
| "eval_stsb_spearman": 0.8425375130795496, | |
| "step": 12750 | |
| }, | |
| { | |
| "epoch": 0.82, | |
| "eval_avg_sts": 0.7892144058224184, | |
| "eval_sickr_spearman": 0.7356575101479275, | |
| "eval_stsb_spearman": 0.8427713014969095, | |
| "step": 12875 | |
| }, | |
| { | |
| "epoch": 0.83, | |
| "learning_rate": 4.088186356073212e-06, | |
| "loss": 0.0002, | |
| "step": 13000 | |
| }, | |
| { | |
| "epoch": 0.83, | |
| "eval_avg_sts": 0.7908518455947956, | |
| "eval_sickr_spearman": 0.73698621219475, | |
| "eval_stsb_spearman": 0.8447174789948412, | |
| "step": 13000 | |
| }, | |
| { | |
| "epoch": 0.84, | |
| "eval_avg_sts": 0.7910358332545967, | |
| "eval_sickr_spearman": 0.7372511340625426, | |
| "eval_stsb_spearman": 0.8448205324466508, | |
| "step": 13125 | |
| }, | |
| { | |
| "epoch": 0.85, | |
| "eval_avg_sts": 0.7910819619646265, | |
| "eval_sickr_spearman": 0.7366442130647706, | |
| "eval_stsb_spearman": 0.8455197108644826, | |
| "step": 13250 | |
| }, | |
| { | |
| "epoch": 0.86, | |
| "eval_avg_sts": 0.7913313391681369, | |
| "eval_sickr_spearman": 0.7369983463756739, | |
| "eval_stsb_spearman": 0.8456643319606, | |
| "step": 13375 | |
| }, | |
| { | |
| "epoch": 0.86, | |
| "learning_rate": 3.976193523614489e-06, | |
| "loss": 0.0002, | |
| "step": 13500 | |
| }, | |
| { | |
| "epoch": 0.86, | |
| "eval_avg_sts": 0.7912515138401426, | |
| "eval_sickr_spearman": 0.7371570411348254, | |
| "eval_stsb_spearman": 0.8453459865454599, | |
| "step": 13500 | |
| }, | |
| { | |
| "epoch": 0.87, | |
| "eval_avg_sts": 0.7912798783058242, | |
| "eval_sickr_spearman": 0.7375416261640404, | |
| "eval_stsb_spearman": 0.8450181304476081, | |
| "step": 13625 | |
| }, | |
| { | |
| "epoch": 0.88, | |
| "eval_avg_sts": 0.7915843291718891, | |
| "eval_sickr_spearman": 0.7376919154804402, | |
| "eval_stsb_spearman": 0.845476742863338, | |
| "step": 13750 | |
| }, | |
| { | |
| "epoch": 0.89, | |
| "eval_avg_sts": 0.7917255539871094, | |
| "eval_sickr_spearman": 0.7381062797925467, | |
| "eval_stsb_spearman": 0.8453448281816721, | |
| "step": 13875 | |
| }, | |
| { | |
| "epoch": 0.9, | |
| "learning_rate": 3.864200691155766e-06, | |
| "loss": 0.0001, | |
| "step": 14000 | |
| }, | |
| { | |
| "epoch": 0.9, | |
| "eval_avg_sts": 0.7916416194141285, | |
| "eval_sickr_spearman": 0.7380577683800943, | |
| "eval_stsb_spearman": 0.8452254704481627, | |
| "step": 14000 | |
| }, | |
| { | |
| "epoch": 0.9, | |
| "eval_avg_sts": 0.7924269371428458, | |
| "eval_sickr_spearman": 0.738714977941072, | |
| "eval_stsb_spearman": 0.8461388963446196, | |
| "step": 14125 | |
| }, | |
| { | |
| "epoch": 0.91, | |
| "eval_avg_sts": 0.7923356777507629, | |
| "eval_sickr_spearman": 0.7386597902055195, | |
| "eval_stsb_spearman": 0.8460115652960062, | |
| "step": 14250 | |
| }, | |
| { | |
| "epoch": 0.92, | |
| "eval_avg_sts": 0.7922805942330418, | |
| "eval_sickr_spearman": 0.7387613759850612, | |
| "eval_stsb_spearman": 0.8457998124810223, | |
| "step": 14375 | |
| }, | |
| { | |
| "epoch": 0.93, | |
| "learning_rate": 3.7522078586970435e-06, | |
| "loss": 0.0001, | |
| "step": 14500 | |
| }, | |
| { | |
| "epoch": 0.93, | |
| "eval_avg_sts": 0.7934966210957259, | |
| "eval_sickr_spearman": 0.7397510568301936, | |
| "eval_stsb_spearman": 0.8472421853612582, | |
| "step": 14500 | |
| }, | |
| { | |
| "epoch": 0.94, | |
| "eval_avg_sts": 0.7930449265696451, | |
| "eval_sickr_spearman": 0.7393639741837038, | |
| "eval_stsb_spearman": 0.8467258789555864, | |
| "step": 14625 | |
| }, | |
| { | |
| "epoch": 0.94, | |
| "eval_avg_sts": 0.7924737714972381, | |
| "eval_sickr_spearman": 0.7393996612920722, | |
| "eval_stsb_spearman": 0.845547881702404, | |
| "step": 14750 | |
| }, | |
| { | |
| "epoch": 0.95, | |
| "eval_avg_sts": 0.792308440851152, | |
| "eval_sickr_spearman": 0.739175211955052, | |
| "eval_stsb_spearman": 0.845441669747252, | |
| "step": 14875 | |
| }, | |
| { | |
| "epoch": 0.96, | |
| "learning_rate": 3.6402150262383203e-06, | |
| "loss": 0.0001, | |
| "step": 15000 | |
| }, | |
| { | |
| "epoch": 0.96, | |
| "eval_avg_sts": 0.7932488441451628, | |
| "eval_sickr_spearman": 0.7404715713828667, | |
| "eval_stsb_spearman": 0.8460261169074589, | |
| "step": 15000 | |
| }, | |
| { | |
| "epoch": 0.97, | |
| "eval_avg_sts": 0.7931158785146848, | |
| "eval_sickr_spearman": 0.7406130710077032, | |
| "eval_stsb_spearman": 0.8456186860216665, | |
| "step": 15125 | |
| }, | |
| { | |
| "epoch": 0.98, | |
| "eval_avg_sts": 0.7945903311020877, | |
| "eval_sickr_spearman": 0.7431428210893474, | |
| "eval_stsb_spearman": 0.8460378411148278, | |
| "step": 15250 | |
| }, | |
| { | |
| "epoch": 0.98, | |
| "eval_avg_sts": 0.7948596387785098, | |
| "eval_sickr_spearman": 0.7440196288461001, | |
| "eval_stsb_spearman": 0.8456996487109196, | |
| "step": 15375 | |
| }, | |
| { | |
| "epoch": 0.99, | |
| "learning_rate": 3.5282221937795976e-06, | |
| "loss": 0.0002, | |
| "step": 15500 | |
| }, | |
| { | |
| "epoch": 0.99, | |
| "eval_avg_sts": 0.7948372805541641, | |
| "eval_sickr_spearman": 0.744097679385937, | |
| "eval_stsb_spearman": 0.8455768817223914, | |
| "step": 15500 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_avg_sts": 0.7937246352478757, | |
| "eval_sickr_spearman": 0.7439027691763012, | |
| "eval_stsb_spearman": 0.8435465013194503, | |
| "step": 15625 | |
| }, | |
| { | |
| "epoch": 1.01, | |
| "eval_avg_sts": 0.7937099307469273, | |
| "eval_sickr_spearman": 0.7440485435691657, | |
| "eval_stsb_spearman": 0.8433713179246888, | |
| "step": 15750 | |
| }, | |
| { | |
| "epoch": 1.02, | |
| "eval_avg_sts": 0.7935877720189825, | |
| "eval_sickr_spearman": 0.7440728953375949, | |
| "eval_stsb_spearman": 0.84310264870037, | |
| "step": 15875 | |
| }, | |
| { | |
| "epoch": 1.02, | |
| "learning_rate": 3.4162293613208757e-06, | |
| "loss": 0.0001, | |
| "step": 16000 | |
| }, | |
| { | |
| "epoch": 1.02, | |
| "eval_avg_sts": 0.7935863758797379, | |
| "eval_sickr_spearman": 0.744390621073608, | |
| "eval_stsb_spearman": 0.8427821306858677, | |
| "step": 16000 | |
| }, | |
| { | |
| "epoch": 1.03, | |
| "eval_avg_sts": 0.7937197747425322, | |
| "eval_sickr_spearman": 0.7444404293257993, | |
| "eval_stsb_spearman": 0.8429991201592651, | |
| "step": 16125 | |
| }, | |
| { | |
| "epoch": 1.04, | |
| "eval_avg_sts": 0.7924446512199308, | |
| "eval_sickr_spearman": 0.7440353830473717, | |
| "eval_stsb_spearman": 0.8408539193924898, | |
| "step": 16250 | |
| }, | |
| { | |
| "epoch": 1.05, | |
| "eval_avg_sts": 0.7905555822474897, | |
| "eval_sickr_spearman": 0.7383070017654566, | |
| "eval_stsb_spearman": 0.8428041627295226, | |
| "step": 16375 | |
| }, | |
| { | |
| "epoch": 1.06, | |
| "learning_rate": 3.304236528862153e-06, | |
| "loss": 0.0001, | |
| "step": 16500 | |
| }, | |
| { | |
| "epoch": 1.06, | |
| "eval_avg_sts": 0.7899406430528368, | |
| "eval_sickr_spearman": 0.737816219970962, | |
| "eval_stsb_spearman": 0.8420650661347118, | |
| "step": 16500 | |
| }, | |
| { | |
| "epoch": 1.06, | |
| "eval_avg_sts": 0.7921524290697161, | |
| "eval_sickr_spearman": 0.7417105816755641, | |
| "eval_stsb_spearman": 0.842594276463868, | |
| "step": 16625 | |
| }, | |
| { | |
| "epoch": 1.07, | |
| "eval_avg_sts": 0.7909061020892134, | |
| "eval_sickr_spearman": 0.7410022670226564, | |
| "eval_stsb_spearman": 0.8408099371557706, | |
| "step": 16750 | |
| }, | |
| { | |
| "epoch": 1.08, | |
| "eval_avg_sts": 0.7911860344103485, | |
| "eval_sickr_spearman": 0.7404902554813262, | |
| "eval_stsb_spearman": 0.841881813339371, | |
| "step": 16875 | |
| }, | |
| { | |
| "epoch": 1.09, | |
| "learning_rate": 3.19224369640343e-06, | |
| "loss": 0.0002, | |
| "step": 17000 | |
| }, | |
| { | |
| "epoch": 1.09, | |
| "eval_avg_sts": 0.7912332320403954, | |
| "eval_sickr_spearman": 0.7405556258103834, | |
| "eval_stsb_spearman": 0.8419108382704075, | |
| "step": 17000 | |
| }, | |
| { | |
| "epoch": 1.1, | |
| "eval_avg_sts": 0.791745368257589, | |
| "eval_sickr_spearman": 0.7407413620796446, | |
| "eval_stsb_spearman": 0.8427493744355335, | |
| "step": 17125 | |
| }, | |
| { | |
| "epoch": 1.1, | |
| "eval_avg_sts": 0.7936116457907827, | |
| "eval_sickr_spearman": 0.7417212926111849, | |
| "eval_stsb_spearman": 0.8455019989703806, | |
| "step": 17250 | |
| }, | |
| { | |
| "epoch": 1.11, | |
| "eval_avg_sts": 0.7936037695250758, | |
| "eval_sickr_spearman": 0.7418167304097425, | |
| "eval_stsb_spearman": 0.8453908086404092, | |
| "step": 17375 | |
| }, | |
| { | |
| "epoch": 1.12, | |
| "learning_rate": 3.0802508639447074e-06, | |
| "loss": 0.0002, | |
| "step": 17500 | |
| }, | |
| { | |
| "epoch": 1.12, | |
| "eval_avg_sts": 0.792413452164604, | |
| "eval_sickr_spearman": 0.7425937295377067, | |
| "eval_stsb_spearman": 0.8422331747915013, | |
| "step": 17500 | |
| }, | |
| { | |
| "epoch": 1.13, | |
| "eval_avg_sts": 0.7927184217670188, | |
| "eval_sickr_spearman": 0.7428243748868126, | |
| "eval_stsb_spearman": 0.8426124686472249, | |
| "step": 17625 | |
| }, | |
| { | |
| "epoch": 1.14, | |
| "eval_avg_sts": 0.7926960182448954, | |
| "eval_sickr_spearman": 0.742725526880053, | |
| "eval_stsb_spearman": 0.842666509609738, | |
| "step": 17750 | |
| }, | |
| { | |
| "epoch": 1.14, | |
| "eval_avg_sts": 0.7927521207425385, | |
| "eval_sickr_spearman": 0.7428051144151359, | |
| "eval_stsb_spearman": 0.8426991270699412, | |
| "step": 17875 | |
| }, | |
| { | |
| "epoch": 1.15, | |
| "learning_rate": 2.9682580314859847e-06, | |
| "loss": 0.0, | |
| "step": 18000 | |
| }, | |
| { | |
| "epoch": 1.15, | |
| "eval_avg_sts": 0.7928433137943678, | |
| "eval_sickr_spearman": 0.7426588116801555, | |
| "eval_stsb_spearman": 0.8430278159085801, | |
| "step": 18000 | |
| }, | |
| { | |
| "epoch": 1.16, | |
| "eval_avg_sts": 0.792833492411573, | |
| "eval_sickr_spearman": 0.7426310977346257, | |
| "eval_stsb_spearman": 0.8430358870885203, | |
| "step": 18125 | |
| }, | |
| { | |
| "epoch": 1.17, | |
| "eval_avg_sts": 0.7928841848486375, | |
| "eval_sickr_spearman": 0.742908285221025, | |
| "eval_stsb_spearman": 0.84286008447625, | |
| "step": 18250 | |
| }, | |
| { | |
| "epoch": 1.18, | |
| "eval_avg_sts": 0.7925150543842555, | |
| "eval_sickr_spearman": 0.743895084200071, | |
| "eval_stsb_spearman": 0.84113502456844, | |
| "step": 18375 | |
| }, | |
| { | |
| "epoch": 1.18, | |
| "learning_rate": 2.8562651990272623e-06, | |
| "loss": 0.0001, | |
| "step": 18500 | |
| }, | |
| { | |
| "epoch": 1.18, | |
| "eval_avg_sts": 0.7919487675309846, | |
| "eval_sickr_spearman": 0.7431525714029392, | |
| "eval_stsb_spearman": 0.84074496365903, | |
| "step": 18500 | |
| }, | |
| { | |
| "epoch": 1.19, | |
| "eval_avg_sts": 0.7919787220051326, | |
| "eval_sickr_spearman": 0.7432353770218185, | |
| "eval_stsb_spearman": 0.8407220669884469, | |
| "step": 18625 | |
| }, | |
| { | |
| "epoch": 1.2, | |
| "eval_avg_sts": 0.7920516311468476, | |
| "eval_sickr_spearman": 0.7433836010008565, | |
| "eval_stsb_spearman": 0.8407196612928387, | |
| "step": 18750 | |
| }, | |
| { | |
| "epoch": 1.21, | |
| "eval_avg_sts": 0.79208040900112, | |
| "eval_sickr_spearman": 0.7434916709790923, | |
| "eval_stsb_spearman": 0.8406691470231478, | |
| "step": 18875 | |
| }, | |
| { | |
| "epoch": 1.22, | |
| "learning_rate": 2.7442723665685396e-06, | |
| "loss": 0.0001, | |
| "step": 19000 | |
| }, | |
| { | |
| "epoch": 1.22, | |
| "eval_avg_sts": 0.7915679899923007, | |
| "eval_sickr_spearman": 0.7422913257230525, | |
| "eval_stsb_spearman": 0.8408446542615489, | |
| "step": 19000 | |
| }, | |
| { | |
| "epoch": 1.22, | |
| "eval_avg_sts": 0.7924488788916606, | |
| "eval_sickr_spearman": 0.7431180370410052, | |
| "eval_stsb_spearman": 0.8417797207423161, | |
| "step": 19125 | |
| }, | |
| { | |
| "epoch": 1.23, | |
| "eval_avg_sts": 0.7925131080137356, | |
| "eval_sickr_spearman": 0.7439811559338482, | |
| "eval_stsb_spearman": 0.8410450600936231, | |
| "step": 19250 | |
| }, | |
| { | |
| "epoch": 1.24, | |
| "eval_avg_sts": 0.7923092664958495, | |
| "eval_sickr_spearman": 0.7438394641846057, | |
| "eval_stsb_spearman": 0.8407790688070933, | |
| "step": 19375 | |
| }, | |
| { | |
| "epoch": 1.25, | |
| "learning_rate": 2.632279534109817e-06, | |
| "loss": 0.0002, | |
| "step": 19500 | |
| }, | |
| { | |
| "epoch": 1.25, | |
| "eval_avg_sts": 0.7915084313605771, | |
| "eval_sickr_spearman": 0.7429506966835948, | |
| "eval_stsb_spearman": 0.8400661660375595, | |
| "step": 19500 | |
| }, | |
| { | |
| "epoch": 1.26, | |
| "eval_avg_sts": 0.7914848286255316, | |
| "eval_sickr_spearman": 0.7429546352339128, | |
| "eval_stsb_spearman": 0.8400150220171504, | |
| "step": 19625 | |
| }, | |
| { | |
| "epoch": 1.26, | |
| "eval_avg_sts": 0.7919444499131418, | |
| "eval_sickr_spearman": 0.7435056960607123, | |
| "eval_stsb_spearman": 0.8403832037655713, | |
| "step": 19750 | |
| }, | |
| { | |
| "epoch": 1.27, | |
| "eval_avg_sts": 0.7918604283998938, | |
| "eval_sickr_spearman": 0.7430511777478034, | |
| "eval_stsb_spearman": 0.8406696790519842, | |
| "step": 19875 | |
| }, | |
| { | |
| "epoch": 1.28, | |
| "learning_rate": 2.5202867016510945e-06, | |
| "loss": 0.0001, | |
| "step": 20000 | |
| }, | |
| { | |
| "epoch": 1.28, | |
| "eval_avg_sts": 0.7901084692338984, | |
| "eval_sickr_spearman": 0.7411617302794309, | |
| "eval_stsb_spearman": 0.839055208188366, | |
| "step": 20000 | |
| }, | |
| { | |
| "epoch": 1.29, | |
| "eval_avg_sts": 0.789757862825201, | |
| "eval_sickr_spearman": 0.7407969340640084, | |
| "eval_stsb_spearman": 0.8387187915863936, | |
| "step": 20125 | |
| }, | |
| { | |
| "epoch": 1.3, | |
| "eval_avg_sts": 0.7898529068915039, | |
| "eval_sickr_spearman": 0.7409771947877056, | |
| "eval_stsb_spearman": 0.8387286189953022, | |
| "step": 20250 | |
| }, | |
| { | |
| "epoch": 1.3, | |
| "eval_avg_sts": 0.789768082574833, | |
| "eval_sickr_spearman": 0.74083372588771, | |
| "eval_stsb_spearman": 0.838702439261956, | |
| "step": 20375 | |
| }, | |
| { | |
| "epoch": 1.31, | |
| "learning_rate": 2.4082938691923718e-06, | |
| "loss": 0.0, | |
| "step": 20500 | |
| }, | |
| { | |
| "epoch": 1.31, | |
| "eval_avg_sts": 0.7897954058339804, | |
| "eval_sickr_spearman": 0.7408093260881794, | |
| "eval_stsb_spearman": 0.8387814855797816, | |
| "step": 20500 | |
| }, | |
| { | |
| "epoch": 1.32, | |
| "eval_avg_sts": 0.7899947832336973, | |
| "eval_sickr_spearman": 0.7409338707342086, | |
| "eval_stsb_spearman": 0.8390556957331861, | |
| "step": 20625 | |
| }, | |
| { | |
| "epoch": 1.33, | |
| "eval_avg_sts": 0.790202509592782, | |
| "eval_sickr_spearman": 0.7411228731183674, | |
| "eval_stsb_spearman": 0.8392821460671965, | |
| "step": 20750 | |
| }, | |
| { | |
| "epoch": 1.34, | |
| "eval_avg_sts": 0.7901906011266497, | |
| "eval_sickr_spearman": 0.7410648995789316, | |
| "eval_stsb_spearman": 0.839316302674368, | |
| "step": 20875 | |
| }, | |
| { | |
| "epoch": 1.34, | |
| "learning_rate": 2.296301036733649e-06, | |
| "loss": 0.0, | |
| "step": 21000 | |
| }, | |
| { | |
| "epoch": 1.34, | |
| "eval_avg_sts": 0.7902077356957227, | |
| "eval_sickr_spearman": 0.7411439107407973, | |
| "eval_stsb_spearman": 0.839271560650648, | |
| "step": 21000 | |
| }, | |
| { | |
| "epoch": 1.35, | |
| "eval_avg_sts": 0.7901431265829444, | |
| "eval_sickr_spearman": 0.7410307494658092, | |
| "eval_stsb_spearman": 0.8392555037000796, | |
| "step": 21125 | |
| }, | |
| { | |
| "epoch": 1.36, | |
| "eval_avg_sts": 0.7921962350985728, | |
| "eval_sickr_spearman": 0.7434804797324572, | |
| "eval_stsb_spearman": 0.8409119904646885, | |
| "step": 21250 | |
| }, | |
| { | |
| "epoch": 1.37, | |
| "eval_avg_sts": 0.7922085580785473, | |
| "eval_sickr_spearman": 0.7434956095294102, | |
| "eval_stsb_spearman": 0.8409215066276844, | |
| "step": 21375 | |
| }, | |
| { | |
| "epoch": 1.38, | |
| "learning_rate": 2.1843082042749267e-06, | |
| "loss": 0.0001, | |
| "step": 21500 | |
| }, | |
| { | |
| "epoch": 1.38, | |
| "eval_avg_sts": 0.7922422656604595, | |
| "eval_sickr_spearman": 0.7434714018542854, | |
| "eval_stsb_spearman": 0.8410131294666336, | |
| "step": 21500 | |
| }, | |
| { | |
| "epoch": 1.38, | |
| "eval_avg_sts": 0.7922953172658802, | |
| "eval_sickr_spearman": 0.7435230833194328, | |
| "eval_stsb_spearman": 0.8410675512123275, | |
| "step": 21625 | |
| }, | |
| { | |
| "epoch": 1.39, | |
| "eval_avg_sts": 0.7920827130593174, | |
| "eval_sickr_spearman": 0.7432143393993886, | |
| "eval_stsb_spearman": 0.8409510867192462, | |
| "step": 21750 | |
| }, | |
| { | |
| "epoch": 1.4, | |
| "eval_avg_sts": 0.7893982619162593, | |
| "eval_sickr_spearman": 0.7409595673734778, | |
| "eval_stsb_spearman": 0.8378369564590408, | |
| "step": 21875 | |
| }, | |
| { | |
| "epoch": 1.41, | |
| "learning_rate": 2.072315371816204e-06, | |
| "loss": 0.0002, | |
| "step": 22000 | |
| }, | |
| { | |
| "epoch": 1.41, | |
| "eval_avg_sts": 0.7906089294600861, | |
| "eval_sickr_spearman": 0.7422200475685182, | |
| "eval_stsb_spearman": 0.838997811351654, | |
| "step": 22000 | |
| }, | |
| { | |
| "epoch": 1.42, | |
| "eval_avg_sts": 0.7914097742253603, | |
| "eval_sickr_spearman": 0.7423016043787602, | |
| "eval_stsb_spearman": 0.8405179440719603, | |
| "step": 22125 | |
| }, | |
| { | |
| "epoch": 1.42, | |
| "eval_avg_sts": 0.791727396078017, | |
| "eval_sickr_spearman": 0.7433686633283093, | |
| "eval_stsb_spearman": 0.8400861288277247, | |
| "step": 22250 | |
| }, | |
| { | |
| "epoch": 1.43, | |
| "eval_avg_sts": 0.7914842385018235, | |
| "eval_sickr_spearman": 0.7423251876495663, | |
| "eval_stsb_spearman": 0.8406432893540806, | |
| "step": 22375 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "learning_rate": 1.9603225393574807e-06, | |
| "loss": 0.0001, | |
| "step": 22500 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "eval_avg_sts": 0.7915202710875588, | |
| "eval_sickr_spearman": 0.7422767242682152, | |
| "eval_stsb_spearman": 0.8407638179069024, | |
| "step": 22500 | |
| }, | |
| { | |
| "epoch": 1.45, | |
| "eval_avg_sts": 0.7918702583757414, | |
| "eval_sickr_spearman": 0.7429271614438903, | |
| "eval_stsb_spearman": 0.8408133553075926, | |
| "step": 22625 | |
| }, | |
| { | |
| "epoch": 1.46, | |
| "eval_avg_sts": 0.7916045718347005, | |
| "eval_sickr_spearman": 0.7425266300889978, | |
| "eval_stsb_spearman": 0.840682513580403, | |
| "step": 22750 | |
| }, | |
| { | |
| "epoch": 1.46, | |
| "eval_avg_sts": 0.7915999641875153, | |
| "eval_sickr_spearman": 0.7422474733274393, | |
| "eval_stsb_spearman": 0.8409524550475914, | |
| "step": 22875 | |
| }, | |
| { | |
| "epoch": 1.47, | |
| "learning_rate": 1.8483297068987584e-06, | |
| "loss": 0.0002, | |
| "step": 23000 | |
| }, | |
| { | |
| "epoch": 1.47, | |
| "eval_avg_sts": 0.792815682844469, | |
| "eval_sickr_spearman": 0.7426967562502915, | |
| "eval_stsb_spearman": 0.8429346094386464, | |
| "step": 23000 | |
| }, | |
| { | |
| "epoch": 1.48, | |
| "eval_avg_sts": 0.7927916857497739, | |
| "eval_sickr_spearman": 0.7425698100491905, | |
| "eval_stsb_spearman": 0.8430135614503571, | |
| "step": 23125 | |
| }, | |
| { | |
| "epoch": 1.49, | |
| "eval_avg_sts": 0.7928345271530053, | |
| "eval_sickr_spearman": 0.7425940177243154, | |
| "eval_stsb_spearman": 0.8430750365816952, | |
| "step": 23250 | |
| }, | |
| { | |
| "epoch": 1.5, | |
| "eval_avg_sts": 0.7930442205998951, | |
| "eval_sickr_spearman": 0.7427970932211958, | |
| "eval_stsb_spearman": 0.8432913479785945, | |
| "step": 23375 | |
| }, | |
| { | |
| "epoch": 1.5, | |
| "learning_rate": 1.7363368744400357e-06, | |
| "loss": 0.0, | |
| "step": 23500 | |
| }, | |
| { | |
| "epoch": 1.5, | |
| "eval_avg_sts": 0.793033132084566, | |
| "eval_sickr_spearman": 0.7428263441619716, | |
| "eval_stsb_spearman": 0.8432399200071605, | |
| "step": 23500 | |
| }, | |
| { | |
| "epoch": 1.51, | |
| "eval_avg_sts": 0.7929242651260953, | |
| "eval_sickr_spearman": 0.7427599171486827, | |
| "eval_stsb_spearman": 0.8430886131035079, | |
| "step": 23625 | |
| }, | |
| { | |
| "epoch": 1.52, | |
| "eval_avg_sts": 0.7936208486615127, | |
| "eval_sickr_spearman": 0.7430878254782006, | |
| "eval_stsb_spearman": 0.8441538718448248, | |
| "step": 23750 | |
| }, | |
| { | |
| "epoch": 1.53, | |
| "eval_avg_sts": 0.7935886289185006, | |
| "eval_sickr_spearman": 0.7430728878056534, | |
| "eval_stsb_spearman": 0.8441043700313476, | |
| "step": 23875 | |
| }, | |
| { | |
| "epoch": 1.54, | |
| "learning_rate": 1.6243440419813131e-06, | |
| "loss": 0.0001, | |
| "step": 24000 | |
| }, | |
| { | |
| "epoch": 1.54, | |
| "eval_avg_sts": 0.7935571381985222, | |
| "eval_sickr_spearman": 0.7430181323500139, | |
| "eval_stsb_spearman": 0.8440961440470305, | |
| "step": 24000 | |
| }, | |
| { | |
| "epoch": 1.54, | |
| "eval_avg_sts": 0.7935492855380204, | |
| "eval_sickr_spearman": 0.7430870569805776, | |
| "eval_stsb_spearman": 0.8440115140954632, | |
| "step": 24125 | |
| }, | |
| { | |
| "epoch": 1.55, | |
| "eval_avg_sts": 0.7936128430055818, | |
| "eval_sickr_spearman": 0.7431491611947371, | |
| "eval_stsb_spearman": 0.8440765248164266, | |
| "step": 24250 | |
| }, | |
| { | |
| "epoch": 1.56, | |
| "eval_avg_sts": 0.7936605492215507, | |
| "eval_sickr_spearman": 0.7432605933500736, | |
| "eval_stsb_spearman": 0.844060505093028, | |
| "step": 24375 | |
| }, | |
| { | |
| "epoch": 1.57, | |
| "learning_rate": 1.5123512095225906e-06, | |
| "loss": 0.0, | |
| "step": 24500 | |
| }, | |
| { | |
| "epoch": 1.57, | |
| "eval_avg_sts": 0.793667841726459, | |
| "eval_sickr_spearman": 0.7432775483288812, | |
| "eval_stsb_spearman": 0.8440581351240368, | |
| "step": 24500 | |
| }, | |
| { | |
| "epoch": 1.58, | |
| "eval_avg_sts": 0.7948942597846932, | |
| "eval_sickr_spearman": 0.744056468700903, | |
| "eval_stsb_spearman": 0.8457320508684834, | |
| "step": 24625 | |
| }, | |
| { | |
| "epoch": 1.58, | |
| "eval_avg_sts": 0.7948721522573494, | |
| "eval_sickr_spearman": 0.7440626647129885, | |
| "eval_stsb_spearman": 0.8456816398017104, | |
| "step": 24750 | |
| }, | |
| { | |
| "epoch": 1.59, | |
| "eval_avg_sts": 0.7945095949089607, | |
| "eval_sickr_spearman": 0.7443504190417043, | |
| "eval_stsb_spearman": 0.8446687707762169, | |
| "step": 24875 | |
| }, | |
| { | |
| "epoch": 1.6, | |
| "learning_rate": 1.4003583770638678e-06, | |
| "loss": 0.0001, | |
| "step": 25000 | |
| }, | |
| { | |
| "epoch": 1.6, | |
| "eval_avg_sts": 0.7947724077574231, | |
| "eval_sickr_spearman": 0.7446924004839437, | |
| "eval_stsb_spearman": 0.8448524150309025, | |
| "step": 25000 | |
| }, | |
| { | |
| "epoch": 1.61, | |
| "eval_avg_sts": 0.7959915253602992, | |
| "eval_sickr_spearman": 0.7461332854959857, | |
| "eval_stsb_spearman": 0.8458497652246126, | |
| "step": 25125 | |
| }, | |
| { | |
| "epoch": 1.62, | |
| "eval_avg_sts": 0.7955281876289857, | |
| "eval_sickr_spearman": 0.7458754244134463, | |
| "eval_stsb_spearman": 0.845180950844525, | |
| "step": 25250 | |
| }, | |
| { | |
| "epoch": 1.62, | |
| "eval_avg_sts": 0.79543745522762, | |
| "eval_sickr_spearman": 0.7456630610129066, | |
| "eval_stsb_spearman": 0.8452118494423333, | |
| "step": 25375 | |
| }, | |
| { | |
| "epoch": 1.63, | |
| "learning_rate": 1.2883655446051453e-06, | |
| "loss": 0.0001, | |
| "step": 25500 | |
| }, | |
| { | |
| "epoch": 1.63, | |
| "eval_avg_sts": 0.795353488562289, | |
| "eval_sickr_spearman": 0.7455269408714309, | |
| "eval_stsb_spearman": 0.8451800362531473, | |
| "step": 25500 | |
| }, | |
| { | |
| "epoch": 1.64, | |
| "eval_avg_sts": 0.7953584932327289, | |
| "eval_sickr_spearman": 0.745271175256273, | |
| "eval_stsb_spearman": 0.8454458112091847, | |
| "step": 25625 | |
| }, | |
| { | |
| "epoch": 1.65, | |
| "eval_avg_sts": 0.7953254322370598, | |
| "eval_sickr_spearman": 0.7452719917849974, | |
| "eval_stsb_spearman": 0.8453788726891222, | |
| "step": 25750 | |
| }, | |
| { | |
| "epoch": 1.66, | |
| "eval_avg_sts": 0.7952872018869009, | |
| "eval_sickr_spearman": 0.7452931735007315, | |
| "eval_stsb_spearman": 0.8452812302730703, | |
| "step": 25875 | |
| }, | |
| { | |
| "epoch": 1.66, | |
| "learning_rate": 1.1763727121464225e-06, | |
| "loss": 0.0001, | |
| "step": 26000 | |
| }, | |
| { | |
| "epoch": 1.66, | |
| "eval_avg_sts": 0.7952607086010879, | |
| "eval_sickr_spearman": 0.7453110410704665, | |
| "eval_stsb_spearman": 0.8452103761317094, | |
| "step": 26000 | |
| }, | |
| { | |
| "epoch": 1.67, | |
| "eval_avg_sts": 0.7950903508557705, | |
| "eval_sickr_spearman": 0.7449656494200251, | |
| "eval_stsb_spearman": 0.8452150522915161, | |
| "step": 26125 | |
| }, | |
| { | |
| "epoch": 1.68, | |
| "eval_avg_sts": 0.7950105822340711, | |
| "eval_sickr_spearman": 0.7448497023411534, | |
| "eval_stsb_spearman": 0.8451714621269887, | |
| "step": 26250 | |
| }, | |
| { | |
| "epoch": 1.69, | |
| "eval_avg_sts": 0.7950131323560599, | |
| "eval_sickr_spearman": 0.744852055865124, | |
| "eval_stsb_spearman": 0.8451742088469958, | |
| "step": 26375 | |
| }, | |
| { | |
| "epoch": 1.7, | |
| "learning_rate": 1.0643798796877e-06, | |
| "loss": 0.0001, | |
| "step": 26500 | |
| }, | |
| { | |
| "epoch": 1.7, | |
| "eval_avg_sts": 0.7950484138603111, | |
| "eval_sickr_spearman": 0.7455690161162907, | |
| "eval_stsb_spearman": 0.8445278116043317, | |
| "step": 26500 | |
| }, | |
| { | |
| "epoch": 1.7, | |
| "eval_avg_sts": 0.7950041615346236, | |
| "eval_sickr_spearman": 0.7455438958502385, | |
| "eval_stsb_spearman": 0.8444644272190087, | |
| "step": 26625 | |
| }, | |
| { | |
| "epoch": 1.71, | |
| "eval_avg_sts": 0.7946972455858132, | |
| "eval_sickr_spearman": 0.745472569664603, | |
| "eval_stsb_spearman": 0.8439219215070236, | |
| "step": 26750 | |
| }, | |
| { | |
| "epoch": 1.72, | |
| "eval_avg_sts": 0.7944591743219949, | |
| "eval_sickr_spearman": 0.7454866427773243, | |
| "eval_stsb_spearman": 0.8434317058666653, | |
| "step": 26875 | |
| }, | |
| { | |
| "epoch": 1.73, | |
| "learning_rate": 9.523870472289774e-07, | |
| "loss": 0.0001, | |
| "step": 27000 | |
| }, | |
| { | |
| "epoch": 1.73, | |
| "eval_avg_sts": 0.7944066177099748, | |
| "eval_sickr_spearman": 0.7454395722979149, | |
| "eval_stsb_spearman": 0.8433736631220347, | |
| "step": 27000 | |
| }, | |
| { | |
| "epoch": 1.74, | |
| "eval_avg_sts": 0.7944436945207991, | |
| "eval_sickr_spearman": 0.7455328006658063, | |
| "eval_stsb_spearman": 0.8433545883757919, | |
| "step": 27125 | |
| }, | |
| { | |
| "epoch": 1.74, | |
| "eval_avg_sts": 0.7944797298738457, | |
| "eval_sickr_spearman": 0.7455790065853898, | |
| "eval_stsb_spearman": 0.8433804531623017, | |
| "step": 27250 | |
| }, | |
| { | |
| "epoch": 1.75, | |
| "eval_avg_sts": 0.7944698737687554, | |
| "eval_sickr_spearman": 0.7455735310398258, | |
| "eval_stsb_spearman": 0.8433662164976851, | |
| "step": 27375 | |
| }, | |
| { | |
| "epoch": 1.76, | |
| "learning_rate": 8.403942147702547e-07, | |
| "loss": 0.0001, | |
| "step": 27500 | |
| }, | |
| { | |
| "epoch": 1.76, | |
| "eval_avg_sts": 0.7942514496393891, | |
| "eval_sickr_spearman": 0.74535724699005, | |
| "eval_stsb_spearman": 0.8431456522887281, | |
| "step": 27500 | |
| }, | |
| { | |
| "epoch": 1.77, | |
| "eval_avg_sts": 0.7944530448391101, | |
| "eval_sickr_spearman": 0.7454611862935621, | |
| "eval_stsb_spearman": 0.8434449033846582, | |
| "step": 27625 | |
| }, | |
| { | |
| "epoch": 1.78, | |
| "eval_avg_sts": 0.7944670140899726, | |
| "eval_sickr_spearman": 0.7455168063090274, | |
| "eval_stsb_spearman": 0.8434172218709176, | |
| "step": 27750 | |
| }, | |
| { | |
| "epoch": 1.78, | |
| "eval_avg_sts": 0.7944968856863333, | |
| "eval_sickr_spearman": 0.7455487469914838, | |
| "eval_stsb_spearman": 0.8434450243811827, | |
| "step": 27875 | |
| }, | |
| { | |
| "epoch": 1.79, | |
| "learning_rate": 7.284013823115321e-07, | |
| "loss": 0.0001, | |
| "step": 28000 | |
| }, | |
| { | |
| "epoch": 1.79, | |
| "eval_avg_sts": 0.7944813522912897, | |
| "eval_sickr_spearman": 0.7459449555472468, | |
| "eval_stsb_spearman": 0.8430177490353326, | |
| "step": 28000 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "eval_avg_sts": 0.7944717848510598, | |
| "eval_sickr_spearman": 0.7458816025244499, | |
| "eval_stsb_spearman": 0.8430619671776697, | |
| "step": 28125 | |
| }, | |
| { | |
| "epoch": 1.81, | |
| "eval_avg_sts": 0.7943252967954475, | |
| "eval_sickr_spearman": 0.7455355384385883, | |
| "eval_stsb_spearman": 0.8431150551523066, | |
| "step": 28250 | |
| }, | |
| { | |
| "epoch": 1.82, | |
| "eval_avg_sts": 0.7945802673668048, | |
| "eval_sickr_spearman": 0.7459384233174512, | |
| "eval_stsb_spearman": 0.8432221114161584, | |
| "step": 28375 | |
| }, | |
| { | |
| "epoch": 1.82, | |
| "learning_rate": 6.164085498528094e-07, | |
| "loss": 0.0001, | |
| "step": 28500 | |
| }, | |
| { | |
| "epoch": 1.82, | |
| "eval_avg_sts": 0.7945695711998493, | |
| "eval_sickr_spearman": 0.7459346288604376, | |
| "eval_stsb_spearman": 0.843204513539261, | |
| "step": 28500 | |
| }, | |
| { | |
| "epoch": 1.83, | |
| "eval_avg_sts": 0.7945396361578374, | |
| "eval_sickr_spearman": 0.7462354956798459, | |
| "eval_stsb_spearman": 0.8428437766358288, | |
| "step": 28625 | |
| }, | |
| { | |
| "epoch": 1.84, | |
| "eval_avg_sts": 0.7944409539151067, | |
| "eval_sickr_spearman": 0.7461240814315593, | |
| "eval_stsb_spearman": 0.8427578263986542, | |
| "step": 28750 | |
| }, | |
| { | |
| "epoch": 1.85, | |
| "eval_avg_sts": 0.7940565976087757, | |
| "eval_sickr_spearman": 0.7457283833108623, | |
| "eval_stsb_spearman": 0.8423848119066891, | |
| "step": 28875 | |
| }, | |
| { | |
| "epoch": 1.86, | |
| "learning_rate": 5.044157173940868e-07, | |
| "loss": 0.0002, | |
| "step": 29000 | |
| }, | |
| { | |
| "epoch": 1.86, | |
| "eval_avg_sts": 0.7940545279108154, | |
| "eval_sickr_spearman": 0.7457486524356691, | |
| "eval_stsb_spearman": 0.8423604033859617, | |
| "step": 29000 | |
| }, | |
| { | |
| "epoch": 1.86, | |
| "eval_avg_sts": 0.7940541798236898, | |
| "eval_sickr_spearman": 0.7457327061099918, | |
| "eval_stsb_spearman": 0.8423756535373876, | |
| "step": 29125 | |
| }, | |
| { | |
| "epoch": 1.87, | |
| "eval_avg_sts": 0.794045870127827, | |
| "eval_sickr_spearman": 0.7457254534136746, | |
| "eval_stsb_spearman": 0.8423662868419793, | |
| "step": 29250 | |
| }, | |
| { | |
| "epoch": 1.88, | |
| "eval_avg_sts": 0.7939439159521589, | |
| "eval_sickr_spearman": 0.7456850112262637, | |
| "eval_stsb_spearman": 0.8422028206780539, | |
| "step": 29375 | |
| }, | |
| { | |
| "epoch": 1.89, | |
| "learning_rate": 3.9242288493536413e-07, | |
| "loss": 0.0001, | |
| "step": 29500 | |
| }, | |
| { | |
| "epoch": 1.89, | |
| "eval_avg_sts": 0.7938843170635432, | |
| "eval_sickr_spearman": 0.7456857797238867, | |
| "eval_stsb_spearman": 0.8420828544031996, | |
| "step": 29500 | |
| }, | |
| { | |
| "epoch": 1.9, | |
| "eval_avg_sts": 0.7938335370035037, | |
| "eval_sickr_spearman": 0.7456398619909119, | |
| "eval_stsb_spearman": 0.8420272120160953, | |
| "step": 29625 | |
| }, | |
| { | |
| "epoch": 1.9, | |
| "eval_avg_sts": 0.7937791099281831, | |
| "eval_sickr_spearman": 0.7455667765481975, | |
| "eval_stsb_spearman": 0.8419914433081688, | |
| "step": 29750 | |
| }, | |
| { | |
| "epoch": 1.91, | |
| "eval_avg_sts": 0.7937599626397398, | |
| "eval_sickr_spearman": 0.7455335691634293, | |
| "eval_stsb_spearman": 0.8419863561160503, | |
| "step": 29875 | |
| }, | |
| { | |
| "epoch": 1.92, | |
| "learning_rate": 2.804300524766415e-07, | |
| "loss": 0.0001, | |
| "step": 30000 | |
| }, | |
| { | |
| "epoch": 1.92, | |
| "eval_avg_sts": 0.7937406443684292, | |
| "eval_sickr_spearman": 0.7454874593060488, | |
| "eval_stsb_spearman": 0.8419938294308097, | |
| "step": 30000 | |
| }, | |
| { | |
| "epoch": 1.93, | |
| "eval_avg_sts": 0.7939020781683644, | |
| "eval_sickr_spearman": 0.7457190652771832, | |
| "eval_stsb_spearman": 0.8420850910595457, | |
| "step": 30125 | |
| }, | |
| { | |
| "epoch": 1.94, | |
| "eval_avg_sts": 0.7938812791358627, | |
| "eval_sickr_spearman": 0.7456977394681448, | |
| "eval_stsb_spearman": 0.8420648188035805, | |
| "step": 30250 | |
| }, | |
| { | |
| "epoch": 1.94, | |
| "eval_avg_sts": 0.7937378630658074, | |
| "eval_sickr_spearman": 0.7454741066598489, | |
| "eval_stsb_spearman": 0.842001619471766, | |
| "step": 30375 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "learning_rate": 1.6843722001791884e-07, | |
| "loss": 0.0002, | |
| "step": 30500 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "eval_avg_sts": 0.7937467005092009, | |
| "eval_sickr_spearman": 0.7454940875980473, | |
| "eval_stsb_spearman": 0.8419993134203545, | |
| "step": 30500 | |
| }, | |
| { | |
| "epoch": 1.96, | |
| "eval_avg_sts": 0.7937544654414969, | |
| "eval_sickr_spearman": 0.7454804467652388, | |
| "eval_stsb_spearman": 0.8420284841177549, | |
| "step": 30625 | |
| }, | |
| { | |
| "epoch": 1.97, | |
| "eval_avg_sts": 0.7937753802718709, | |
| "eval_sickr_spearman": 0.7455158937181001, | |
| "eval_stsb_spearman": 0.8420348668256417, | |
| "step": 30750 | |
| }, | |
| { | |
| "epoch": 1.98, | |
| "eval_avg_sts": 0.7937608907538469, | |
| "eval_sickr_spearman": 0.745488035679266, | |
| "eval_stsb_spearman": 0.8420337458284277, | |
| "step": 30875 | |
| }, | |
| { | |
| "epoch": 1.98, | |
| "learning_rate": 5.64443875591962e-08, | |
| "loss": 0.0001, | |
| "step": 31000 | |
| }, | |
| { | |
| "epoch": 1.98, | |
| "eval_avg_sts": 0.7937471629995045, | |
| "eval_sickr_spearman": 0.7454658933415031, | |
| "eval_stsb_spearman": 0.8420284326575058, | |
| "step": 31000 | |
| }, | |
| { | |
| "epoch": 1.99, | |
| "eval_avg_sts": 0.7937690011247767, | |
| "eval_sickr_spearman": 0.7455096977060146, | |
| "eval_stsb_spearman": 0.8420283045435387, | |
| "step": 31125 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_avg_sts": 0.7937804647459197, | |
| "eval_sickr_spearman": 0.7455530217595118, | |
| "eval_stsb_spearman": 0.8420079077323277, | |
| "step": 31250 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "step": 31252, | |
| "train_runtime": 9641.8618, | |
| "train_samples_per_second": 3.241 | |
| } | |
| ], | |
| "max_steps": 31252, | |
| "num_train_epochs": 2, | |
| "total_flos": 333421219511531712, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |