| { | |
| "best_metric": 0.8631831216150027, | |
| "best_model_checkpoint": "result/InfoCSE-bert-large", | |
| "epoch": 2.0, | |
| "global_step": 31252, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.01, | |
| "eval_avg_sts": 0.6667446229182062, | |
| "eval_sickr_spearman": 0.6627723790529534, | |
| "eval_stsb_spearman": 0.6707168667834591, | |
| "step": 125 | |
| }, | |
| { | |
| "epoch": 0.02, | |
| "eval_avg_sts": 0.7051305088963267, | |
| "eval_sickr_spearman": 0.6969365172570714, | |
| "eval_stsb_spearman": 0.713324500535582, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 0.02, | |
| "eval_avg_sts": 0.725875395370044, | |
| "eval_sickr_spearman": 0.716654533206054, | |
| "eval_stsb_spearman": 0.735096257534034, | |
| "step": 375 | |
| }, | |
| { | |
| "epoch": 0.03, | |
| "learning_rate": 6.888007167541277e-06, | |
| "loss": 0.001, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.03, | |
| "eval_avg_sts": 0.7357340574594278, | |
| "eval_sickr_spearman": 0.7235103965631273, | |
| "eval_stsb_spearman": 0.7479577183557282, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.04, | |
| "eval_avg_sts": 0.7464037729944727, | |
| "eval_sickr_spearman": 0.7301059313504061, | |
| "eval_stsb_spearman": 0.7627016146385392, | |
| "step": 625 | |
| }, | |
| { | |
| "epoch": 0.05, | |
| "eval_avg_sts": 0.7591284137806686, | |
| "eval_sickr_spearman": 0.7344878567657066, | |
| "eval_stsb_spearman": 0.7837689707956308, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 0.06, | |
| "eval_avg_sts": 0.7608889169495914, | |
| "eval_sickr_spearman": 0.7373875423906269, | |
| "eval_stsb_spearman": 0.7843902915085559, | |
| "step": 875 | |
| }, | |
| { | |
| "epoch": 0.06, | |
| "learning_rate": 6.776014335082554e-06, | |
| "loss": 0.0002, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.06, | |
| "eval_avg_sts": 0.7633437897321462, | |
| "eval_sickr_spearman": 0.7394359247736582, | |
| "eval_stsb_spearman": 0.7872516546906342, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.07, | |
| "eval_avg_sts": 0.7689886003242912, | |
| "eval_sickr_spearman": 0.7459672900094155, | |
| "eval_stsb_spearman": 0.7920099106391669, | |
| "step": 1125 | |
| }, | |
| { | |
| "epoch": 0.08, | |
| "eval_avg_sts": 0.7695141299706598, | |
| "eval_sickr_spearman": 0.749662274611948, | |
| "eval_stsb_spearman": 0.7893659853293715, | |
| "step": 1250 | |
| }, | |
| { | |
| "epoch": 0.09, | |
| "eval_avg_sts": 0.771575990947651, | |
| "eval_sickr_spearman": 0.7507335602984238, | |
| "eval_stsb_spearman": 0.7924184215968783, | |
| "step": 1375 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "learning_rate": 6.6640215026238325e-06, | |
| "loss": 0.0003, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "eval_avg_sts": 0.7721249223821594, | |
| "eval_sickr_spearman": 0.7508546947362507, | |
| "eval_stsb_spearman": 0.7933951500280679, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "eval_avg_sts": 0.7736414601237904, | |
| "eval_sickr_spearman": 0.7518223773369244, | |
| "eval_stsb_spearman": 0.7954605429106565, | |
| "step": 1625 | |
| }, | |
| { | |
| "epoch": 0.11, | |
| "eval_avg_sts": 0.7750895970401648, | |
| "eval_sickr_spearman": 0.7527568224154028, | |
| "eval_stsb_spearman": 0.7974223716649267, | |
| "step": 1750 | |
| }, | |
| { | |
| "epoch": 0.12, | |
| "eval_avg_sts": 0.7776564224610277, | |
| "eval_sickr_spearman": 0.7542352378193863, | |
| "eval_stsb_spearman": 0.8010776071026692, | |
| "step": 1875 | |
| }, | |
| { | |
| "epoch": 0.13, | |
| "learning_rate": 6.55202867016511e-06, | |
| "loss": 0.0001, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 0.13, | |
| "eval_avg_sts": 0.7785919822208553, | |
| "eval_sickr_spearman": 0.7546353668237488, | |
| "eval_stsb_spearman": 0.802548597617962, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 0.14, | |
| "eval_avg_sts": 0.7804785012417673, | |
| "eval_sickr_spearman": 0.7560601133857076, | |
| "eval_stsb_spearman": 0.8048968890978271, | |
| "step": 2125 | |
| }, | |
| { | |
| "epoch": 0.14, | |
| "eval_avg_sts": 0.7791958793390172, | |
| "eval_sickr_spearman": 0.7571627153503209, | |
| "eval_stsb_spearman": 0.8012290433277136, | |
| "step": 2250 | |
| }, | |
| { | |
| "epoch": 0.15, | |
| "eval_avg_sts": 0.7808643358009081, | |
| "eval_sickr_spearman": 0.757428807652288, | |
| "eval_stsb_spearman": 0.8042998639495281, | |
| "step": 2375 | |
| }, | |
| { | |
| "epoch": 0.16, | |
| "learning_rate": 6.440035837706387e-06, | |
| "loss": 0.0005, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 0.16, | |
| "eval_avg_sts": 0.7997499220712412, | |
| "eval_sickr_spearman": 0.7682156324132593, | |
| "eval_stsb_spearman": 0.8312842117292232, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 0.17, | |
| "eval_avg_sts": 0.8000945443564438, | |
| "eval_sickr_spearman": 0.769006603032424, | |
| "eval_stsb_spearman": 0.8311824856804637, | |
| "step": 2625 | |
| }, | |
| { | |
| "epoch": 0.18, | |
| "eval_avg_sts": 0.8015655863550484, | |
| "eval_sickr_spearman": 0.7697635307193054, | |
| "eval_stsb_spearman": 0.8333676419907914, | |
| "step": 2750 | |
| }, | |
| { | |
| "epoch": 0.18, | |
| "eval_avg_sts": 0.8020135971999303, | |
| "eval_sickr_spearman": 0.7738109675441908, | |
| "eval_stsb_spearman": 0.8302162268556699, | |
| "step": 2875 | |
| }, | |
| { | |
| "epoch": 0.19, | |
| "learning_rate": 6.328043005247664e-06, | |
| "loss": 0.0001, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 0.19, | |
| "eval_avg_sts": 0.8021055052889553, | |
| "eval_sickr_spearman": 0.7723527913356312, | |
| "eval_stsb_spearman": 0.8318582192422794, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 0.2, | |
| "eval_avg_sts": 0.8034828561746414, | |
| "eval_sickr_spearman": 0.7730187425570707, | |
| "eval_stsb_spearman": 0.8339469697922121, | |
| "step": 3125 | |
| }, | |
| { | |
| "epoch": 0.21, | |
| "eval_avg_sts": 0.809294388946485, | |
| "eval_sickr_spearman": 0.7739637544778655, | |
| "eval_stsb_spearman": 0.8446250234151045, | |
| "step": 3250 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "eval_avg_sts": 0.8095468267478854, | |
| "eval_sickr_spearman": 0.7742509804644655, | |
| "eval_stsb_spearman": 0.8448426730313053, | |
| "step": 3375 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "learning_rate": 6.2160501727889415e-06, | |
| "loss": 0.0001, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "eval_avg_sts": 0.8075109934505635, | |
| "eval_sickr_spearman": 0.7709388998025974, | |
| "eval_stsb_spearman": 0.8440830870985296, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 0.23, | |
| "eval_avg_sts": 0.8072613664062491, | |
| "eval_sickr_spearman": 0.7727868483993274, | |
| "eval_stsb_spearman": 0.8417358844131708, | |
| "step": 3625 | |
| }, | |
| { | |
| "epoch": 0.24, | |
| "eval_avg_sts": 0.8035650181540979, | |
| "eval_sickr_spearman": 0.7687000741023642, | |
| "eval_stsb_spearman": 0.8384299622058315, | |
| "step": 3750 | |
| }, | |
| { | |
| "epoch": 0.25, | |
| "eval_avg_sts": 0.8060855472554131, | |
| "eval_sickr_spearman": 0.7709744428176617, | |
| "eval_stsb_spearman": 0.8411966516931645, | |
| "step": 3875 | |
| }, | |
| { | |
| "epoch": 0.26, | |
| "learning_rate": 6.104057340330219e-06, | |
| "loss": 0.0004, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 0.26, | |
| "eval_avg_sts": 0.803351813599069, | |
| "eval_sickr_spearman": 0.7677387500328843, | |
| "eval_stsb_spearman": 0.8389648771652538, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 0.26, | |
| "eval_avg_sts": 0.802660483963512, | |
| "eval_sickr_spearman": 0.7673760487601211, | |
| "eval_stsb_spearman": 0.8379449191669028, | |
| "step": 4125 | |
| }, | |
| { | |
| "epoch": 0.27, | |
| "eval_avg_sts": 0.8047314511229144, | |
| "eval_sickr_spearman": 0.7691939779184522, | |
| "eval_stsb_spearman": 0.8402689243273768, | |
| "step": 4250 | |
| }, | |
| { | |
| "epoch": 0.28, | |
| "eval_avg_sts": 0.8040567267552472, | |
| "eval_sickr_spearman": 0.7695367278583146, | |
| "eval_stsb_spearman": 0.8385767256521798, | |
| "step": 4375 | |
| }, | |
| { | |
| "epoch": 0.29, | |
| "learning_rate": 5.992064507871497e-06, | |
| "loss": 0.0003, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 0.29, | |
| "eval_avg_sts": 0.8031439674900422, | |
| "eval_sickr_spearman": 0.7708419250087939, | |
| "eval_stsb_spearman": 0.8354460099712906, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 0.3, | |
| "eval_avg_sts": 0.8016452961027151, | |
| "eval_sickr_spearman": 0.76836294380137, | |
| "eval_stsb_spearman": 0.8349276484040601, | |
| "step": 4625 | |
| }, | |
| { | |
| "epoch": 0.3, | |
| "eval_avg_sts": 0.8036856358976682, | |
| "eval_sickr_spearman": 0.7702216513648221, | |
| "eval_stsb_spearman": 0.8371496204305142, | |
| "step": 4750 | |
| }, | |
| { | |
| "epoch": 0.31, | |
| "eval_avg_sts": 0.8061976413597232, | |
| "eval_sickr_spearman": 0.7719798778640656, | |
| "eval_stsb_spearman": 0.8404154048553806, | |
| "step": 4875 | |
| }, | |
| { | |
| "epoch": 0.32, | |
| "learning_rate": 5.880071675412773e-06, | |
| "loss": 0.0001, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 0.32, | |
| "eval_avg_sts": 0.8067273899585344, | |
| "eval_sickr_spearman": 0.7723029350523384, | |
| "eval_stsb_spearman": 0.8411518448647305, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 0.33, | |
| "eval_avg_sts": 0.8078358230567408, | |
| "eval_sickr_spearman": 0.7726999601368258, | |
| "eval_stsb_spearman": 0.8429716859766557, | |
| "step": 5125 | |
| }, | |
| { | |
| "epoch": 0.34, | |
| "eval_avg_sts": 0.802548441043093, | |
| "eval_sickr_spearman": 0.7676195664444124, | |
| "eval_stsb_spearman": 0.8374773156417734, | |
| "step": 5250 | |
| }, | |
| { | |
| "epoch": 0.34, | |
| "eval_avg_sts": 0.800628830120568, | |
| "eval_sickr_spearman": 0.7634932625509655, | |
| "eval_stsb_spearman": 0.8377643976901704, | |
| "step": 5375 | |
| }, | |
| { | |
| "epoch": 0.35, | |
| "learning_rate": 5.7680788429540505e-06, | |
| "loss": 0.0002, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 0.35, | |
| "eval_avg_sts": 0.8020238168463023, | |
| "eval_sickr_spearman": 0.7652266089396642, | |
| "eval_stsb_spearman": 0.8388210247529404, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 0.36, | |
| "eval_avg_sts": 0.8040364434874829, | |
| "eval_sickr_spearman": 0.7675117846527851, | |
| "eval_stsb_spearman": 0.8405611023221807, | |
| "step": 5625 | |
| }, | |
| { | |
| "epoch": 0.37, | |
| "eval_avg_sts": 0.8016723711497669, | |
| "eval_sickr_spearman": 0.7650260310600586, | |
| "eval_stsb_spearman": 0.8383187112394752, | |
| "step": 5750 | |
| }, | |
| { | |
| "epoch": 0.38, | |
| "eval_avg_sts": 0.8020864629480828, | |
| "eval_sickr_spearman": 0.7653134972021658, | |
| "eval_stsb_spearman": 0.8388594286939999, | |
| "step": 5875 | |
| }, | |
| { | |
| "epoch": 0.38, | |
| "learning_rate": 5.656086010495328e-06, | |
| "loss": 0.0001, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 0.38, | |
| "eval_avg_sts": 0.8028151558848002, | |
| "eval_sickr_spearman": 0.7671768637824573, | |
| "eval_stsb_spearman": 0.838453447987143, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 0.39, | |
| "eval_avg_sts": 0.8049514040827435, | |
| "eval_sickr_spearman": 0.7685626571211498, | |
| "eval_stsb_spearman": 0.8413401510443372, | |
| "step": 6125 | |
| }, | |
| { | |
| "epoch": 0.4, | |
| "eval_avg_sts": 0.8059812583547672, | |
| "eval_sickr_spearman": 0.7690958503782142, | |
| "eval_stsb_spearman": 0.8428666663313202, | |
| "step": 6250 | |
| }, | |
| { | |
| "epoch": 0.41, | |
| "eval_avg_sts": 0.8063265220940947, | |
| "eval_sickr_spearman": 0.7693663135104123, | |
| "eval_stsb_spearman": 0.8432867306777773, | |
| "step": 6375 | |
| }, | |
| { | |
| "epoch": 0.42, | |
| "learning_rate": 5.544093178036605e-06, | |
| "loss": 0.0001, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 0.42, | |
| "eval_avg_sts": 0.8061105071256144, | |
| "eval_sickr_spearman": 0.769672271626573, | |
| "eval_stsb_spearman": 0.8425487426246557, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 0.42, | |
| "eval_avg_sts": 0.8069978292318387, | |
| "eval_sickr_spearman": 0.770697879735581, | |
| "eval_stsb_spearman": 0.8432977787280964, | |
| "step": 6625 | |
| }, | |
| { | |
| "epoch": 0.43, | |
| "eval_avg_sts": 0.8080712074218199, | |
| "eval_sickr_spearman": 0.7709677664945618, | |
| "eval_stsb_spearman": 0.8451746483490781, | |
| "step": 6750 | |
| }, | |
| { | |
| "epoch": 0.44, | |
| "eval_avg_sts": 0.808918715708319, | |
| "eval_sickr_spearman": 0.7720352577240238, | |
| "eval_stsb_spearman": 0.8458021736926141, | |
| "step": 6875 | |
| }, | |
| { | |
| "epoch": 0.45, | |
| "learning_rate": 5.432100345577883e-06, | |
| "loss": 0.0001, | |
| "step": 7000 | |
| }, | |
| { | |
| "epoch": 0.45, | |
| "eval_avg_sts": 0.8006026057334057, | |
| "eval_sickr_spearman": 0.7608432425913206, | |
| "eval_stsb_spearman": 0.8403619688754909, | |
| "step": 7000 | |
| }, | |
| { | |
| "epoch": 0.46, | |
| "eval_avg_sts": 0.8020612965823335, | |
| "eval_sickr_spearman": 0.7626692409746934, | |
| "eval_stsb_spearman": 0.8414533521899736, | |
| "step": 7125 | |
| }, | |
| { | |
| "epoch": 0.46, | |
| "eval_avg_sts": 0.810499992265102, | |
| "eval_sickr_spearman": 0.7673374317545649, | |
| "eval_stsb_spearman": 0.8536625527756392, | |
| "step": 7250 | |
| }, | |
| { | |
| "epoch": 0.47, | |
| "eval_avg_sts": 0.8112538171528675, | |
| "eval_sickr_spearman": 0.7687574232374812, | |
| "eval_stsb_spearman": 0.8537502110682538, | |
| "step": 7375 | |
| }, | |
| { | |
| "epoch": 0.48, | |
| "learning_rate": 5.32010751311916e-06, | |
| "loss": 0.0002, | |
| "step": 7500 | |
| }, | |
| { | |
| "epoch": 0.48, | |
| "eval_avg_sts": 0.8149817134253148, | |
| "eval_sickr_spearman": 0.7774900538521474, | |
| "eval_stsb_spearman": 0.852473372998482, | |
| "step": 7500 | |
| }, | |
| { | |
| "epoch": 0.49, | |
| "eval_avg_sts": 0.8174625453813287, | |
| "eval_sickr_spearman": 0.7815984901758593, | |
| "eval_stsb_spearman": 0.8533266005867981, | |
| "step": 7625 | |
| }, | |
| { | |
| "epoch": 0.5, | |
| "eval_avg_sts": 0.8176977199916579, | |
| "eval_sickr_spearman": 0.782115160734029, | |
| "eval_stsb_spearman": 0.8532802792492867, | |
| "step": 7750 | |
| }, | |
| { | |
| "epoch": 0.5, | |
| "eval_avg_sts": 0.8178800789250669, | |
| "eval_sickr_spearman": 0.782127648820403, | |
| "eval_stsb_spearman": 0.8536325090297309, | |
| "step": 7875 | |
| }, | |
| { | |
| "epoch": 0.51, | |
| "learning_rate": 5.2081146806604376e-06, | |
| "loss": 0.0001, | |
| "step": 8000 | |
| }, | |
| { | |
| "epoch": 0.51, | |
| "eval_avg_sts": 0.8181362028628546, | |
| "eval_sickr_spearman": 0.7824101677590619, | |
| "eval_stsb_spearman": 0.8538622379666473, | |
| "step": 8000 | |
| }, | |
| { | |
| "epoch": 0.52, | |
| "eval_avg_sts": 0.8182071435777255, | |
| "eval_sickr_spearman": 0.7826502752351511, | |
| "eval_stsb_spearman": 0.8537640119202999, | |
| "step": 8125 | |
| }, | |
| { | |
| "epoch": 0.53, | |
| "eval_avg_sts": 0.8175148093264073, | |
| "eval_sickr_spearman": 0.7809989179366073, | |
| "eval_stsb_spearman": 0.8540307007162073, | |
| "step": 8250 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "eval_avg_sts": 0.817271425771201, | |
| "eval_sickr_spearman": 0.7809910408359715, | |
| "eval_stsb_spearman": 0.8535518107064306, | |
| "step": 8375 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "learning_rate": 5.096121848201715e-06, | |
| "loss": 0.0, | |
| "step": 8500 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "eval_avg_sts": 0.8169878861543607, | |
| "eval_sickr_spearman": 0.7807656308769224, | |
| "eval_stsb_spearman": 0.8532101414317989, | |
| "step": 8500 | |
| }, | |
| { | |
| "epoch": 0.55, | |
| "eval_avg_sts": 0.8163714998445242, | |
| "eval_sickr_spearman": 0.7799410809585343, | |
| "eval_stsb_spearman": 0.852801918730514, | |
| "step": 8625 | |
| }, | |
| { | |
| "epoch": 0.56, | |
| "eval_avg_sts": 0.814914066335918, | |
| "eval_sickr_spearman": 0.7796482833641676, | |
| "eval_stsb_spearman": 0.8501798493076684, | |
| "step": 8750 | |
| }, | |
| { | |
| "epoch": 0.57, | |
| "eval_avg_sts": 0.8150768291940962, | |
| "eval_sickr_spearman": 0.7799102930225125, | |
| "eval_stsb_spearman": 0.8502433653656799, | |
| "step": 8875 | |
| }, | |
| { | |
| "epoch": 0.58, | |
| "learning_rate": 4.984129015742992e-06, | |
| "loss": 0.0001, | |
| "step": 9000 | |
| }, | |
| { | |
| "epoch": 0.58, | |
| "eval_avg_sts": 0.8157444131185677, | |
| "eval_sickr_spearman": 0.7805133715321694, | |
| "eval_stsb_spearman": 0.850975454704966, | |
| "step": 9000 | |
| }, | |
| { | |
| "epoch": 0.58, | |
| "eval_avg_sts": 0.8194025294491036, | |
| "eval_sickr_spearman": 0.7869190393754633, | |
| "eval_stsb_spearman": 0.851886019522744, | |
| "step": 9125 | |
| }, | |
| { | |
| "epoch": 0.59, | |
| "eval_avg_sts": 0.6858142517829269, | |
| "eval_sickr_spearman": 0.6164898018315937, | |
| "eval_stsb_spearman": 0.7551387017342599, | |
| "step": 9250 | |
| }, | |
| { | |
| "epoch": 0.6, | |
| "eval_avg_sts": 0.8177747035338222, | |
| "eval_sickr_spearman": 0.783078280380066, | |
| "eval_stsb_spearman": 0.8524711266875784, | |
| "step": 9375 | |
| }, | |
| { | |
| "epoch": 0.61, | |
| "learning_rate": 4.872136183284269e-06, | |
| "loss": 0.0015, | |
| "step": 9500 | |
| }, | |
| { | |
| "epoch": 0.61, | |
| "eval_avg_sts": 0.819985242900733, | |
| "eval_sickr_spearman": 0.7850574019148235, | |
| "eval_stsb_spearman": 0.8549130838866427, | |
| "step": 9500 | |
| }, | |
| { | |
| "epoch": 0.62, | |
| "eval_avg_sts": 0.820612467391125, | |
| "eval_sickr_spearman": 0.7860280624437863, | |
| "eval_stsb_spearman": 0.8551968723384636, | |
| "step": 9625 | |
| }, | |
| { | |
| "epoch": 0.62, | |
| "eval_avg_sts": 0.8210179120381628, | |
| "eval_sickr_spearman": 0.7866489124609753, | |
| "eval_stsb_spearman": 0.8553869116153502, | |
| "step": 9750 | |
| }, | |
| { | |
| "epoch": 0.63, | |
| "eval_avg_sts": 0.821463549997331, | |
| "eval_sickr_spearman": 0.787914243797261, | |
| "eval_stsb_spearman": 0.8550128561974009, | |
| "step": 9875 | |
| }, | |
| { | |
| "epoch": 0.64, | |
| "learning_rate": 4.760143350825547e-06, | |
| "loss": 0.0002, | |
| "step": 10000 | |
| }, | |
| { | |
| "epoch": 0.64, | |
| "eval_avg_sts": 0.8220538798411258, | |
| "eval_sickr_spearman": 0.7882646787133534, | |
| "eval_stsb_spearman": 0.8558430809688982, | |
| "step": 10000 | |
| }, | |
| { | |
| "epoch": 0.65, | |
| "eval_avg_sts": 0.8227053843456922, | |
| "eval_sickr_spearman": 0.7892594508552383, | |
| "eval_stsb_spearman": 0.856151317836146, | |
| "step": 10125 | |
| }, | |
| { | |
| "epoch": 0.66, | |
| "eval_avg_sts": 0.8211210354889169, | |
| "eval_sickr_spearman": 0.7858874273787755, | |
| "eval_stsb_spearman": 0.8563546435990582, | |
| "step": 10250 | |
| }, | |
| { | |
| "epoch": 0.66, | |
| "eval_avg_sts": 0.8217109523377687, | |
| "eval_sickr_spearman": 0.7865405062650296, | |
| "eval_stsb_spearman": 0.8568813984105078, | |
| "step": 10375 | |
| }, | |
| { | |
| "epoch": 0.67, | |
| "learning_rate": 4.648150518366825e-06, | |
| "loss": 0.0002, | |
| "step": 10500 | |
| }, | |
| { | |
| "epoch": 0.67, | |
| "eval_avg_sts": 0.8231847712907092, | |
| "eval_sickr_spearman": 0.7883226042216879, | |
| "eval_stsb_spearman": 0.8580469383597307, | |
| "step": 10500 | |
| }, | |
| { | |
| "epoch": 0.68, | |
| "eval_avg_sts": 0.8231833094531285, | |
| "eval_sickr_spearman": 0.7886680439032306, | |
| "eval_stsb_spearman": 0.8576985750030263, | |
| "step": 10625 | |
| }, | |
| { | |
| "epoch": 0.69, | |
| "eval_avg_sts": 0.8235797750151058, | |
| "eval_sickr_spearman": 0.7894692507063199, | |
| "eval_stsb_spearman": 0.8576902993238917, | |
| "step": 10750 | |
| }, | |
| { | |
| "epoch": 0.7, | |
| "eval_avg_sts": 0.8239802387430818, | |
| "eval_sickr_spearman": 0.7900059982648908, | |
| "eval_stsb_spearman": 0.8579544792212728, | |
| "step": 10875 | |
| }, | |
| { | |
| "epoch": 0.7, | |
| "learning_rate": 4.536157685908102e-06, | |
| "loss": 0.0001, | |
| "step": 11000 | |
| }, | |
| { | |
| "epoch": 0.7, | |
| "eval_avg_sts": 0.8228846723006884, | |
| "eval_sickr_spearman": 0.7878013707088813, | |
| "eval_stsb_spearman": 0.8579679738924955, | |
| "step": 11000 | |
| }, | |
| { | |
| "epoch": 0.71, | |
| "eval_avg_sts": 0.8233402178257747, | |
| "eval_sickr_spearman": 0.788485765873273, | |
| "eval_stsb_spearman": 0.8581946697782764, | |
| "step": 11125 | |
| }, | |
| { | |
| "epoch": 0.72, | |
| "eval_avg_sts": 0.8233165033728497, | |
| "eval_sickr_spearman": 0.788493306756199, | |
| "eval_stsb_spearman": 0.8581396999895003, | |
| "step": 11250 | |
| }, | |
| { | |
| "epoch": 0.73, | |
| "eval_avg_sts": 0.8211286933035429, | |
| "eval_sickr_spearman": 0.787368274267214, | |
| "eval_stsb_spearman": 0.8548891123398719, | |
| "step": 11375 | |
| }, | |
| { | |
| "epoch": 0.74, | |
| "learning_rate": 4.424164853449379e-06, | |
| "loss": 0.0002, | |
| "step": 11500 | |
| }, | |
| { | |
| "epoch": 0.74, | |
| "eval_avg_sts": 0.8222354006770852, | |
| "eval_sickr_spearman": 0.7882437371531265, | |
| "eval_stsb_spearman": 0.856227064201044, | |
| "step": 11500 | |
| }, | |
| { | |
| "epoch": 0.74, | |
| "eval_avg_sts": 0.823058736106017, | |
| "eval_sickr_spearman": 0.7882230837795081, | |
| "eval_stsb_spearman": 0.8578943884325259, | |
| "step": 11625 | |
| }, | |
| { | |
| "epoch": 0.75, | |
| "eval_avg_sts": 0.8240623262398707, | |
| "eval_sickr_spearman": 0.7903270861780045, | |
| "eval_stsb_spearman": 0.8577975663017371, | |
| "step": 11750 | |
| }, | |
| { | |
| "epoch": 0.76, | |
| "eval_avg_sts": 0.8193741224170432, | |
| "eval_sickr_spearman": 0.7834559008995725, | |
| "eval_stsb_spearman": 0.8552923439345139, | |
| "step": 11875 | |
| }, | |
| { | |
| "epoch": 0.77, | |
| "learning_rate": 4.312172020990656e-06, | |
| "loss": 0.0004, | |
| "step": 12000 | |
| }, | |
| { | |
| "epoch": 0.77, | |
| "eval_avg_sts": 0.8219118427006455, | |
| "eval_sickr_spearman": 0.785794199010884, | |
| "eval_stsb_spearman": 0.8580294863904071, | |
| "step": 12000 | |
| }, | |
| { | |
| "epoch": 0.78, | |
| "eval_avg_sts": 0.823098023008008, | |
| "eval_sickr_spearman": 0.7879260114171134, | |
| "eval_stsb_spearman": 0.8582700345989028, | |
| "step": 12125 | |
| }, | |
| { | |
| "epoch": 0.78, | |
| "eval_avg_sts": 0.8227772117211238, | |
| "eval_sickr_spearman": 0.7878058376013152, | |
| "eval_stsb_spearman": 0.8577485858409325, | |
| "step": 12250 | |
| }, | |
| { | |
| "epoch": 0.79, | |
| "eval_avg_sts": 0.8244800942376741, | |
| "eval_sickr_spearman": 0.7899311658088503, | |
| "eval_stsb_spearman": 0.8590290226664979, | |
| "step": 12375 | |
| }, | |
| { | |
| "epoch": 0.8, | |
| "learning_rate": 4.2001791885319345e-06, | |
| "loss": 0.0003, | |
| "step": 12500 | |
| }, | |
| { | |
| "epoch": 0.8, | |
| "eval_avg_sts": 0.8252546537289246, | |
| "eval_sickr_spearman": 0.7905314585146238, | |
| "eval_stsb_spearman": 0.8599778489432254, | |
| "step": 12500 | |
| }, | |
| { | |
| "epoch": 0.81, | |
| "eval_avg_sts": 0.8242515246774704, | |
| "eval_sickr_spearman": 0.7934860436884877, | |
| "eval_stsb_spearman": 0.855017005666453, | |
| "step": 12625 | |
| }, | |
| { | |
| "epoch": 0.82, | |
| "eval_avg_sts": 0.8251886392831695, | |
| "eval_sickr_spearman": 0.7935808570827266, | |
| "eval_stsb_spearman": 0.8567964214836123, | |
| "step": 12750 | |
| }, | |
| { | |
| "epoch": 0.82, | |
| "eval_avg_sts": 0.8255732979417849, | |
| "eval_sickr_spearman": 0.7939037701776952, | |
| "eval_stsb_spearman": 0.8572428257058746, | |
| "step": 12875 | |
| }, | |
| { | |
| "epoch": 0.83, | |
| "learning_rate": 4.088186356073212e-06, | |
| "loss": 0.0002, | |
| "step": 13000 | |
| }, | |
| { | |
| "epoch": 0.83, | |
| "eval_avg_sts": 0.8272525514506217, | |
| "eval_sickr_spearman": 0.7954193915835747, | |
| "eval_stsb_spearman": 0.8590857113176686, | |
| "step": 13000 | |
| }, | |
| { | |
| "epoch": 0.84, | |
| "eval_avg_sts": 0.8276110249953785, | |
| "eval_sickr_spearman": 0.7955957617880555, | |
| "eval_stsb_spearman": 0.8596262882027015, | |
| "step": 13125 | |
| }, | |
| { | |
| "epoch": 0.85, | |
| "eval_avg_sts": 0.8262806808137206, | |
| "eval_sickr_spearman": 0.792061729406442, | |
| "eval_stsb_spearman": 0.8604996322209992, | |
| "step": 13250 | |
| }, | |
| { | |
| "epoch": 0.86, | |
| "eval_avg_sts": 0.8270413161061019, | |
| "eval_sickr_spearman": 0.7918599027181991, | |
| "eval_stsb_spearman": 0.8622227294940048, | |
| "step": 13375 | |
| }, | |
| { | |
| "epoch": 0.86, | |
| "learning_rate": 3.976193523614489e-06, | |
| "loss": 0.0002, | |
| "step": 13500 | |
| }, | |
| { | |
| "epoch": 0.86, | |
| "eval_avg_sts": 0.8277173388272963, | |
| "eval_sickr_spearman": 0.7929541472711621, | |
| "eval_stsb_spearman": 0.8624805303834304, | |
| "step": 13500 | |
| }, | |
| { | |
| "epoch": 0.87, | |
| "eval_avg_sts": 0.8280371802211439, | |
| "eval_sickr_spearman": 0.7936189937772684, | |
| "eval_stsb_spearman": 0.8624553666650194, | |
| "step": 13625 | |
| }, | |
| { | |
| "epoch": 0.88, | |
| "eval_avg_sts": 0.8280087430461096, | |
| "eval_sickr_spearman": 0.7934894538966899, | |
| "eval_stsb_spearman": 0.8625280321955292, | |
| "step": 13750 | |
| }, | |
| { | |
| "epoch": 0.89, | |
| "eval_avg_sts": 0.8279846750031183, | |
| "eval_sickr_spearman": 0.7941465193643633, | |
| "eval_stsb_spearman": 0.8618228306418733, | |
| "step": 13875 | |
| }, | |
| { | |
| "epoch": 0.9, | |
| "learning_rate": 3.864200691155766e-06, | |
| "loss": 0.0001, | |
| "step": 14000 | |
| }, | |
| { | |
| "epoch": 0.9, | |
| "eval_avg_sts": 0.8281003824811937, | |
| "eval_sickr_spearman": 0.7943439752223754, | |
| "eval_stsb_spearman": 0.8618567897400118, | |
| "step": 14000 | |
| }, | |
| { | |
| "epoch": 0.9, | |
| "eval_avg_sts": 0.8280440185035953, | |
| "eval_sickr_spearman": 0.792904915392188, | |
| "eval_stsb_spearman": 0.8631831216150027, | |
| "step": 14125 | |
| }, | |
| { | |
| "epoch": 0.91, | |
| "eval_avg_sts": 0.8279193239585301, | |
| "eval_sickr_spearman": 0.7931221120328913, | |
| "eval_stsb_spearman": 0.8627165358841689, | |
| "step": 14250 | |
| }, | |
| { | |
| "epoch": 0.92, | |
| "eval_avg_sts": 0.8275099017452278, | |
| "eval_sickr_spearman": 0.793065195177687, | |
| "eval_stsb_spearman": 0.8619546083127685, | |
| "step": 14375 | |
| }, | |
| { | |
| "epoch": 0.93, | |
| "learning_rate": 3.7522078586970435e-06, | |
| "loss": 0.0001, | |
| "step": 14500 | |
| }, | |
| { | |
| "epoch": 0.93, | |
| "eval_avg_sts": 0.8275982959975564, | |
| "eval_sickr_spearman": 0.7935053521912658, | |
| "eval_stsb_spearman": 0.861691239803847, | |
| "step": 14500 | |
| }, | |
| { | |
| "epoch": 0.94, | |
| "eval_avg_sts": 0.8276150816017793, | |
| "eval_sickr_spearman": 0.7940267778284781, | |
| "eval_stsb_spearman": 0.8612033853750805, | |
| "step": 14625 | |
| }, | |
| { | |
| "epoch": 0.94, | |
| "eval_avg_sts": 0.8277678050001869, | |
| "eval_sickr_spearman": 0.7940122244047422, | |
| "eval_stsb_spearman": 0.8615233855956315, | |
| "step": 14750 | |
| }, | |
| { | |
| "epoch": 0.95, | |
| "eval_avg_sts": 0.827775044421294, | |
| "eval_sickr_spearman": 0.79435247672733, | |
| "eval_stsb_spearman": 0.861197612115258, | |
| "step": 14875 | |
| }, | |
| { | |
| "epoch": 0.96, | |
| "learning_rate": 3.6402150262383203e-06, | |
| "loss": 0.0002, | |
| "step": 15000 | |
| }, | |
| { | |
| "epoch": 0.96, | |
| "eval_avg_sts": 0.8265288786526938, | |
| "eval_sickr_spearman": 0.7941830230014563, | |
| "eval_stsb_spearman": 0.8588747343039312, | |
| "step": 15000 | |
| }, | |
| { | |
| "epoch": 0.97, | |
| "eval_avg_sts": 0.826595528411173, | |
| "eval_sickr_spearman": 0.7947538726420482, | |
| "eval_stsb_spearman": 0.8584371841802979, | |
| "step": 15125 | |
| }, | |
| { | |
| "epoch": 0.98, | |
| "eval_avg_sts": 0.8271259707838263, | |
| "eval_sickr_spearman": 0.7952840399397222, | |
| "eval_stsb_spearman": 0.8589679016279306, | |
| "step": 15250 | |
| }, | |
| { | |
| "epoch": 0.98, | |
| "eval_avg_sts": 0.8269049666463504, | |
| "eval_sickr_spearman": 0.7927316191781993, | |
| "eval_stsb_spearman": 0.8610783141145013, | |
| "step": 15375 | |
| }, | |
| { | |
| "epoch": 0.99, | |
| "learning_rate": 3.5282221937795976e-06, | |
| "loss": 0.0003, | |
| "step": 15500 | |
| }, | |
| { | |
| "epoch": 0.99, | |
| "eval_avg_sts": 0.82737580758211, | |
| "eval_sickr_spearman": 0.7935406550508229, | |
| "eval_stsb_spearman": 0.8612109601133972, | |
| "step": 15500 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_avg_sts": 0.8264028870845463, | |
| "eval_sickr_spearman": 0.7940738673657366, | |
| "eval_stsb_spearman": 0.8587319068033561, | |
| "step": 15625 | |
| }, | |
| { | |
| "epoch": 1.01, | |
| "eval_avg_sts": 0.8268441102829658, | |
| "eval_sickr_spearman": 0.7937048253555384, | |
| "eval_stsb_spearman": 0.8599833952103932, | |
| "step": 15750 | |
| }, | |
| { | |
| "epoch": 1.02, | |
| "eval_avg_sts": 0.8275739286019619, | |
| "eval_sickr_spearman": 0.7947639591733503, | |
| "eval_stsb_spearman": 0.8603838980305735, | |
| "step": 15875 | |
| }, | |
| { | |
| "epoch": 1.02, | |
| "learning_rate": 3.4162293613208757e-06, | |
| "loss": 0.0001, | |
| "step": 16000 | |
| }, | |
| { | |
| "epoch": 1.02, | |
| "eval_avg_sts": 0.8277768410299685, | |
| "eval_sickr_spearman": 0.7952131460339995, | |
| "eval_stsb_spearman": 0.8603405360259375, | |
| "step": 16000 | |
| }, | |
| { | |
| "epoch": 1.03, | |
| "eval_avg_sts": 0.8282682698041279, | |
| "eval_sickr_spearman": 0.7963400997670419, | |
| "eval_stsb_spearman": 0.860196439841214, | |
| "step": 16125 | |
| }, | |
| { | |
| "epoch": 1.04, | |
| "eval_avg_sts": 0.8264618348746703, | |
| "eval_sickr_spearman": 0.7934643816617393, | |
| "eval_stsb_spearman": 0.8594592880876013, | |
| "step": 16250 | |
| }, | |
| { | |
| "epoch": 1.05, | |
| "eval_avg_sts": 0.8264717428559492, | |
| "eval_sickr_spearman": 0.7932766280862176, | |
| "eval_stsb_spearman": 0.8596668576256806, | |
| "step": 16375 | |
| }, | |
| { | |
| "epoch": 1.06, | |
| "learning_rate": 3.304236528862153e-06, | |
| "loss": 0.0002, | |
| "step": 16500 | |
| }, | |
| { | |
| "epoch": 1.06, | |
| "eval_avg_sts": 0.8274883631622513, | |
| "eval_sickr_spearman": 0.7946689056236043, | |
| "eval_stsb_spearman": 0.8603078207008983, | |
| "step": 16500 | |
| }, | |
| { | |
| "epoch": 1.06, | |
| "eval_avg_sts": 0.8285054599151072, | |
| "eval_sickr_spearman": 0.7953375465867241, | |
| "eval_stsb_spearman": 0.8616733732434904, | |
| "step": 16625 | |
| }, | |
| { | |
| "epoch": 1.07, | |
| "eval_avg_sts": 0.8267040342845151, | |
| "eval_sickr_spearman": 0.7930167317963359, | |
| "eval_stsb_spearman": 0.8603913367726943, | |
| "step": 16750 | |
| }, | |
| { | |
| "epoch": 1.08, | |
| "eval_avg_sts": 0.8254063226482575, | |
| "eval_sickr_spearman": 0.7925604363326739, | |
| "eval_stsb_spearman": 0.8582522089638411, | |
| "step": 16875 | |
| }, | |
| { | |
| "epoch": 1.09, | |
| "learning_rate": 3.19224369640343e-06, | |
| "loss": 0.0003, | |
| "step": 17000 | |
| }, | |
| { | |
| "epoch": 1.09, | |
| "eval_avg_sts": 0.8263459648804743, | |
| "eval_sickr_spearman": 0.7938006474029073, | |
| "eval_stsb_spearman": 0.8588912823580412, | |
| "step": 17000 | |
| }, | |
| { | |
| "epoch": 1.1, | |
| "eval_avg_sts": 0.8265585284525776, | |
| "eval_sickr_spearman": 0.7938499273129829, | |
| "eval_stsb_spearman": 0.8592671295921722, | |
| "step": 17125 | |
| }, | |
| { | |
| "epoch": 1.1, | |
| "eval_avg_sts": 0.8275713806370856, | |
| "eval_sickr_spearman": 0.795413819975808, | |
| "eval_stsb_spearman": 0.8597289412983632, | |
| "step": 17250 | |
| }, | |
| { | |
| "epoch": 1.11, | |
| "eval_avg_sts": 0.8278030720022054, | |
| "eval_sickr_spearman": 0.7957596439061624, | |
| "eval_stsb_spearman": 0.8598465000982485, | |
| "step": 17375 | |
| }, | |
| { | |
| "epoch": 1.12, | |
| "learning_rate": 3.0802508639447074e-06, | |
| "loss": 0.0003, | |
| "step": 17500 | |
| }, | |
| { | |
| "epoch": 1.12, | |
| "eval_avg_sts": 0.828665230451958, | |
| "eval_sickr_spearman": 0.7959547942713053, | |
| "eval_stsb_spearman": 0.8613756666326104, | |
| "step": 17500 | |
| }, | |
| { | |
| "epoch": 1.13, | |
| "eval_avg_sts": 0.8288773890103436, | |
| "eval_sickr_spearman": 0.7964317911396872, | |
| "eval_stsb_spearman": 0.861322986881, | |
| "step": 17625 | |
| }, | |
| { | |
| "epoch": 1.14, | |
| "eval_avg_sts": 0.8287921576974288, | |
| "eval_sickr_spearman": 0.7965225699214054, | |
| "eval_stsb_spearman": 0.8610617454734522, | |
| "step": 17750 | |
| }, | |
| { | |
| "epoch": 1.14, | |
| "eval_avg_sts": 0.8287755856452497, | |
| "eval_sickr_spearman": 0.7967101794036225, | |
| "eval_stsb_spearman": 0.8608409918868768, | |
| "step": 17875 | |
| }, | |
| { | |
| "epoch": 1.15, | |
| "learning_rate": 2.9682580314859847e-06, | |
| "loss": 0.0001, | |
| "step": 18000 | |
| }, | |
| { | |
| "epoch": 1.15, | |
| "eval_avg_sts": 0.8292774010789281, | |
| "eval_sickr_spearman": 0.7969440428365246, | |
| "eval_stsb_spearman": 0.8616107593213317, | |
| "step": 18000 | |
| }, | |
| { | |
| "epoch": 1.16, | |
| "eval_avg_sts": 0.8293137062967321, | |
| "eval_sickr_spearman": 0.7971494238262741, | |
| "eval_stsb_spearman": 0.8614779887671901, | |
| "step": 18125 | |
| }, | |
| { | |
| "epoch": 1.17, | |
| "eval_avg_sts": 0.8293003591512393, | |
| "eval_sickr_spearman": 0.7972976478053122, | |
| "eval_stsb_spearman": 0.8613030704971664, | |
| "step": 18250 | |
| }, | |
| { | |
| "epoch": 1.18, | |
| "eval_avg_sts": 0.8269276043107123, | |
| "eval_sickr_spearman": 0.7936150552269506, | |
| "eval_stsb_spearman": 0.8602401533944739, | |
| "step": 18375 | |
| }, | |
| { | |
| "epoch": 1.18, | |
| "learning_rate": 2.8562651990272623e-06, | |
| "loss": 0.0001, | |
| "step": 18500 | |
| }, | |
| { | |
| "epoch": 1.18, | |
| "eval_avg_sts": 0.8271598852494388, | |
| "eval_sickr_spearman": 0.7938677468516165, | |
| "eval_stsb_spearman": 0.8604520236472611, | |
| "step": 18500 | |
| }, | |
| { | |
| "epoch": 1.19, | |
| "eval_avg_sts": 0.8273011691673453, | |
| "eval_sickr_spearman": 0.7941100157272702, | |
| "eval_stsb_spearman": 0.8604923226074204, | |
| "step": 18625 | |
| }, | |
| { | |
| "epoch": 1.2, | |
| "eval_avg_sts": 0.8274659412451935, | |
| "eval_sickr_spearman": 0.7943473373994759, | |
| "eval_stsb_spearman": 0.860584545090911, | |
| "step": 18750 | |
| }, | |
| { | |
| "epoch": 1.21, | |
| "eval_avg_sts": 0.8273871753451842, | |
| "eval_sickr_spearman": 0.7941770191137765, | |
| "eval_stsb_spearman": 0.8605973315765919, | |
| "step": 18875 | |
| }, | |
| { | |
| "epoch": 1.22, | |
| "learning_rate": 2.7442723665685396e-06, | |
| "loss": 0.0002, | |
| "step": 19000 | |
| }, | |
| { | |
| "epoch": 1.22, | |
| "eval_avg_sts": 0.8268924907436139, | |
| "eval_sickr_spearman": 0.7941484406084208, | |
| "eval_stsb_spearman": 0.859636540878807, | |
| "step": 19000 | |
| }, | |
| { | |
| "epoch": 1.22, | |
| "eval_avg_sts": 0.8258034139625235, | |
| "eval_sickr_spearman": 0.7932116900370734, | |
| "eval_stsb_spearman": 0.8583951378879737, | |
| "step": 19125 | |
| }, | |
| { | |
| "epoch": 1.23, | |
| "eval_avg_sts": 0.8252544789859086, | |
| "eval_sickr_spearman": 0.7925500616147634, | |
| "eval_stsb_spearman": 0.857958896357054, | |
| "step": 19250 | |
| }, | |
| { | |
| "epoch": 1.24, | |
| "eval_avg_sts": 0.8253536873185088, | |
| "eval_sickr_spearman": 0.7926197067118486, | |
| "eval_stsb_spearman": 0.858087667925169, | |
| "step": 19375 | |
| }, | |
| { | |
| "epoch": 1.25, | |
| "learning_rate": 2.632279534109817e-06, | |
| "loss": 0.0002, | |
| "step": 19500 | |
| }, | |
| { | |
| "epoch": 1.25, | |
| "eval_avg_sts": 0.8259692031147807, | |
| "eval_sickr_spearman": 0.7942922457261266, | |
| "eval_stsb_spearman": 0.8576461605034348, | |
| "step": 19500 | |
| }, | |
| { | |
| "epoch": 1.26, | |
| "eval_avg_sts": 0.8262977896726795, | |
| "eval_sickr_spearman": 0.7945857637870148, | |
| "eval_stsb_spearman": 0.8580098155583442, | |
| "step": 19625 | |
| }, | |
| { | |
| "epoch": 1.26, | |
| "eval_avg_sts": 0.8265435124446001, | |
| "eval_sickr_spearman": 0.7949808676274447, | |
| "eval_stsb_spearman": 0.8581061572617555, | |
| "step": 19750 | |
| }, | |
| { | |
| "epoch": 1.27, | |
| "eval_avg_sts": 0.82660901551375, | |
| "eval_sickr_spearman": 0.795241820601558, | |
| "eval_stsb_spearman": 0.8579762104259421, | |
| "step": 19875 | |
| }, | |
| { | |
| "epoch": 1.28, | |
| "learning_rate": 2.5202867016510945e-06, | |
| "loss": 0.0001, | |
| "step": 20000 | |
| }, | |
| { | |
| "epoch": 1.28, | |
| "eval_avg_sts": 0.8249759667991925, | |
| "eval_sickr_spearman": 0.7929103429066506, | |
| "eval_stsb_spearman": 0.8570415906917342, | |
| "step": 20000 | |
| }, | |
| { | |
| "epoch": 1.29, | |
| "eval_avg_sts": 0.8252695158247048, | |
| "eval_sickr_spearman": 0.7941818702550217, | |
| "eval_stsb_spearman": 0.8563571613943879, | |
| "step": 20125 | |
| }, | |
| { | |
| "epoch": 1.3, | |
| "eval_avg_sts": 0.8254168575586551, | |
| "eval_sickr_spearman": 0.794336146152841, | |
| "eval_stsb_spearman": 0.8564975689644694, | |
| "step": 20250 | |
| }, | |
| { | |
| "epoch": 1.3, | |
| "eval_avg_sts": 0.8259865535716795, | |
| "eval_sickr_spearman": 0.7950048831781639, | |
| "eval_stsb_spearman": 0.8569682239651952, | |
| "step": 20375 | |
| }, | |
| { | |
| "epoch": 1.31, | |
| "learning_rate": 2.4082938691923718e-06, | |
| "loss": 0.0001, | |
| "step": 20500 | |
| }, | |
| { | |
| "epoch": 1.31, | |
| "eval_avg_sts": 0.826209318888689, | |
| "eval_sickr_spearman": 0.7952033957204077, | |
| "eval_stsb_spearman": 0.8572152420569702, | |
| "step": 20500 | |
| }, | |
| { | |
| "epoch": 1.32, | |
| "eval_avg_sts": 0.8259891403986184, | |
| "eval_sickr_spearman": 0.7948762078574111, | |
| "eval_stsb_spearman": 0.8571020729398255, | |
| "step": 20625 | |
| }, | |
| { | |
| "epoch": 1.33, | |
| "eval_avg_sts": 0.8259890083537097, | |
| "eval_sickr_spearman": 0.7947911447767642, | |
| "eval_stsb_spearman": 0.8571868719306552, | |
| "step": 20750 | |
| }, | |
| { | |
| "epoch": 1.34, | |
| "eval_avg_sts": 0.8261152907691348, | |
| "eval_sickr_spearman": 0.7949135280232285, | |
| "eval_stsb_spearman": 0.8573170535150412, | |
| "step": 20875 | |
| }, | |
| { | |
| "epoch": 1.34, | |
| "learning_rate": 2.296301036733649e-06, | |
| "loss": 0.0001, | |
| "step": 21000 | |
| }, | |
| { | |
| "epoch": 1.34, | |
| "eval_avg_sts": 0.826274962054796, | |
| "eval_sickr_spearman": 0.7950501284757184, | |
| "eval_stsb_spearman": 0.8574997956338737, | |
| "step": 21000 | |
| }, | |
| { | |
| "epoch": 1.35, | |
| "eval_avg_sts": 0.8260486313726075, | |
| "eval_sickr_spearman": 0.794899647034913, | |
| "eval_stsb_spearman": 0.8571976157103021, | |
| "step": 21125 | |
| }, | |
| { | |
| "epoch": 1.36, | |
| "eval_avg_sts": 0.825587114078729, | |
| "eval_sickr_spearman": 0.7946725559873136, | |
| "eval_stsb_spearman": 0.8565016721701444, | |
| "step": 21250 | |
| }, | |
| { | |
| "epoch": 1.37, | |
| "eval_avg_sts": 0.8256303672089018, | |
| "eval_sickr_spearman": 0.7944853787850091, | |
| "eval_stsb_spearman": 0.8567753556327944, | |
| "step": 21375 | |
| }, | |
| { | |
| "epoch": 1.38, | |
| "learning_rate": 2.1843082042749267e-06, | |
| "loss": 0.0002, | |
| "step": 21500 | |
| }, | |
| { | |
| "epoch": 1.38, | |
| "eval_avg_sts": 0.8254654257169443, | |
| "eval_sickr_spearman": 0.7936856129149631, | |
| "eval_stsb_spearman": 0.8572452385189255, | |
| "step": 21500 | |
| }, | |
| { | |
| "epoch": 1.38, | |
| "eval_avg_sts": 0.8257646791990041, | |
| "eval_sickr_spearman": 0.7941317738162218, | |
| "eval_stsb_spearman": 0.8573975845817864, | |
| "step": 21625 | |
| }, | |
| { | |
| "epoch": 1.39, | |
| "eval_avg_sts": 0.8263390736725806, | |
| "eval_sickr_spearman": 0.7947459955414125, | |
| "eval_stsb_spearman": 0.8579321518037489, | |
| "step": 21750 | |
| }, | |
| { | |
| "epoch": 1.4, | |
| "eval_avg_sts": 0.825957826826842, | |
| "eval_sickr_spearman": 0.7945194808670303, | |
| "eval_stsb_spearman": 0.8573961727866538, | |
| "step": 21875 | |
| }, | |
| { | |
| "epoch": 1.41, | |
| "learning_rate": 2.072315371816204e-06, | |
| "loss": 0.0001, | |
| "step": 22000 | |
| }, | |
| { | |
| "epoch": 1.41, | |
| "eval_avg_sts": 0.8257198535359889, | |
| "eval_sickr_spearman": 0.7936219236744562, | |
| "eval_stsb_spearman": 0.8578177833975217, | |
| "step": 22000 | |
| }, | |
| { | |
| "epoch": 1.42, | |
| "eval_avg_sts": 0.8270054813778303, | |
| "eval_sickr_spearman": 0.7958380306637094, | |
| "eval_stsb_spearman": 0.858172932091951, | |
| "step": 22125 | |
| }, | |
| { | |
| "epoch": 1.42, | |
| "eval_avg_sts": 0.8270091578481822, | |
| "eval_sickr_spearman": 0.7962583028012928, | |
| "eval_stsb_spearman": 0.8577600128950715, | |
| "step": 22250 | |
| }, | |
| { | |
| "epoch": 1.43, | |
| "eval_avg_sts": 0.8259725703398417, | |
| "eval_sickr_spearman": 0.7959245346773993, | |
| "eval_stsb_spearman": 0.8560206060022842, | |
| "step": 22375 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "learning_rate": 1.9603225393574807e-06, | |
| "loss": 0.0002, | |
| "step": 22500 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "eval_avg_sts": 0.8254714237214871, | |
| "eval_sickr_spearman": 0.7955676635937141, | |
| "eval_stsb_spearman": 0.8553751838492601, | |
| "step": 22500 | |
| }, | |
| { | |
| "epoch": 1.45, | |
| "eval_avg_sts": 0.8243312613565763, | |
| "eval_sickr_spearman": 0.7926490056837258, | |
| "eval_stsb_spearman": 0.8560135170294269, | |
| "step": 22625 | |
| }, | |
| { | |
| "epoch": 1.46, | |
| "eval_avg_sts": 0.8244931271533935, | |
| "eval_sickr_spearman": 0.7931114971594734, | |
| "eval_stsb_spearman": 0.8558747571473136, | |
| "step": 22750 | |
| }, | |
| { | |
| "epoch": 1.46, | |
| "eval_avg_sts": 0.8245178381258861, | |
| "eval_sickr_spearman": 0.7931850518122927, | |
| "eval_stsb_spearman": 0.8558506244394795, | |
| "step": 22875 | |
| }, | |
| { | |
| "epoch": 1.47, | |
| "learning_rate": 1.8483297068987584e-06, | |
| "loss": 0.0002, | |
| "step": 23000 | |
| }, | |
| { | |
| "epoch": 1.47, | |
| "eval_avg_sts": 0.8250123369922542, | |
| "eval_sickr_spearman": 0.7931228324994128, | |
| "eval_stsb_spearman": 0.8569018414850956, | |
| "step": 23000 | |
| }, | |
| { | |
| "epoch": 1.48, | |
| "eval_avg_sts": 0.8254867372327745, | |
| "eval_sickr_spearman": 0.7938168819151935, | |
| "eval_stsb_spearman": 0.8571565925503556, | |
| "step": 23125 | |
| }, | |
| { | |
| "epoch": 1.49, | |
| "eval_avg_sts": 0.8256499116596692, | |
| "eval_sickr_spearman": 0.7939716381240272, | |
| "eval_stsb_spearman": 0.8573281851953113, | |
| "step": 23250 | |
| }, | |
| { | |
| "epoch": 1.5, | |
| "eval_avg_sts": 0.8258346679802114, | |
| "eval_sickr_spearman": 0.7940527146232547, | |
| "eval_stsb_spearman": 0.8576166213371682, | |
| "step": 23375 | |
| }, | |
| { | |
| "epoch": 1.5, | |
| "learning_rate": 1.7363368744400357e-06, | |
| "loss": 0.0001, | |
| "step": 23500 | |
| }, | |
| { | |
| "epoch": 1.5, | |
| "eval_avg_sts": 0.825945269207895, | |
| "eval_sickr_spearman": 0.7943781253354978, | |
| "eval_stsb_spearman": 0.8575124130802922, | |
| "step": 23500 | |
| }, | |
| { | |
| "epoch": 1.51, | |
| "eval_avg_sts": 0.8258713568091718, | |
| "eval_sickr_spearman": 0.794315540810324, | |
| "eval_stsb_spearman": 0.8574271728080196, | |
| "step": 23625 | |
| }, | |
| { | |
| "epoch": 1.52, | |
| "eval_avg_sts": 0.8258355435328646, | |
| "eval_sickr_spearman": 0.7940151062708286, | |
| "eval_stsb_spearman": 0.8576559807949005, | |
| "step": 23750 | |
| }, | |
| { | |
| "epoch": 1.53, | |
| "eval_avg_sts": 0.8257865803230886, | |
| "eval_sickr_spearman": 0.7940416194388225, | |
| "eval_stsb_spearman": 0.8575315412073548, | |
| "step": 23875 | |
| }, | |
| { | |
| "epoch": 1.54, | |
| "learning_rate": 1.6243440419813131e-06, | |
| "loss": 0.0002, | |
| "step": 24000 | |
| }, | |
| { | |
| "epoch": 1.54, | |
| "eval_avg_sts": 0.8258057571249391, | |
| "eval_sickr_spearman": 0.7941539161539849, | |
| "eval_stsb_spearman": 0.8574575980958933, | |
| "step": 24000 | |
| }, | |
| { | |
| "epoch": 1.54, | |
| "eval_avg_sts": 0.8258599414659757, | |
| "eval_sickr_spearman": 0.7942335517201692, | |
| "eval_stsb_spearman": 0.8574863312117823, | |
| "step": 24125 | |
| }, | |
| { | |
| "epoch": 1.55, | |
| "eval_avg_sts": 0.8259837419138151, | |
| "eval_sickr_spearman": 0.7943245706573944, | |
| "eval_stsb_spearman": 0.8576429131702358, | |
| "step": 24250 | |
| }, | |
| { | |
| "epoch": 1.56, | |
| "eval_avg_sts": 0.8273046944370666, | |
| "eval_sickr_spearman": 0.7953777005875265, | |
| "eval_stsb_spearman": 0.8592316882866066, | |
| "step": 24375 | |
| }, | |
| { | |
| "epoch": 1.57, | |
| "learning_rate": 1.5123512095225906e-06, | |
| "loss": 0.0001, | |
| "step": 24500 | |
| }, | |
| { | |
| "epoch": 1.57, | |
| "eval_avg_sts": 0.8270336322444836, | |
| "eval_sickr_spearman": 0.7948833644915253, | |
| "eval_stsb_spearman": 0.8591838999974419, | |
| "step": 24500 | |
| }, | |
| { | |
| "epoch": 1.58, | |
| "eval_avg_sts": 0.8268251999183458, | |
| "eval_sickr_spearman": 0.7944777418398805, | |
| "eval_stsb_spearman": 0.8591726579968111, | |
| "step": 24625 | |
| }, | |
| { | |
| "epoch": 1.58, | |
| "eval_avg_sts": 0.8267020534374147, | |
| "eval_sickr_spearman": 0.7943936393812624, | |
| "eval_stsb_spearman": 0.8590104674935669, | |
| "step": 24750 | |
| }, | |
| { | |
| "epoch": 1.59, | |
| "eval_avg_sts": 0.825917107993902, | |
| "eval_sickr_spearman": 0.7938579965380246, | |
| "eval_stsb_spearman": 0.8579762194497796, | |
| "step": 24875 | |
| }, | |
| { | |
| "epoch": 1.6, | |
| "learning_rate": 1.4003583770638678e-06, | |
| "loss": 0.0002, | |
| "step": 25000 | |
| }, | |
| { | |
| "epoch": 1.6, | |
| "eval_avg_sts": 0.8263527703022291, | |
| "eval_sickr_spearman": 0.7941290360434399, | |
| "eval_stsb_spearman": 0.8585765045610182, | |
| "step": 25000 | |
| }, | |
| { | |
| "epoch": 1.61, | |
| "eval_avg_sts": 0.8269584920385149, | |
| "eval_sickr_spearman": 0.7941601601971716, | |
| "eval_stsb_spearman": 0.8597568238798581, | |
| "step": 25125 | |
| }, | |
| { | |
| "epoch": 1.62, | |
| "eval_avg_sts": 0.8264998215853827, | |
| "eval_sickr_spearman": 0.7927663936956405, | |
| "eval_stsb_spearman": 0.8602332494751249, | |
| "step": 25250 | |
| }, | |
| { | |
| "epoch": 1.62, | |
| "eval_avg_sts": 0.825942745088348, | |
| "eval_sickr_spearman": 0.7922521246925426, | |
| "eval_stsb_spearman": 0.8596333654841534, | |
| "step": 25375 | |
| }, | |
| { | |
| "epoch": 1.63, | |
| "learning_rate": 1.2883655446051453e-06, | |
| "loss": 0.0001, | |
| "step": 25500 | |
| }, | |
| { | |
| "epoch": 1.63, | |
| "eval_avg_sts": 0.8259010696773026, | |
| "eval_sickr_spearman": 0.7922646127789166, | |
| "eval_stsb_spearman": 0.8595375265756887, | |
| "step": 25500 | |
| }, | |
| { | |
| "epoch": 1.64, | |
| "eval_avg_sts": 0.8259285307896478, | |
| "eval_sickr_spearman": 0.7926812825838921, | |
| "eval_stsb_spearman": 0.8591757789954035, | |
| "step": 25625 | |
| }, | |
| { | |
| "epoch": 1.65, | |
| "eval_avg_sts": 0.8258391793675839, | |
| "eval_sickr_spearman": 0.7926954517588166, | |
| "eval_stsb_spearman": 0.858982906976351, | |
| "step": 25750 | |
| }, | |
| { | |
| "epoch": 1.66, | |
| "eval_avg_sts": 0.8258409312899861, | |
| "eval_sickr_spearman": 0.7928338293620596, | |
| "eval_stsb_spearman": 0.8588480332179126, | |
| "step": 25875 | |
| }, | |
| { | |
| "epoch": 1.66, | |
| "learning_rate": 1.1763727121464225e-06, | |
| "loss": 0.0001, | |
| "step": 26000 | |
| }, | |
| { | |
| "epoch": 1.66, | |
| "eval_avg_sts": 0.8251984305884675, | |
| "eval_sickr_spearman": 0.7933060231202977, | |
| "eval_stsb_spearman": 0.8570908380566373, | |
| "step": 26000 | |
| }, | |
| { | |
| "epoch": 1.67, | |
| "eval_avg_sts": 0.8253196217152283, | |
| "eval_sickr_spearman": 0.7932125065657978, | |
| "eval_stsb_spearman": 0.8574267368646588, | |
| "step": 26125 | |
| }, | |
| { | |
| "epoch": 1.68, | |
| "eval_avg_sts": 0.8253745698430313, | |
| "eval_sickr_spearman": 0.7933913263564519, | |
| "eval_stsb_spearman": 0.8573578133296105, | |
| "step": 26250 | |
| }, | |
| { | |
| "epoch": 1.69, | |
| "eval_avg_sts": 0.825411316540875, | |
| "eval_sickr_spearman": 0.7934114513879544, | |
| "eval_stsb_spearman": 0.8574111816937955, | |
| "step": 26375 | |
| }, | |
| { | |
| "epoch": 1.7, | |
| "learning_rate": 1.0643798796877e-06, | |
| "loss": 0.0001, | |
| "step": 26500 | |
| }, | |
| { | |
| "epoch": 1.7, | |
| "eval_avg_sts": 0.8249370852399975, | |
| "eval_sickr_spearman": 0.7937128945805799, | |
| "eval_stsb_spearman": 0.8561612758994152, | |
| "step": 26500 | |
| }, | |
| { | |
| "epoch": 1.7, | |
| "eval_avg_sts": 0.825459765367129, | |
| "eval_sickr_spearman": 0.7933420944774778, | |
| "eval_stsb_spearman": 0.8575774362567802, | |
| "step": 26625 | |
| }, | |
| { | |
| "epoch": 1.71, | |
| "eval_avg_sts": 0.826427995376563, | |
| "eval_sickr_spearman": 0.7947685701590883, | |
| "eval_stsb_spearman": 0.8580874205940376, | |
| "step": 26750 | |
| }, | |
| { | |
| "epoch": 1.72, | |
| "eval_avg_sts": 0.8258856380174763, | |
| "eval_sickr_spearman": 0.7942930142237495, | |
| "eval_stsb_spearman": 0.857478261811203, | |
| "step": 26875 | |
| }, | |
| { | |
| "epoch": 1.73, | |
| "learning_rate": 9.523870472289774e-07, | |
| "loss": 0.0002, | |
| "step": 27000 | |
| }, | |
| { | |
| "epoch": 1.73, | |
| "eval_avg_sts": 0.8258593024414255, | |
| "eval_sickr_spearman": 0.7941693821686479, | |
| "eval_stsb_spearman": 0.8575492227142031, | |
| "step": 27000 | |
| }, | |
| { | |
| "epoch": 1.74, | |
| "eval_avg_sts": 0.8258720619743833, | |
| "eval_sickr_spearman": 0.7941788923267327, | |
| "eval_stsb_spearman": 0.857565231622034, | |
| "step": 27125 | |
| }, | |
| { | |
| "epoch": 1.74, | |
| "eval_avg_sts": 0.8259531389747516, | |
| "eval_sickr_spearman": 0.7941532917496662, | |
| "eval_stsb_spearman": 0.8577529861998372, | |
| "step": 27250 | |
| }, | |
| { | |
| "epoch": 1.75, | |
| "eval_avg_sts": 0.825969657799255, | |
| "eval_sickr_spearman": 0.7942109771024933, | |
| "eval_stsb_spearman": 0.8577283384960166, | |
| "step": 27375 | |
| }, | |
| { | |
| "epoch": 1.76, | |
| "learning_rate": 8.403942147702547e-07, | |
| "loss": 0.0002, | |
| "step": 27500 | |
| }, | |
| { | |
| "epoch": 1.76, | |
| "eval_avg_sts": 0.8259987251545413, | |
| "eval_sickr_spearman": 0.7943161171835413, | |
| "eval_stsb_spearman": 0.8576813331255413, | |
| "step": 27500 | |
| }, | |
| { | |
| "epoch": 1.77, | |
| "eval_avg_sts": 0.8252131722274082, | |
| "eval_sickr_spearman": 0.793231382788663, | |
| "eval_stsb_spearman": 0.8571949616661534, | |
| "step": 27625 | |
| }, | |
| { | |
| "epoch": 1.78, | |
| "eval_avg_sts": 0.8252604604270115, | |
| "eval_sickr_spearman": 0.7933024207876899, | |
| "eval_stsb_spearman": 0.857218500066333, | |
| "step": 27750 | |
| }, | |
| { | |
| "epoch": 1.78, | |
| "eval_avg_sts": 0.8251969961170478, | |
| "eval_sickr_spearman": 0.793198385421975, | |
| "eval_stsb_spearman": 0.8571956068121205, | |
| "step": 27875 | |
| }, | |
| { | |
| "epoch": 1.79, | |
| "learning_rate": 7.284013823115321e-07, | |
| "loss": 0.0002, | |
| "step": 28000 | |
| }, | |
| { | |
| "epoch": 1.79, | |
| "eval_avg_sts": 0.825311717070901, | |
| "eval_sickr_spearman": 0.7931744179023573, | |
| "eval_stsb_spearman": 0.8574490162394447, | |
| "step": 28000 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "eval_avg_sts": 0.8256482381761492, | |
| "eval_sickr_spearman": 0.7934648139416521, | |
| "eval_stsb_spearman": 0.8578316624106462, | |
| "step": 28125 | |
| }, | |
| { | |
| "epoch": 1.81, | |
| "eval_avg_sts": 0.8261129479959839, | |
| "eval_sickr_spearman": 0.7939418588411357, | |
| "eval_stsb_spearman": 0.858284037150832, | |
| "step": 28250 | |
| }, | |
| { | |
| "epoch": 1.82, | |
| "eval_avg_sts": 0.8262712326490254, | |
| "eval_sickr_spearman": 0.7933230261302068, | |
| "eval_stsb_spearman": 0.8592194391678438, | |
| "step": 28375 | |
| }, | |
| { | |
| "epoch": 1.82, | |
| "learning_rate": 6.164085498528094e-07, | |
| "loss": 0.0002, | |
| "step": 28500 | |
| }, | |
| { | |
| "epoch": 1.82, | |
| "eval_avg_sts": 0.8262943695062834, | |
| "eval_sickr_spearman": 0.7934199048618075, | |
| "eval_stsb_spearman": 0.8591688341507593, | |
| "step": 28500 | |
| }, | |
| { | |
| "epoch": 1.83, | |
| "eval_avg_sts": 0.8260598340905722, | |
| "eval_sickr_spearman": 0.7933951208134654, | |
| "eval_stsb_spearman": 0.8587245473676789, | |
| "step": 28625 | |
| }, | |
| { | |
| "epoch": 1.84, | |
| "eval_avg_sts": 0.8259360112469695, | |
| "eval_sickr_spearman": 0.7933420944774778, | |
| "eval_stsb_spearman": 0.8585299280164611, | |
| "step": 28750 | |
| }, | |
| { | |
| "epoch": 1.85, | |
| "eval_avg_sts": 0.8258330858999741, | |
| "eval_sickr_spearman": 0.7933054467470805, | |
| "eval_stsb_spearman": 0.8583607250528676, | |
| "step": 28875 | |
| }, | |
| { | |
| "epoch": 1.86, | |
| "learning_rate": 5.044157173940868e-07, | |
| "loss": 0.0001, | |
| "step": 29000 | |
| }, | |
| { | |
| "epoch": 1.86, | |
| "eval_avg_sts": 0.8258376969438936, | |
| "eval_sickr_spearman": 0.7933141884075422, | |
| "eval_stsb_spearman": 0.8583612054802452, | |
| "step": 29000 | |
| }, | |
| { | |
| "epoch": 1.86, | |
| "eval_avg_sts": 0.8259136180644091, | |
| "eval_sickr_spearman": 0.7933194718287004, | |
| "eval_stsb_spearman": 0.8585077643001178, | |
| "step": 29125 | |
| }, | |
| { | |
| "epoch": 1.87, | |
| "eval_avg_sts": 0.825910175107258, | |
| "eval_sickr_spearman": 0.7933039097518345, | |
| "eval_stsb_spearman": 0.8585164404626813, | |
| "step": 29250 | |
| }, | |
| { | |
| "epoch": 1.88, | |
| "eval_avg_sts": 0.8258308833879402, | |
| "eval_sickr_spearman": 0.7933173584602371, | |
| "eval_stsb_spearman": 0.8583444083156432, | |
| "step": 29375 | |
| }, | |
| { | |
| "epoch": 1.89, | |
| "learning_rate": 3.9242288493536413e-07, | |
| "loss": 0.0001, | |
| "step": 29500 | |
| }, | |
| { | |
| "epoch": 1.89, | |
| "eval_avg_sts": 0.8257221328599513, | |
| "eval_sickr_spearman": 0.7931374819853514, | |
| "eval_stsb_spearman": 0.8583067837345514, | |
| "step": 29500 | |
| }, | |
| { | |
| "epoch": 1.9, | |
| "eval_avg_sts": 0.825786763719202, | |
| "eval_sickr_spearman": 0.7932694234210019, | |
| "eval_stsb_spearman": 0.858304104017402, | |
| "step": 29625 | |
| }, | |
| { | |
| "epoch": 1.9, | |
| "eval_avg_sts": 0.8257681951340192, | |
| "eval_sickr_spearman": 0.7932804705743327, | |
| "eval_stsb_spearman": 0.8582559196937056, | |
| "step": 29750 | |
| }, | |
| { | |
| "epoch": 1.91, | |
| "eval_avg_sts": 0.8258082608558808, | |
| "eval_sickr_spearman": 0.7933519408532725, | |
| "eval_stsb_spearman": 0.8582645808584891, | |
| "step": 29875 | |
| }, | |
| { | |
| "epoch": 1.92, | |
| "learning_rate": 2.804300524766415e-07, | |
| "loss": 0.0001, | |
| "step": 30000 | |
| }, | |
| { | |
| "epoch": 1.92, | |
| "eval_avg_sts": 0.8258262861889483, | |
| "eval_sickr_spearman": 0.7933999719547107, | |
| "eval_stsb_spearman": 0.8582526004231857, | |
| "step": 30000 | |
| }, | |
| { | |
| "epoch": 1.93, | |
| "eval_avg_sts": 0.8256086631585, | |
| "eval_sickr_spearman": 0.7930556369885008, | |
| "eval_stsb_spearman": 0.8581616893284993, | |
| "step": 30125 | |
| }, | |
| { | |
| "epoch": 1.94, | |
| "eval_avg_sts": 0.8256480515518101, | |
| "eval_sickr_spearman": 0.7931325828130048, | |
| "eval_stsb_spearman": 0.8581635202906153, | |
| "step": 30250 | |
| }, | |
| { | |
| "epoch": 1.94, | |
| "eval_avg_sts": 0.8258219208455879, | |
| "eval_sickr_spearman": 0.7934267252782117, | |
| "eval_stsb_spearman": 0.8582171164129642, | |
| "step": 30375 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "learning_rate": 1.6843722001791884e-07, | |
| "loss": 0.0002, | |
| "step": 30500 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "eval_avg_sts": 0.8258322719939588, | |
| "eval_sickr_spearman": 0.7934731233222009, | |
| "eval_stsb_spearman": 0.8581914206657169, | |
| "step": 30500 | |
| }, | |
| { | |
| "epoch": 1.96, | |
| "eval_avg_sts": 0.8258242424865203, | |
| "eval_sickr_spearman": 0.7934302315486167, | |
| "eval_stsb_spearman": 0.858218253424424, | |
| "step": 30625 | |
| }, | |
| { | |
| "epoch": 1.97, | |
| "eval_avg_sts": 0.8258248316168127, | |
| "eval_sickr_spearman": 0.7934435841948165, | |
| "eval_stsb_spearman": 0.858206079038809, | |
| "step": 30750 | |
| }, | |
| { | |
| "epoch": 1.98, | |
| "eval_avg_sts": 0.8257922895919085, | |
| "eval_sickr_spearman": 0.7933790303944838, | |
| "eval_stsb_spearman": 0.8582055487893332, | |
| "step": 30875 | |
| }, | |
| { | |
| "epoch": 1.98, | |
| "learning_rate": 5.64443875591962e-08, | |
| "loss": 0.0001, | |
| "step": 31000 | |
| }, | |
| { | |
| "epoch": 1.98, | |
| "eval_avg_sts": 0.8257897415072173, | |
| "eval_sickr_spearman": 0.7933720178536738, | |
| "eval_stsb_spearman": 0.8582074651607609, | |
| "step": 31000 | |
| }, | |
| { | |
| "epoch": 1.99, | |
| "eval_avg_sts": 0.8257977713308224, | |
| "eval_sickr_spearman": 0.7933829209137002, | |
| "eval_stsb_spearman": 0.8582126217479447, | |
| "step": 31125 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_avg_sts": 0.8258126560134551, | |
| "eval_sickr_spearman": 0.7934017010743625, | |
| "eval_stsb_spearman": 0.8582236109525477, | |
| "step": 31250 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "step": 31252, | |
| "train_runtime": 21163.9877, | |
| "train_samples_per_second": 1.477 | |
| } | |
| ], | |
| "max_steps": 31252, | |
| "num_train_epochs": 2, | |
| "total_flos": 776159526314354880, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |