| { | |
| "best_metric": 0.8528364235468135, | |
| "best_model_checkpoint": "checkpoints/bert-large-uncased", | |
| "epoch": 3.0, | |
| "global_step": 3081, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.02, | |
| "eval_avg_sts": 0.7741718103390286, | |
| "eval_sickr_spearman": 0.745954513736433, | |
| "eval_stsb_spearman": 0.8023891069416242, | |
| "step": 25 | |
| }, | |
| { | |
| "epoch": 0.05, | |
| "eval_avg_sts": 0.8081911987521978, | |
| "eval_sickr_spearman": 0.779239730815335, | |
| "eval_stsb_spearman": 0.8371426666890606, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 0.07, | |
| "eval_avg_sts": 0.8136161115454807, | |
| "eval_sickr_spearman": 0.7835086390489516, | |
| "eval_stsb_spearman": 0.8437235840420098, | |
| "step": 75 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "eval_avg_sts": 0.8155047769520929, | |
| "eval_sickr_spearman": 0.7852900645701897, | |
| "eval_stsb_spearman": 0.845719489333996, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 0.12, | |
| "eval_avg_sts": 0.8238067491381542, | |
| "eval_sickr_spearman": 0.7985816632400571, | |
| "eval_stsb_spearman": 0.8490318350362512, | |
| "step": 125 | |
| }, | |
| { | |
| "epoch": 0.15, | |
| "eval_avg_sts": 0.8224993495563874, | |
| "eval_sickr_spearman": 0.7982152819982874, | |
| "eval_stsb_spearman": 0.8467834171144873, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 0.17, | |
| "eval_avg_sts": 0.8263297389680633, | |
| "eval_sickr_spearman": 0.8034025929225019, | |
| "eval_stsb_spearman": 0.8492568850136247, | |
| "step": 175 | |
| }, | |
| { | |
| "epoch": 0.19, | |
| "eval_avg_sts": 0.82711974150715, | |
| "eval_sickr_spearman": 0.8028132513078563, | |
| "eval_stsb_spearman": 0.8514262317064436, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "eval_avg_sts": 0.8285051091857007, | |
| "eval_sickr_spearman": 0.8064033359848481, | |
| "eval_stsb_spearman": 0.8506068823865535, | |
| "step": 225 | |
| }, | |
| { | |
| "epoch": 0.24, | |
| "eval_avg_sts": 0.8308924909456856, | |
| "eval_sickr_spearman": 0.8108744071244177, | |
| "eval_stsb_spearman": 0.8509105747669534, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 0.27, | |
| "eval_avg_sts": 0.8292742145946509, | |
| "eval_sickr_spearman": 0.8081889402119113, | |
| "eval_stsb_spearman": 0.8503594889773904, | |
| "step": 275 | |
| }, | |
| { | |
| "epoch": 0.29, | |
| "eval_avg_sts": 0.8302783515064169, | |
| "eval_sickr_spearman": 0.8108542340618137, | |
| "eval_stsb_spearman": 0.8497024689510201, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 0.32, | |
| "eval_avg_sts": 0.8354548973044524, | |
| "eval_sickr_spearman": 0.8162711816820041, | |
| "eval_stsb_spearman": 0.8546386129269009, | |
| "step": 325 | |
| }, | |
| { | |
| "epoch": 0.34, | |
| "eval_avg_sts": 0.8376245074641093, | |
| "eval_sickr_spearman": 0.820640234762119, | |
| "eval_stsb_spearman": 0.8546087801660995, | |
| "step": 350 | |
| }, | |
| { | |
| "epoch": 0.37, | |
| "eval_avg_sts": 0.842346577377938, | |
| "eval_sickr_spearman": 0.8251871470108594, | |
| "eval_stsb_spearman": 0.8595060077450167, | |
| "step": 375 | |
| }, | |
| { | |
| "epoch": 0.39, | |
| "eval_avg_sts": 0.8392487017993179, | |
| "eval_sickr_spearman": 0.8222254052028811, | |
| "eval_stsb_spearman": 0.8562719983957546, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 0.41, | |
| "eval_avg_sts": 0.836585408133989, | |
| "eval_sickr_spearman": 0.8178774858073988, | |
| "eval_stsb_spearman": 0.855293330460579, | |
| "step": 425 | |
| }, | |
| { | |
| "epoch": 0.44, | |
| "eval_avg_sts": 0.8377417996341128, | |
| "eval_sickr_spearman": 0.8186622659737961, | |
| "eval_stsb_spearman": 0.8568213332944294, | |
| "step": 450 | |
| }, | |
| { | |
| "epoch": 0.46, | |
| "eval_avg_sts": 0.8409718734645293, | |
| "eval_sickr_spearman": 0.8244389665437579, | |
| "eval_stsb_spearman": 0.8575047803853006, | |
| "step": 475 | |
| }, | |
| { | |
| "epoch": 0.49, | |
| "learning_rate": 8.377150275884453e-06, | |
| "loss": 0.5144, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.49, | |
| "eval_avg_sts": 0.8409672497360382, | |
| "eval_sickr_spearman": 0.8242925677465746, | |
| "eval_stsb_spearman": 0.8576419317255018, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.51, | |
| "eval_avg_sts": 0.8413119218825833, | |
| "eval_sickr_spearman": 0.8241660538253865, | |
| "eval_stsb_spearman": 0.85845778993978, | |
| "step": 525 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "eval_avg_sts": 0.8405090163812534, | |
| "eval_sickr_spearman": 0.8231903980618742, | |
| "eval_stsb_spearman": 0.8578276347006326, | |
| "step": 550 | |
| }, | |
| { | |
| "epoch": 0.56, | |
| "eval_avg_sts": 0.8461025764167975, | |
| "eval_sickr_spearman": 0.8310040496127249, | |
| "eval_stsb_spearman": 0.8612011032208701, | |
| "step": 575 | |
| }, | |
| { | |
| "epoch": 0.58, | |
| "eval_avg_sts": 0.8447104900811846, | |
| "eval_sickr_spearman": 0.8284478343941886, | |
| "eval_stsb_spearman": 0.8609731457681805, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 0.61, | |
| "eval_avg_sts": 0.8462395445603483, | |
| "eval_sickr_spearman": 0.8308051047905681, | |
| "eval_stsb_spearman": 0.8616739843301284, | |
| "step": 625 | |
| }, | |
| { | |
| "epoch": 0.63, | |
| "eval_avg_sts": 0.8436677522914944, | |
| "eval_sickr_spearman": 0.8276286639591616, | |
| "eval_stsb_spearman": 0.8597068406238272, | |
| "step": 650 | |
| }, | |
| { | |
| "epoch": 0.66, | |
| "eval_avg_sts": 0.8447115186169327, | |
| "eval_sickr_spearman": 0.8297105720509965, | |
| "eval_stsb_spearman": 0.8597124651828688, | |
| "step": 675 | |
| }, | |
| { | |
| "epoch": 0.68, | |
| "eval_avg_sts": 0.8434972279862564, | |
| "eval_sickr_spearman": 0.8294735385653995, | |
| "eval_stsb_spearman": 0.8575209174071132, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 0.71, | |
| "eval_avg_sts": 0.8440935405127372, | |
| "eval_sickr_spearman": 0.8307528469522036, | |
| "eval_stsb_spearman": 0.8574342340732707, | |
| "step": 725 | |
| }, | |
| { | |
| "epoch": 0.73, | |
| "eval_avg_sts": 0.8430030266304707, | |
| "eval_sickr_spearman": 0.8273284695751733, | |
| "eval_stsb_spearman": 0.858677583685768, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 0.75, | |
| "eval_avg_sts": 0.8459169389588843, | |
| "eval_sickr_spearman": 0.8317631811709543, | |
| "eval_stsb_spearman": 0.8600706967468144, | |
| "step": 775 | |
| }, | |
| { | |
| "epoch": 0.78, | |
| "eval_avg_sts": 0.8451542594549106, | |
| "eval_sickr_spearman": 0.8302367527672511, | |
| "eval_stsb_spearman": 0.8600717661425702, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 0.8, | |
| "eval_avg_sts": 0.8441819324586433, | |
| "eval_sickr_spearman": 0.8280832303031719, | |
| "eval_stsb_spearman": 0.8602806346141146, | |
| "step": 825 | |
| }, | |
| { | |
| "epoch": 0.83, | |
| "eval_avg_sts": 0.84041329364274, | |
| "eval_sickr_spearman": 0.8234209671109596, | |
| "eval_stsb_spearman": 0.8574056201745204, | |
| "step": 850 | |
| }, | |
| { | |
| "epoch": 0.85, | |
| "eval_avg_sts": 0.8463098863081795, | |
| "eval_sickr_spearman": 0.8311718222500483, | |
| "eval_stsb_spearman": 0.8614479503663108, | |
| "step": 875 | |
| }, | |
| { | |
| "epoch": 0.88, | |
| "eval_avg_sts": 0.8489707536403015, | |
| "eval_sickr_spearman": 0.8359545191757484, | |
| "eval_stsb_spearman": 0.8619869881048546, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 0.9, | |
| "eval_avg_sts": 0.8459381219997153, | |
| "eval_sickr_spearman": 0.8324996900804063, | |
| "eval_stsb_spearman": 0.8593765539190245, | |
| "step": 925 | |
| }, | |
| { | |
| "epoch": 0.93, | |
| "eval_avg_sts": 0.8441563920982813, | |
| "eval_sickr_spearman": 0.8308032796087136, | |
| "eval_stsb_spearman": 0.8575095045878491, | |
| "step": 950 | |
| }, | |
| { | |
| "epoch": 0.95, | |
| "eval_avg_sts": 0.8417274944195297, | |
| "eval_sickr_spearman": 0.8286961551886236, | |
| "eval_stsb_spearman": 0.8547588336504358, | |
| "step": 975 | |
| }, | |
| { | |
| "epoch": 0.97, | |
| "learning_rate": 6.754300551768907e-06, | |
| "loss": 0.338, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.97, | |
| "eval_avg_sts": 0.8439797180911035, | |
| "eval_sickr_spearman": 0.8322901784159331, | |
| "eval_stsb_spearman": 0.8556692577662738, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_avg_sts": 0.846580279698808, | |
| "eval_sickr_spearman": 0.8351822751268263, | |
| "eval_stsb_spearman": 0.8579782842707896, | |
| "step": 1025 | |
| }, | |
| { | |
| "epoch": 1.02, | |
| "eval_avg_sts": 0.8444154454958996, | |
| "eval_sickr_spearman": 0.8319871021658588, | |
| "eval_stsb_spearman": 0.8568437888259406, | |
| "step": 1050 | |
| }, | |
| { | |
| "epoch": 1.05, | |
| "eval_avg_sts": 0.8432409670453203, | |
| "eval_sickr_spearman": 0.8314499703584763, | |
| "eval_stsb_spearman": 0.8550319637321643, | |
| "step": 1075 | |
| }, | |
| { | |
| "epoch": 1.07, | |
| "eval_avg_sts": 0.8446753892080279, | |
| "eval_sickr_spearman": 0.8331656893329471, | |
| "eval_stsb_spearman": 0.8561850890831085, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 1.1, | |
| "eval_avg_sts": 0.8474510190292008, | |
| "eval_sickr_spearman": 0.8356278596548676, | |
| "eval_stsb_spearman": 0.8592741784035342, | |
| "step": 1125 | |
| }, | |
| { | |
| "epoch": 1.12, | |
| "eval_avg_sts": 0.8505734569059473, | |
| "eval_sickr_spearman": 0.8389641479918606, | |
| "eval_stsb_spearman": 0.862182765820034, | |
| "step": 1150 | |
| }, | |
| { | |
| "epoch": 1.14, | |
| "eval_avg_sts": 0.8521021908496921, | |
| "eval_sickr_spearman": 0.8412426954129831, | |
| "eval_stsb_spearman": 0.862961686286401, | |
| "step": 1175 | |
| }, | |
| { | |
| "epoch": 1.17, | |
| "eval_avg_sts": 0.8514560490494238, | |
| "eval_sickr_spearman": 0.840301718104709, | |
| "eval_stsb_spearman": 0.8626103799941387, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 1.19, | |
| "eval_avg_sts": 0.8486972541916555, | |
| "eval_sickr_spearman": 0.8367856973861348, | |
| "eval_stsb_spearman": 0.8606088109971762, | |
| "step": 1225 | |
| }, | |
| { | |
| "epoch": 1.22, | |
| "eval_avg_sts": 0.848898608926278, | |
| "eval_sickr_spearman": 0.8370826736863266, | |
| "eval_stsb_spearman": 0.8607145441662293, | |
| "step": 1250 | |
| }, | |
| { | |
| "epoch": 1.24, | |
| "eval_avg_sts": 0.8454701656945296, | |
| "eval_sickr_spearman": 0.8321730305595257, | |
| "eval_stsb_spearman": 0.8587673008295333, | |
| "step": 1275 | |
| }, | |
| { | |
| "epoch": 1.27, | |
| "eval_avg_sts": 0.8452672490522616, | |
| "eval_sickr_spearman": 0.833004064676608, | |
| "eval_stsb_spearman": 0.8575304334279151, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 1.29, | |
| "eval_avg_sts": 0.8489039116599046, | |
| "eval_sickr_spearman": 0.8371614927237867, | |
| "eval_stsb_spearman": 0.8606463305960226, | |
| "step": 1325 | |
| }, | |
| { | |
| "epoch": 1.31, | |
| "eval_avg_sts": 0.8467466937976185, | |
| "eval_sickr_spearman": 0.8343573409596268, | |
| "eval_stsb_spearman": 0.85913604663561, | |
| "step": 1350 | |
| }, | |
| { | |
| "epoch": 1.34, | |
| "eval_avg_sts": 0.8479786014484607, | |
| "eval_sickr_spearman": 0.8356114810492773, | |
| "eval_stsb_spearman": 0.8603457218476441, | |
| "step": 1375 | |
| }, | |
| { | |
| "epoch": 1.36, | |
| "eval_avg_sts": 0.8481320629670138, | |
| "eval_sickr_spearman": 0.8365469828119875, | |
| "eval_stsb_spearman": 0.8597171431220402, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 1.39, | |
| "eval_avg_sts": 0.8493017107452288, | |
| "eval_sickr_spearman": 0.8375811404570515, | |
| "eval_stsb_spearman": 0.8610222810334061, | |
| "step": 1425 | |
| }, | |
| { | |
| "epoch": 1.41, | |
| "eval_avg_sts": 0.8515707185583519, | |
| "eval_sickr_spearman": 0.8413120523234598, | |
| "eval_stsb_spearman": 0.8618293847932439, | |
| "step": 1450 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "eval_avg_sts": 0.8491061717045717, | |
| "eval_sickr_spearman": 0.8386661630385385, | |
| "eval_stsb_spearman": 0.8595461803706049, | |
| "step": 1475 | |
| }, | |
| { | |
| "epoch": 1.46, | |
| "learning_rate": 5.131450827653359e-06, | |
| "loss": 0.2965, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 1.46, | |
| "eval_avg_sts": 0.849951123911407, | |
| "eval_sickr_spearman": 0.8403214588874001, | |
| "eval_stsb_spearman": 0.859580788935414, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 1.48, | |
| "eval_avg_sts": 0.8462728434267617, | |
| "eval_sickr_spearman": 0.8349335220524785, | |
| "eval_stsb_spearman": 0.8576121648010449, | |
| "step": 1525 | |
| }, | |
| { | |
| "epoch": 1.51, | |
| "eval_avg_sts": 0.8478142980726532, | |
| "eval_sickr_spearman": 0.8355811253931684, | |
| "eval_stsb_spearman": 0.8600474707521379, | |
| "step": 1550 | |
| }, | |
| { | |
| "epoch": 1.53, | |
| "eval_avg_sts": 0.8506859270446779, | |
| "eval_sickr_spearman": 0.8387632819256463, | |
| "eval_stsb_spearman": 0.8626085721637096, | |
| "step": 1575 | |
| }, | |
| { | |
| "epoch": 1.56, | |
| "eval_avg_sts": 0.8491205822275252, | |
| "eval_sickr_spearman": 0.8368930468978489, | |
| "eval_stsb_spearman": 0.8613481175572015, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 1.58, | |
| "eval_avg_sts": 0.8460304537726628, | |
| "eval_sickr_spearman": 0.8335511389219881, | |
| "eval_stsb_spearman": 0.8585097686233377, | |
| "step": 1625 | |
| }, | |
| { | |
| "epoch": 1.61, | |
| "eval_avg_sts": 0.8488092782108085, | |
| "eval_sickr_spearman": 0.8360739244939235, | |
| "eval_stsb_spearman": 0.8615446319276937, | |
| "step": 1650 | |
| }, | |
| { | |
| "epoch": 1.63, | |
| "eval_avg_sts": 0.8483771836085118, | |
| "eval_sickr_spearman": 0.8353614791662919, | |
| "eval_stsb_spearman": 0.8613928880507317, | |
| "step": 1675 | |
| }, | |
| { | |
| "epoch": 1.66, | |
| "eval_avg_sts": 0.8482633646541247, | |
| "eval_sickr_spearman": 0.835166232738946, | |
| "eval_stsb_spearman": 0.8613604965693032, | |
| "step": 1700 | |
| }, | |
| { | |
| "epoch": 1.68, | |
| "eval_avg_sts": 0.8494820125153382, | |
| "eval_sickr_spearman": 0.8363321877263562, | |
| "eval_stsb_spearman": 0.8626318373043202, | |
| "step": 1725 | |
| }, | |
| { | |
| "epoch": 1.7, | |
| "eval_avg_sts": 0.84774811911999, | |
| "eval_sickr_spearman": 0.8350676729187949, | |
| "eval_stsb_spearman": 0.8604285653211853, | |
| "step": 1750 | |
| }, | |
| { | |
| "epoch": 1.73, | |
| "eval_avg_sts": 0.8508953589183318, | |
| "eval_sickr_spearman": 0.8393342276284411, | |
| "eval_stsb_spearman": 0.8624564902082225, | |
| "step": 1775 | |
| }, | |
| { | |
| "epoch": 1.75, | |
| "eval_avg_sts": 0.8497877526052855, | |
| "eval_sickr_spearman": 0.8380021810922581, | |
| "eval_stsb_spearman": 0.861573324118313, | |
| "step": 1800 | |
| }, | |
| { | |
| "epoch": 1.78, | |
| "eval_avg_sts": 0.847915612163006, | |
| "eval_sickr_spearman": 0.8351774720166826, | |
| "eval_stsb_spearman": 0.8606537523093295, | |
| "step": 1825 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "eval_avg_sts": 0.8496201121858785, | |
| "eval_sickr_spearman": 0.8377723042407751, | |
| "eval_stsb_spearman": 0.861467920130982, | |
| "step": 1850 | |
| }, | |
| { | |
| "epoch": 1.83, | |
| "eval_avg_sts": 0.8506282266864784, | |
| "eval_sickr_spearman": 0.8396311078664301, | |
| "eval_stsb_spearman": 0.8616253455065267, | |
| "step": 1875 | |
| }, | |
| { | |
| "epoch": 1.85, | |
| "eval_avg_sts": 0.8507148324349076, | |
| "eval_sickr_spearman": 0.8398456147654526, | |
| "eval_stsb_spearman": 0.8615840501043628, | |
| "step": 1900 | |
| }, | |
| { | |
| "epoch": 1.87, | |
| "eval_avg_sts": 0.8528364235468135, | |
| "eval_sickr_spearman": 0.8424179684340722, | |
| "eval_stsb_spearman": 0.8632548786595547, | |
| "step": 1925 | |
| }, | |
| { | |
| "epoch": 1.9, | |
| "eval_avg_sts": 0.8505338171378869, | |
| "eval_sickr_spearman": 0.8398606965313044, | |
| "eval_stsb_spearman": 0.8612069377444695, | |
| "step": 1950 | |
| }, | |
| { | |
| "epoch": 1.92, | |
| "eval_avg_sts": 0.8481722210917726, | |
| "eval_sickr_spearman": 0.8373791216444029, | |
| "eval_stsb_spearman": 0.8589653205391424, | |
| "step": 1975 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "learning_rate": 3.5086011035378126e-06, | |
| "loss": 0.284, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "eval_avg_sts": 0.8482272752573701, | |
| "eval_sickr_spearman": 0.8377695664679932, | |
| "eval_stsb_spearman": 0.858684984046747, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 1.97, | |
| "eval_avg_sts": 0.8480501028062337, | |
| "eval_sickr_spearman": 0.837576385378009, | |
| "eval_stsb_spearman": 0.8585238202344584, | |
| "step": 2025 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_avg_sts": 0.8480832424004543, | |
| "eval_sickr_spearman": 0.8374597658637174, | |
| "eval_stsb_spearman": 0.8587067189371913, | |
| "step": 2050 | |
| }, | |
| { | |
| "epoch": 2.02, | |
| "eval_avg_sts": 0.8499478012984727, | |
| "eval_sickr_spearman": 0.8390217853135862, | |
| "eval_stsb_spearman": 0.8608738172833591, | |
| "step": 2075 | |
| }, | |
| { | |
| "epoch": 2.04, | |
| "eval_avg_sts": 0.8491869466527012, | |
| "eval_sickr_spearman": 0.8378290289715736, | |
| "eval_stsb_spearman": 0.8605448643338288, | |
| "step": 2100 | |
| }, | |
| { | |
| "epoch": 2.07, | |
| "eval_avg_sts": 0.8477584257424788, | |
| "eval_sickr_spearman": 0.8359002920622246, | |
| "eval_stsb_spearman": 0.8596165594227332, | |
| "step": 2125 | |
| }, | |
| { | |
| "epoch": 2.09, | |
| "eval_avg_sts": 0.848914705769936, | |
| "eval_sickr_spearman": 0.837553906822536, | |
| "eval_stsb_spearman": 0.860275504717336, | |
| "step": 2150 | |
| }, | |
| { | |
| "epoch": 2.12, | |
| "eval_avg_sts": 0.849736568959095, | |
| "eval_sickr_spearman": 0.8393637187247242, | |
| "eval_stsb_spearman": 0.860109419193466, | |
| "step": 2175 | |
| }, | |
| { | |
| "epoch": 2.14, | |
| "eval_avg_sts": 0.8495688115163362, | |
| "eval_sickr_spearman": 0.8389394600057214, | |
| "eval_stsb_spearman": 0.860198163026951, | |
| "step": 2200 | |
| }, | |
| { | |
| "epoch": 2.17, | |
| "eval_avg_sts": 0.8483895280681955, | |
| "eval_sickr_spearman": 0.8374167780279301, | |
| "eval_stsb_spearman": 0.8593622781084608, | |
| "step": 2225 | |
| }, | |
| { | |
| "epoch": 2.19, | |
| "eval_avg_sts": 0.8490834154561102, | |
| "eval_sickr_spearman": 0.8387396506237387, | |
| "eval_stsb_spearman": 0.8594271802884818, | |
| "step": 2250 | |
| }, | |
| { | |
| "epoch": 2.22, | |
| "eval_avg_sts": 0.8485035624729105, | |
| "eval_sickr_spearman": 0.8381763418660725, | |
| "eval_stsb_spearman": 0.8588307830797486, | |
| "step": 2275 | |
| }, | |
| { | |
| "epoch": 2.24, | |
| "eval_avg_sts": 0.8476220200458998, | |
| "eval_sickr_spearman": 0.8364356947499554, | |
| "eval_stsb_spearman": 0.8588083453418442, | |
| "step": 2300 | |
| }, | |
| { | |
| "epoch": 2.26, | |
| "eval_avg_sts": 0.8471502937152022, | |
| "eval_sickr_spearman": 0.8358850662030688, | |
| "eval_stsb_spearman": 0.8584155212273358, | |
| "step": 2325 | |
| }, | |
| { | |
| "epoch": 2.29, | |
| "eval_avg_sts": 0.8481508305259742, | |
| "eval_sickr_spearman": 0.8369382921954037, | |
| "eval_stsb_spearman": 0.8593633688565446, | |
| "step": 2350 | |
| }, | |
| { | |
| "epoch": 2.31, | |
| "eval_avg_sts": 0.8478439833733975, | |
| "eval_sickr_spearman": 0.8367764273835573, | |
| "eval_stsb_spearman": 0.8589115393632376, | |
| "step": 2375 | |
| }, | |
| { | |
| "epoch": 2.34, | |
| "eval_avg_sts": 0.8466942437126351, | |
| "eval_sickr_spearman": 0.8354506248905611, | |
| "eval_stsb_spearman": 0.8579378625347092, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 2.36, | |
| "eval_avg_sts": 0.8477441088420843, | |
| "eval_sickr_spearman": 0.8366948705733154, | |
| "eval_stsb_spearman": 0.8587933471108533, | |
| "step": 2425 | |
| }, | |
| { | |
| "epoch": 2.39, | |
| "eval_avg_sts": 0.8488516946426614, | |
| "eval_sickr_spearman": 0.8377335431419145, | |
| "eval_stsb_spearman": 0.8599698461434083, | |
| "step": 2450 | |
| }, | |
| { | |
| "epoch": 2.41, | |
| "eval_avg_sts": 0.8480771808294114, | |
| "eval_sickr_spearman": 0.8370132207136473, | |
| "eval_stsb_spearman": 0.8591411409451756, | |
| "step": 2475 | |
| }, | |
| { | |
| "epoch": 2.43, | |
| "learning_rate": 1.8857513794222658e-06, | |
| "loss": 0.2655, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 2.43, | |
| "eval_avg_sts": 0.8487999481558521, | |
| "eval_sickr_spearman": 0.8377923812411763, | |
| "eval_stsb_spearman": 0.8598075150705279, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 2.46, | |
| "eval_avg_sts": 0.848399750999945, | |
| "eval_sickr_spearman": 0.8369205206878717, | |
| "eval_stsb_spearman": 0.8598789813120182, | |
| "step": 2525 | |
| }, | |
| { | |
| "epoch": 2.48, | |
| "eval_avg_sts": 0.8485584973593749, | |
| "eval_sickr_spearman": 0.8373407447943537, | |
| "eval_stsb_spearman": 0.8597762499243962, | |
| "step": 2550 | |
| }, | |
| { | |
| "epoch": 2.51, | |
| "eval_avg_sts": 0.8484553378772859, | |
| "eval_sickr_spearman": 0.8371878137673748, | |
| "eval_stsb_spearman": 0.8597228619871968, | |
| "step": 2575 | |
| }, | |
| { | |
| "epoch": 2.53, | |
| "eval_avg_sts": 0.8480636244098692, | |
| "eval_sickr_spearman": 0.8368399244996585, | |
| "eval_stsb_spearman": 0.8592873243200797, | |
| "step": 2600 | |
| }, | |
| { | |
| "epoch": 2.56, | |
| "eval_avg_sts": 0.8487639345972604, | |
| "eval_sickr_spearman": 0.8379995874127802, | |
| "eval_stsb_spearman": 0.8595282817817406, | |
| "step": 2625 | |
| }, | |
| { | |
| "epoch": 2.58, | |
| "eval_avg_sts": 0.8484073121905233, | |
| "eval_sickr_spearman": 0.8373334920980365, | |
| "eval_stsb_spearman": 0.85948113228301, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 2.6, | |
| "eval_avg_sts": 0.8495353514397407, | |
| "eval_sickr_spearman": 0.8388814384351839, | |
| "eval_stsb_spearman": 0.8601892644442974, | |
| "step": 2675 | |
| }, | |
| { | |
| "epoch": 2.63, | |
| "eval_avg_sts": 0.8488734860883285, | |
| "eval_sickr_spearman": 0.8376559248819906, | |
| "eval_stsb_spearman": 0.8600910472946663, | |
| "step": 2700 | |
| }, | |
| { | |
| "epoch": 2.65, | |
| "eval_avg_sts": 0.8485291479370792, | |
| "eval_sickr_spearman": 0.8370302717546578, | |
| "eval_stsb_spearman": 0.8600280241195006, | |
| "step": 2725 | |
| }, | |
| { | |
| "epoch": 2.68, | |
| "eval_avg_sts": 0.8484609936724099, | |
| "eval_sickr_spearman": 0.8370401181304525, | |
| "eval_stsb_spearman": 0.8598818692143673, | |
| "step": 2750 | |
| }, | |
| { | |
| "epoch": 2.7, | |
| "eval_avg_sts": 0.8487467947632423, | |
| "eval_sickr_spearman": 0.8374640886628467, | |
| "eval_stsb_spearman": 0.8600295008636379, | |
| "step": 2775 | |
| }, | |
| { | |
| "epoch": 2.73, | |
| "eval_avg_sts": 0.8487549703295775, | |
| "eval_sickr_spearman": 0.8377412761492462, | |
| "eval_stsb_spearman": 0.8597686645099087, | |
| "step": 2800 | |
| }, | |
| { | |
| "epoch": 2.75, | |
| "eval_avg_sts": 0.8483512050356906, | |
| "eval_sickr_spearman": 0.8371601478529463, | |
| "eval_stsb_spearman": 0.8595422622184349, | |
| "step": 2825 | |
| }, | |
| { | |
| "epoch": 2.78, | |
| "eval_avg_sts": 0.8487416863586705, | |
| "eval_sickr_spearman": 0.8376103433667258, | |
| "eval_stsb_spearman": 0.8598730293506154, | |
| "step": 2850 | |
| }, | |
| { | |
| "epoch": 2.8, | |
| "eval_avg_sts": 0.8486695192263061, | |
| "eval_sickr_spearman": 0.8374840215699435, | |
| "eval_stsb_spearman": 0.8598550168826687, | |
| "step": 2875 | |
| }, | |
| { | |
| "epoch": 2.82, | |
| "eval_avg_sts": 0.8490062168713867, | |
| "eval_sickr_spearman": 0.8380430075284804, | |
| "eval_stsb_spearman": 0.859969426214293, | |
| "step": 2900 | |
| }, | |
| { | |
| "epoch": 2.85, | |
| "eval_avg_sts": 0.8488936976734611, | |
| "eval_sickr_spearman": 0.8378850332358503, | |
| "eval_stsb_spearman": 0.859902362111072, | |
| "step": 2925 | |
| }, | |
| { | |
| "epoch": 2.87, | |
| "eval_avg_sts": 0.8489709020581676, | |
| "eval_sickr_spearman": 0.8379462248590827, | |
| "eval_stsb_spearman": 0.8599955792572526, | |
| "step": 2950 | |
| }, | |
| { | |
| "epoch": 2.9, | |
| "eval_avg_sts": 0.8487957508450565, | |
| "eval_sickr_spearman": 0.8376585185614683, | |
| "eval_stsb_spearman": 0.8599329831286449, | |
| "step": 2975 | |
| }, | |
| { | |
| "epoch": 2.92, | |
| "learning_rate": 2.6290165530671865e-07, | |
| "loss": 0.263, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 2.92, | |
| "eval_avg_sts": 0.8485199174178477, | |
| "eval_sickr_spearman": 0.837266008400516, | |
| "eval_stsb_spearman": 0.8597738264351793, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 2.95, | |
| "eval_avg_sts": 0.8483285540592784, | |
| "eval_sickr_spearman": 0.837077006016357, | |
| "eval_stsb_spearman": 0.8595801021021999, | |
| "step": 3025 | |
| }, | |
| { | |
| "epoch": 2.97, | |
| "eval_avg_sts": 0.8483039392081567, | |
| "eval_sickr_spearman": 0.8370466464338976, | |
| "eval_stsb_spearman": 0.8595612319824159, | |
| "step": 3050 | |
| }, | |
| { | |
| "epoch": 2.99, | |
| "eval_avg_sts": 0.8482931559093356, | |
| "eval_sickr_spearman": 0.837029215070426, | |
| "eval_stsb_spearman": 0.8595570967482453, | |
| "step": 3075 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "step": 3081, | |
| "train_runtime": 8699.7484, | |
| "train_samples_per_second": 0.354 | |
| } | |
| ], | |
| "max_steps": 3081, | |
| "num_train_epochs": 3, | |
| "total_flos": 333879495592513536, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |