| { |
| "best_metric": 0.8528364235468135, |
| "best_model_checkpoint": "checkpoints/bert-large-uncased", |
| "epoch": 3.0, |
| "global_step": 3081, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.02, |
| "eval_avg_sts": 0.7741718103390286, |
| "eval_sickr_spearman": 0.745954513736433, |
| "eval_stsb_spearman": 0.8023891069416242, |
| "step": 25 |
| }, |
| { |
| "epoch": 0.05, |
| "eval_avg_sts": 0.8081911987521978, |
| "eval_sickr_spearman": 0.779239730815335, |
| "eval_stsb_spearman": 0.8371426666890606, |
| "step": 50 |
| }, |
| { |
| "epoch": 0.07, |
| "eval_avg_sts": 0.8136161115454807, |
| "eval_sickr_spearman": 0.7835086390489516, |
| "eval_stsb_spearman": 0.8437235840420098, |
| "step": 75 |
| }, |
| { |
| "epoch": 0.1, |
| "eval_avg_sts": 0.8155047769520929, |
| "eval_sickr_spearman": 0.7852900645701897, |
| "eval_stsb_spearman": 0.845719489333996, |
| "step": 100 |
| }, |
| { |
| "epoch": 0.12, |
| "eval_avg_sts": 0.8238067491381542, |
| "eval_sickr_spearman": 0.7985816632400571, |
| "eval_stsb_spearman": 0.8490318350362512, |
| "step": 125 |
| }, |
| { |
| "epoch": 0.15, |
| "eval_avg_sts": 0.8224993495563874, |
| "eval_sickr_spearman": 0.7982152819982874, |
| "eval_stsb_spearman": 0.8467834171144873, |
| "step": 150 |
| }, |
| { |
| "epoch": 0.17, |
| "eval_avg_sts": 0.8263297389680633, |
| "eval_sickr_spearman": 0.8034025929225019, |
| "eval_stsb_spearman": 0.8492568850136247, |
| "step": 175 |
| }, |
| { |
| "epoch": 0.19, |
| "eval_avg_sts": 0.82711974150715, |
| "eval_sickr_spearman": 0.8028132513078563, |
| "eval_stsb_spearman": 0.8514262317064436, |
| "step": 200 |
| }, |
| { |
| "epoch": 0.22, |
| "eval_avg_sts": 0.8285051091857007, |
| "eval_sickr_spearman": 0.8064033359848481, |
| "eval_stsb_spearman": 0.8506068823865535, |
| "step": 225 |
| }, |
| { |
| "epoch": 0.24, |
| "eval_avg_sts": 0.8308924909456856, |
| "eval_sickr_spearman": 0.8108744071244177, |
| "eval_stsb_spearman": 0.8509105747669534, |
| "step": 250 |
| }, |
| { |
| "epoch": 0.27, |
| "eval_avg_sts": 0.8292742145946509, |
| "eval_sickr_spearman": 0.8081889402119113, |
| "eval_stsb_spearman": 0.8503594889773904, |
| "step": 275 |
| }, |
| { |
| "epoch": 0.29, |
| "eval_avg_sts": 0.8302783515064169, |
| "eval_sickr_spearman": 0.8108542340618137, |
| "eval_stsb_spearman": 0.8497024689510201, |
| "step": 300 |
| }, |
| { |
| "epoch": 0.32, |
| "eval_avg_sts": 0.8354548973044524, |
| "eval_sickr_spearman": 0.8162711816820041, |
| "eval_stsb_spearman": 0.8546386129269009, |
| "step": 325 |
| }, |
| { |
| "epoch": 0.34, |
| "eval_avg_sts": 0.8376245074641093, |
| "eval_sickr_spearman": 0.820640234762119, |
| "eval_stsb_spearman": 0.8546087801660995, |
| "step": 350 |
| }, |
| { |
| "epoch": 0.37, |
| "eval_avg_sts": 0.842346577377938, |
| "eval_sickr_spearman": 0.8251871470108594, |
| "eval_stsb_spearman": 0.8595060077450167, |
| "step": 375 |
| }, |
| { |
| "epoch": 0.39, |
| "eval_avg_sts": 0.8392487017993179, |
| "eval_sickr_spearman": 0.8222254052028811, |
| "eval_stsb_spearman": 0.8562719983957546, |
| "step": 400 |
| }, |
| { |
| "epoch": 0.41, |
| "eval_avg_sts": 0.836585408133989, |
| "eval_sickr_spearman": 0.8178774858073988, |
| "eval_stsb_spearman": 0.855293330460579, |
| "step": 425 |
| }, |
| { |
| "epoch": 0.44, |
| "eval_avg_sts": 0.8377417996341128, |
| "eval_sickr_spearman": 0.8186622659737961, |
| "eval_stsb_spearman": 0.8568213332944294, |
| "step": 450 |
| }, |
| { |
| "epoch": 0.46, |
| "eval_avg_sts": 0.8409718734645293, |
| "eval_sickr_spearman": 0.8244389665437579, |
| "eval_stsb_spearman": 0.8575047803853006, |
| "step": 475 |
| }, |
| { |
| "epoch": 0.49, |
| "learning_rate": 8.377150275884453e-06, |
| "loss": 0.5144, |
| "step": 500 |
| }, |
| { |
| "epoch": 0.49, |
| "eval_avg_sts": 0.8409672497360382, |
| "eval_sickr_spearman": 0.8242925677465746, |
| "eval_stsb_spearman": 0.8576419317255018, |
| "step": 500 |
| }, |
| { |
| "epoch": 0.51, |
| "eval_avg_sts": 0.8413119218825833, |
| "eval_sickr_spearman": 0.8241660538253865, |
| "eval_stsb_spearman": 0.85845778993978, |
| "step": 525 |
| }, |
| { |
| "epoch": 0.54, |
| "eval_avg_sts": 0.8405090163812534, |
| "eval_sickr_spearman": 0.8231903980618742, |
| "eval_stsb_spearman": 0.8578276347006326, |
| "step": 550 |
| }, |
| { |
| "epoch": 0.56, |
| "eval_avg_sts": 0.8461025764167975, |
| "eval_sickr_spearman": 0.8310040496127249, |
| "eval_stsb_spearman": 0.8612011032208701, |
| "step": 575 |
| }, |
| { |
| "epoch": 0.58, |
| "eval_avg_sts": 0.8447104900811846, |
| "eval_sickr_spearman": 0.8284478343941886, |
| "eval_stsb_spearman": 0.8609731457681805, |
| "step": 600 |
| }, |
| { |
| "epoch": 0.61, |
| "eval_avg_sts": 0.8462395445603483, |
| "eval_sickr_spearman": 0.8308051047905681, |
| "eval_stsb_spearman": 0.8616739843301284, |
| "step": 625 |
| }, |
| { |
| "epoch": 0.63, |
| "eval_avg_sts": 0.8436677522914944, |
| "eval_sickr_spearman": 0.8276286639591616, |
| "eval_stsb_spearman": 0.8597068406238272, |
| "step": 650 |
| }, |
| { |
| "epoch": 0.66, |
| "eval_avg_sts": 0.8447115186169327, |
| "eval_sickr_spearman": 0.8297105720509965, |
| "eval_stsb_spearman": 0.8597124651828688, |
| "step": 675 |
| }, |
| { |
| "epoch": 0.68, |
| "eval_avg_sts": 0.8434972279862564, |
| "eval_sickr_spearman": 0.8294735385653995, |
| "eval_stsb_spearman": 0.8575209174071132, |
| "step": 700 |
| }, |
| { |
| "epoch": 0.71, |
| "eval_avg_sts": 0.8440935405127372, |
| "eval_sickr_spearman": 0.8307528469522036, |
| "eval_stsb_spearman": 0.8574342340732707, |
| "step": 725 |
| }, |
| { |
| "epoch": 0.73, |
| "eval_avg_sts": 0.8430030266304707, |
| "eval_sickr_spearman": 0.8273284695751733, |
| "eval_stsb_spearman": 0.858677583685768, |
| "step": 750 |
| }, |
| { |
| "epoch": 0.75, |
| "eval_avg_sts": 0.8459169389588843, |
| "eval_sickr_spearman": 0.8317631811709543, |
| "eval_stsb_spearman": 0.8600706967468144, |
| "step": 775 |
| }, |
| { |
| "epoch": 0.78, |
| "eval_avg_sts": 0.8451542594549106, |
| "eval_sickr_spearman": 0.8302367527672511, |
| "eval_stsb_spearman": 0.8600717661425702, |
| "step": 800 |
| }, |
| { |
| "epoch": 0.8, |
| "eval_avg_sts": 0.8441819324586433, |
| "eval_sickr_spearman": 0.8280832303031719, |
| "eval_stsb_spearman": 0.8602806346141146, |
| "step": 825 |
| }, |
| { |
| "epoch": 0.83, |
| "eval_avg_sts": 0.84041329364274, |
| "eval_sickr_spearman": 0.8234209671109596, |
| "eval_stsb_spearman": 0.8574056201745204, |
| "step": 850 |
| }, |
| { |
| "epoch": 0.85, |
| "eval_avg_sts": 0.8463098863081795, |
| "eval_sickr_spearman": 0.8311718222500483, |
| "eval_stsb_spearman": 0.8614479503663108, |
| "step": 875 |
| }, |
| { |
| "epoch": 0.88, |
| "eval_avg_sts": 0.8489707536403015, |
| "eval_sickr_spearman": 0.8359545191757484, |
| "eval_stsb_spearman": 0.8619869881048546, |
| "step": 900 |
| }, |
| { |
| "epoch": 0.9, |
| "eval_avg_sts": 0.8459381219997153, |
| "eval_sickr_spearman": 0.8324996900804063, |
| "eval_stsb_spearman": 0.8593765539190245, |
| "step": 925 |
| }, |
| { |
| "epoch": 0.93, |
| "eval_avg_sts": 0.8441563920982813, |
| "eval_sickr_spearman": 0.8308032796087136, |
| "eval_stsb_spearman": 0.8575095045878491, |
| "step": 950 |
| }, |
| { |
| "epoch": 0.95, |
| "eval_avg_sts": 0.8417274944195297, |
| "eval_sickr_spearman": 0.8286961551886236, |
| "eval_stsb_spearman": 0.8547588336504358, |
| "step": 975 |
| }, |
| { |
| "epoch": 0.97, |
| "learning_rate": 6.754300551768907e-06, |
| "loss": 0.338, |
| "step": 1000 |
| }, |
| { |
| "epoch": 0.97, |
| "eval_avg_sts": 0.8439797180911035, |
| "eval_sickr_spearman": 0.8322901784159331, |
| "eval_stsb_spearman": 0.8556692577662738, |
| "step": 1000 |
| }, |
| { |
| "epoch": 1.0, |
| "eval_avg_sts": 0.846580279698808, |
| "eval_sickr_spearman": 0.8351822751268263, |
| "eval_stsb_spearman": 0.8579782842707896, |
| "step": 1025 |
| }, |
| { |
| "epoch": 1.02, |
| "eval_avg_sts": 0.8444154454958996, |
| "eval_sickr_spearman": 0.8319871021658588, |
| "eval_stsb_spearman": 0.8568437888259406, |
| "step": 1050 |
| }, |
| { |
| "epoch": 1.05, |
| "eval_avg_sts": 0.8432409670453203, |
| "eval_sickr_spearman": 0.8314499703584763, |
| "eval_stsb_spearman": 0.8550319637321643, |
| "step": 1075 |
| }, |
| { |
| "epoch": 1.07, |
| "eval_avg_sts": 0.8446753892080279, |
| "eval_sickr_spearman": 0.8331656893329471, |
| "eval_stsb_spearman": 0.8561850890831085, |
| "step": 1100 |
| }, |
| { |
| "epoch": 1.1, |
| "eval_avg_sts": 0.8474510190292008, |
| "eval_sickr_spearman": 0.8356278596548676, |
| "eval_stsb_spearman": 0.8592741784035342, |
| "step": 1125 |
| }, |
| { |
| "epoch": 1.12, |
| "eval_avg_sts": 0.8505734569059473, |
| "eval_sickr_spearman": 0.8389641479918606, |
| "eval_stsb_spearman": 0.862182765820034, |
| "step": 1150 |
| }, |
| { |
| "epoch": 1.14, |
| "eval_avg_sts": 0.8521021908496921, |
| "eval_sickr_spearman": 0.8412426954129831, |
| "eval_stsb_spearman": 0.862961686286401, |
| "step": 1175 |
| }, |
| { |
| "epoch": 1.17, |
| "eval_avg_sts": 0.8514560490494238, |
| "eval_sickr_spearman": 0.840301718104709, |
| "eval_stsb_spearman": 0.8626103799941387, |
| "step": 1200 |
| }, |
| { |
| "epoch": 1.19, |
| "eval_avg_sts": 0.8486972541916555, |
| "eval_sickr_spearman": 0.8367856973861348, |
| "eval_stsb_spearman": 0.8606088109971762, |
| "step": 1225 |
| }, |
| { |
| "epoch": 1.22, |
| "eval_avg_sts": 0.848898608926278, |
| "eval_sickr_spearman": 0.8370826736863266, |
| "eval_stsb_spearman": 0.8607145441662293, |
| "step": 1250 |
| }, |
| { |
| "epoch": 1.24, |
| "eval_avg_sts": 0.8454701656945296, |
| "eval_sickr_spearman": 0.8321730305595257, |
| "eval_stsb_spearman": 0.8587673008295333, |
| "step": 1275 |
| }, |
| { |
| "epoch": 1.27, |
| "eval_avg_sts": 0.8452672490522616, |
| "eval_sickr_spearman": 0.833004064676608, |
| "eval_stsb_spearman": 0.8575304334279151, |
| "step": 1300 |
| }, |
| { |
| "epoch": 1.29, |
| "eval_avg_sts": 0.8489039116599046, |
| "eval_sickr_spearman": 0.8371614927237867, |
| "eval_stsb_spearman": 0.8606463305960226, |
| "step": 1325 |
| }, |
| { |
| "epoch": 1.31, |
| "eval_avg_sts": 0.8467466937976185, |
| "eval_sickr_spearman": 0.8343573409596268, |
| "eval_stsb_spearman": 0.85913604663561, |
| "step": 1350 |
| }, |
| { |
| "epoch": 1.34, |
| "eval_avg_sts": 0.8479786014484607, |
| "eval_sickr_spearman": 0.8356114810492773, |
| "eval_stsb_spearman": 0.8603457218476441, |
| "step": 1375 |
| }, |
| { |
| "epoch": 1.36, |
| "eval_avg_sts": 0.8481320629670138, |
| "eval_sickr_spearman": 0.8365469828119875, |
| "eval_stsb_spearman": 0.8597171431220402, |
| "step": 1400 |
| }, |
| { |
| "epoch": 1.39, |
| "eval_avg_sts": 0.8493017107452288, |
| "eval_sickr_spearman": 0.8375811404570515, |
| "eval_stsb_spearman": 0.8610222810334061, |
| "step": 1425 |
| }, |
| { |
| "epoch": 1.41, |
| "eval_avg_sts": 0.8515707185583519, |
| "eval_sickr_spearman": 0.8413120523234598, |
| "eval_stsb_spearman": 0.8618293847932439, |
| "step": 1450 |
| }, |
| { |
| "epoch": 1.44, |
| "eval_avg_sts": 0.8491061717045717, |
| "eval_sickr_spearman": 0.8386661630385385, |
| "eval_stsb_spearman": 0.8595461803706049, |
| "step": 1475 |
| }, |
| { |
| "epoch": 1.46, |
| "learning_rate": 5.131450827653359e-06, |
| "loss": 0.2965, |
| "step": 1500 |
| }, |
| { |
| "epoch": 1.46, |
| "eval_avg_sts": 0.849951123911407, |
| "eval_sickr_spearman": 0.8403214588874001, |
| "eval_stsb_spearman": 0.859580788935414, |
| "step": 1500 |
| }, |
| { |
| "epoch": 1.48, |
| "eval_avg_sts": 0.8462728434267617, |
| "eval_sickr_spearman": 0.8349335220524785, |
| "eval_stsb_spearman": 0.8576121648010449, |
| "step": 1525 |
| }, |
| { |
| "epoch": 1.51, |
| "eval_avg_sts": 0.8478142980726532, |
| "eval_sickr_spearman": 0.8355811253931684, |
| "eval_stsb_spearman": 0.8600474707521379, |
| "step": 1550 |
| }, |
| { |
| "epoch": 1.53, |
| "eval_avg_sts": 0.8506859270446779, |
| "eval_sickr_spearman": 0.8387632819256463, |
| "eval_stsb_spearman": 0.8626085721637096, |
| "step": 1575 |
| }, |
| { |
| "epoch": 1.56, |
| "eval_avg_sts": 0.8491205822275252, |
| "eval_sickr_spearman": 0.8368930468978489, |
| "eval_stsb_spearman": 0.8613481175572015, |
| "step": 1600 |
| }, |
| { |
| "epoch": 1.58, |
| "eval_avg_sts": 0.8460304537726628, |
| "eval_sickr_spearman": 0.8335511389219881, |
| "eval_stsb_spearman": 0.8585097686233377, |
| "step": 1625 |
| }, |
| { |
| "epoch": 1.61, |
| "eval_avg_sts": 0.8488092782108085, |
| "eval_sickr_spearman": 0.8360739244939235, |
| "eval_stsb_spearman": 0.8615446319276937, |
| "step": 1650 |
| }, |
| { |
| "epoch": 1.63, |
| "eval_avg_sts": 0.8483771836085118, |
| "eval_sickr_spearman": 0.8353614791662919, |
| "eval_stsb_spearman": 0.8613928880507317, |
| "step": 1675 |
| }, |
| { |
| "epoch": 1.66, |
| "eval_avg_sts": 0.8482633646541247, |
| "eval_sickr_spearman": 0.835166232738946, |
| "eval_stsb_spearman": 0.8613604965693032, |
| "step": 1700 |
| }, |
| { |
| "epoch": 1.68, |
| "eval_avg_sts": 0.8494820125153382, |
| "eval_sickr_spearman": 0.8363321877263562, |
| "eval_stsb_spearman": 0.8626318373043202, |
| "step": 1725 |
| }, |
| { |
| "epoch": 1.7, |
| "eval_avg_sts": 0.84774811911999, |
| "eval_sickr_spearman": 0.8350676729187949, |
| "eval_stsb_spearman": 0.8604285653211853, |
| "step": 1750 |
| }, |
| { |
| "epoch": 1.73, |
| "eval_avg_sts": 0.8508953589183318, |
| "eval_sickr_spearman": 0.8393342276284411, |
| "eval_stsb_spearman": 0.8624564902082225, |
| "step": 1775 |
| }, |
| { |
| "epoch": 1.75, |
| "eval_avg_sts": 0.8497877526052855, |
| "eval_sickr_spearman": 0.8380021810922581, |
| "eval_stsb_spearman": 0.861573324118313, |
| "step": 1800 |
| }, |
| { |
| "epoch": 1.78, |
| "eval_avg_sts": 0.847915612163006, |
| "eval_sickr_spearman": 0.8351774720166826, |
| "eval_stsb_spearman": 0.8606537523093295, |
| "step": 1825 |
| }, |
| { |
| "epoch": 1.8, |
| "eval_avg_sts": 0.8496201121858785, |
| "eval_sickr_spearman": 0.8377723042407751, |
| "eval_stsb_spearman": 0.861467920130982, |
| "step": 1850 |
| }, |
| { |
| "epoch": 1.83, |
| "eval_avg_sts": 0.8506282266864784, |
| "eval_sickr_spearman": 0.8396311078664301, |
| "eval_stsb_spearman": 0.8616253455065267, |
| "step": 1875 |
| }, |
| { |
| "epoch": 1.85, |
| "eval_avg_sts": 0.8507148324349076, |
| "eval_sickr_spearman": 0.8398456147654526, |
| "eval_stsb_spearman": 0.8615840501043628, |
| "step": 1900 |
| }, |
| { |
| "epoch": 1.87, |
| "eval_avg_sts": 0.8528364235468135, |
| "eval_sickr_spearman": 0.8424179684340722, |
| "eval_stsb_spearman": 0.8632548786595547, |
| "step": 1925 |
| }, |
| { |
| "epoch": 1.9, |
| "eval_avg_sts": 0.8505338171378869, |
| "eval_sickr_spearman": 0.8398606965313044, |
| "eval_stsb_spearman": 0.8612069377444695, |
| "step": 1950 |
| }, |
| { |
| "epoch": 1.92, |
| "eval_avg_sts": 0.8481722210917726, |
| "eval_sickr_spearman": 0.8373791216444029, |
| "eval_stsb_spearman": 0.8589653205391424, |
| "step": 1975 |
| }, |
| { |
| "epoch": 1.95, |
| "learning_rate": 3.5086011035378126e-06, |
| "loss": 0.284, |
| "step": 2000 |
| }, |
| { |
| "epoch": 1.95, |
| "eval_avg_sts": 0.8482272752573701, |
| "eval_sickr_spearman": 0.8377695664679932, |
| "eval_stsb_spearman": 0.858684984046747, |
| "step": 2000 |
| }, |
| { |
| "epoch": 1.97, |
| "eval_avg_sts": 0.8480501028062337, |
| "eval_sickr_spearman": 0.837576385378009, |
| "eval_stsb_spearman": 0.8585238202344584, |
| "step": 2025 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_avg_sts": 0.8480832424004543, |
| "eval_sickr_spearman": 0.8374597658637174, |
| "eval_stsb_spearman": 0.8587067189371913, |
| "step": 2050 |
| }, |
| { |
| "epoch": 2.02, |
| "eval_avg_sts": 0.8499478012984727, |
| "eval_sickr_spearman": 0.8390217853135862, |
| "eval_stsb_spearman": 0.8608738172833591, |
| "step": 2075 |
| }, |
| { |
| "epoch": 2.04, |
| "eval_avg_sts": 0.8491869466527012, |
| "eval_sickr_spearman": 0.8378290289715736, |
| "eval_stsb_spearman": 0.8605448643338288, |
| "step": 2100 |
| }, |
| { |
| "epoch": 2.07, |
| "eval_avg_sts": 0.8477584257424788, |
| "eval_sickr_spearman": 0.8359002920622246, |
| "eval_stsb_spearman": 0.8596165594227332, |
| "step": 2125 |
| }, |
| { |
| "epoch": 2.09, |
| "eval_avg_sts": 0.848914705769936, |
| "eval_sickr_spearman": 0.837553906822536, |
| "eval_stsb_spearman": 0.860275504717336, |
| "step": 2150 |
| }, |
| { |
| "epoch": 2.12, |
| "eval_avg_sts": 0.849736568959095, |
| "eval_sickr_spearman": 0.8393637187247242, |
| "eval_stsb_spearman": 0.860109419193466, |
| "step": 2175 |
| }, |
| { |
| "epoch": 2.14, |
| "eval_avg_sts": 0.8495688115163362, |
| "eval_sickr_spearman": 0.8389394600057214, |
| "eval_stsb_spearman": 0.860198163026951, |
| "step": 2200 |
| }, |
| { |
| "epoch": 2.17, |
| "eval_avg_sts": 0.8483895280681955, |
| "eval_sickr_spearman": 0.8374167780279301, |
| "eval_stsb_spearman": 0.8593622781084608, |
| "step": 2225 |
| }, |
| { |
| "epoch": 2.19, |
| "eval_avg_sts": 0.8490834154561102, |
| "eval_sickr_spearman": 0.8387396506237387, |
| "eval_stsb_spearman": 0.8594271802884818, |
| "step": 2250 |
| }, |
| { |
| "epoch": 2.22, |
| "eval_avg_sts": 0.8485035624729105, |
| "eval_sickr_spearman": 0.8381763418660725, |
| "eval_stsb_spearman": 0.8588307830797486, |
| "step": 2275 |
| }, |
| { |
| "epoch": 2.24, |
| "eval_avg_sts": 0.8476220200458998, |
| "eval_sickr_spearman": 0.8364356947499554, |
| "eval_stsb_spearman": 0.8588083453418442, |
| "step": 2300 |
| }, |
| { |
| "epoch": 2.26, |
| "eval_avg_sts": 0.8471502937152022, |
| "eval_sickr_spearman": 0.8358850662030688, |
| "eval_stsb_spearman": 0.8584155212273358, |
| "step": 2325 |
| }, |
| { |
| "epoch": 2.29, |
| "eval_avg_sts": 0.8481508305259742, |
| "eval_sickr_spearman": 0.8369382921954037, |
| "eval_stsb_spearman": 0.8593633688565446, |
| "step": 2350 |
| }, |
| { |
| "epoch": 2.31, |
| "eval_avg_sts": 0.8478439833733975, |
| "eval_sickr_spearman": 0.8367764273835573, |
| "eval_stsb_spearman": 0.8589115393632376, |
| "step": 2375 |
| }, |
| { |
| "epoch": 2.34, |
| "eval_avg_sts": 0.8466942437126351, |
| "eval_sickr_spearman": 0.8354506248905611, |
| "eval_stsb_spearman": 0.8579378625347092, |
| "step": 2400 |
| }, |
| { |
| "epoch": 2.36, |
| "eval_avg_sts": 0.8477441088420843, |
| "eval_sickr_spearman": 0.8366948705733154, |
| "eval_stsb_spearman": 0.8587933471108533, |
| "step": 2425 |
| }, |
| { |
| "epoch": 2.39, |
| "eval_avg_sts": 0.8488516946426614, |
| "eval_sickr_spearman": 0.8377335431419145, |
| "eval_stsb_spearman": 0.8599698461434083, |
| "step": 2450 |
| }, |
| { |
| "epoch": 2.41, |
| "eval_avg_sts": 0.8480771808294114, |
| "eval_sickr_spearman": 0.8370132207136473, |
| "eval_stsb_spearman": 0.8591411409451756, |
| "step": 2475 |
| }, |
| { |
| "epoch": 2.43, |
| "learning_rate": 1.8857513794222658e-06, |
| "loss": 0.2655, |
| "step": 2500 |
| }, |
| { |
| "epoch": 2.43, |
| "eval_avg_sts": 0.8487999481558521, |
| "eval_sickr_spearman": 0.8377923812411763, |
| "eval_stsb_spearman": 0.8598075150705279, |
| "step": 2500 |
| }, |
| { |
| "epoch": 2.46, |
| "eval_avg_sts": 0.848399750999945, |
| "eval_sickr_spearman": 0.8369205206878717, |
| "eval_stsb_spearman": 0.8598789813120182, |
| "step": 2525 |
| }, |
| { |
| "epoch": 2.48, |
| "eval_avg_sts": 0.8485584973593749, |
| "eval_sickr_spearman": 0.8373407447943537, |
| "eval_stsb_spearman": 0.8597762499243962, |
| "step": 2550 |
| }, |
| { |
| "epoch": 2.51, |
| "eval_avg_sts": 0.8484553378772859, |
| "eval_sickr_spearman": 0.8371878137673748, |
| "eval_stsb_spearman": 0.8597228619871968, |
| "step": 2575 |
| }, |
| { |
| "epoch": 2.53, |
| "eval_avg_sts": 0.8480636244098692, |
| "eval_sickr_spearman": 0.8368399244996585, |
| "eval_stsb_spearman": 0.8592873243200797, |
| "step": 2600 |
| }, |
| { |
| "epoch": 2.56, |
| "eval_avg_sts": 0.8487639345972604, |
| "eval_sickr_spearman": 0.8379995874127802, |
| "eval_stsb_spearman": 0.8595282817817406, |
| "step": 2625 |
| }, |
| { |
| "epoch": 2.58, |
| "eval_avg_sts": 0.8484073121905233, |
| "eval_sickr_spearman": 0.8373334920980365, |
| "eval_stsb_spearman": 0.85948113228301, |
| "step": 2650 |
| }, |
| { |
| "epoch": 2.6, |
| "eval_avg_sts": 0.8495353514397407, |
| "eval_sickr_spearman": 0.8388814384351839, |
| "eval_stsb_spearman": 0.8601892644442974, |
| "step": 2675 |
| }, |
| { |
| "epoch": 2.63, |
| "eval_avg_sts": 0.8488734860883285, |
| "eval_sickr_spearman": 0.8376559248819906, |
| "eval_stsb_spearman": 0.8600910472946663, |
| "step": 2700 |
| }, |
| { |
| "epoch": 2.65, |
| "eval_avg_sts": 0.8485291479370792, |
| "eval_sickr_spearman": 0.8370302717546578, |
| "eval_stsb_spearman": 0.8600280241195006, |
| "step": 2725 |
| }, |
| { |
| "epoch": 2.68, |
| "eval_avg_sts": 0.8484609936724099, |
| "eval_sickr_spearman": 0.8370401181304525, |
| "eval_stsb_spearman": 0.8598818692143673, |
| "step": 2750 |
| }, |
| { |
| "epoch": 2.7, |
| "eval_avg_sts": 0.8487467947632423, |
| "eval_sickr_spearman": 0.8374640886628467, |
| "eval_stsb_spearman": 0.8600295008636379, |
| "step": 2775 |
| }, |
| { |
| "epoch": 2.73, |
| "eval_avg_sts": 0.8487549703295775, |
| "eval_sickr_spearman": 0.8377412761492462, |
| "eval_stsb_spearman": 0.8597686645099087, |
| "step": 2800 |
| }, |
| { |
| "epoch": 2.75, |
| "eval_avg_sts": 0.8483512050356906, |
| "eval_sickr_spearman": 0.8371601478529463, |
| "eval_stsb_spearman": 0.8595422622184349, |
| "step": 2825 |
| }, |
| { |
| "epoch": 2.78, |
| "eval_avg_sts": 0.8487416863586705, |
| "eval_sickr_spearman": 0.8376103433667258, |
| "eval_stsb_spearman": 0.8598730293506154, |
| "step": 2850 |
| }, |
| { |
| "epoch": 2.8, |
| "eval_avg_sts": 0.8486695192263061, |
| "eval_sickr_spearman": 0.8374840215699435, |
| "eval_stsb_spearman": 0.8598550168826687, |
| "step": 2875 |
| }, |
| { |
| "epoch": 2.82, |
| "eval_avg_sts": 0.8490062168713867, |
| "eval_sickr_spearman": 0.8380430075284804, |
| "eval_stsb_spearman": 0.859969426214293, |
| "step": 2900 |
| }, |
| { |
| "epoch": 2.85, |
| "eval_avg_sts": 0.8488936976734611, |
| "eval_sickr_spearman": 0.8378850332358503, |
| "eval_stsb_spearman": 0.859902362111072, |
| "step": 2925 |
| }, |
| { |
| "epoch": 2.87, |
| "eval_avg_sts": 0.8489709020581676, |
| "eval_sickr_spearman": 0.8379462248590827, |
| "eval_stsb_spearman": 0.8599955792572526, |
| "step": 2950 |
| }, |
| { |
| "epoch": 2.9, |
| "eval_avg_sts": 0.8487957508450565, |
| "eval_sickr_spearman": 0.8376585185614683, |
| "eval_stsb_spearman": 0.8599329831286449, |
| "step": 2975 |
| }, |
| { |
| "epoch": 2.92, |
| "learning_rate": 2.6290165530671865e-07, |
| "loss": 0.263, |
| "step": 3000 |
| }, |
| { |
| "epoch": 2.92, |
| "eval_avg_sts": 0.8485199174178477, |
| "eval_sickr_spearman": 0.837266008400516, |
| "eval_stsb_spearman": 0.8597738264351793, |
| "step": 3000 |
| }, |
| { |
| "epoch": 2.95, |
| "eval_avg_sts": 0.8483285540592784, |
| "eval_sickr_spearman": 0.837077006016357, |
| "eval_stsb_spearman": 0.8595801021021999, |
| "step": 3025 |
| }, |
| { |
| "epoch": 2.97, |
| "eval_avg_sts": 0.8483039392081567, |
| "eval_sickr_spearman": 0.8370466464338976, |
| "eval_stsb_spearman": 0.8595612319824159, |
| "step": 3050 |
| }, |
| { |
| "epoch": 2.99, |
| "eval_avg_sts": 0.8482931559093356, |
| "eval_sickr_spearman": 0.837029215070426, |
| "eval_stsb_spearman": 0.8595570967482453, |
| "step": 3075 |
| }, |
| { |
| "epoch": 3.0, |
| "step": 3081, |
| "train_runtime": 8699.7484, |
| "train_samples_per_second": 0.354 |
| } |
| ], |
| "max_steps": 3081, |
| "num_train_epochs": 3, |
| "total_flos": 333879495592513536, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|