syncse-bert-large-uncased / trainer_state.json
leoner24's picture
Upload 9 files
4e77c55 verified
{
"best_metric": 0.8528364235468135,
"best_model_checkpoint": "checkpoints/bert-large-uncased",
"epoch": 3.0,
"global_step": 3081,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.02,
"eval_avg_sts": 0.7741718103390286,
"eval_sickr_spearman": 0.745954513736433,
"eval_stsb_spearman": 0.8023891069416242,
"step": 25
},
{
"epoch": 0.05,
"eval_avg_sts": 0.8081911987521978,
"eval_sickr_spearman": 0.779239730815335,
"eval_stsb_spearman": 0.8371426666890606,
"step": 50
},
{
"epoch": 0.07,
"eval_avg_sts": 0.8136161115454807,
"eval_sickr_spearman": 0.7835086390489516,
"eval_stsb_spearman": 0.8437235840420098,
"step": 75
},
{
"epoch": 0.1,
"eval_avg_sts": 0.8155047769520929,
"eval_sickr_spearman": 0.7852900645701897,
"eval_stsb_spearman": 0.845719489333996,
"step": 100
},
{
"epoch": 0.12,
"eval_avg_sts": 0.8238067491381542,
"eval_sickr_spearman": 0.7985816632400571,
"eval_stsb_spearman": 0.8490318350362512,
"step": 125
},
{
"epoch": 0.15,
"eval_avg_sts": 0.8224993495563874,
"eval_sickr_spearman": 0.7982152819982874,
"eval_stsb_spearman": 0.8467834171144873,
"step": 150
},
{
"epoch": 0.17,
"eval_avg_sts": 0.8263297389680633,
"eval_sickr_spearman": 0.8034025929225019,
"eval_stsb_spearman": 0.8492568850136247,
"step": 175
},
{
"epoch": 0.19,
"eval_avg_sts": 0.82711974150715,
"eval_sickr_spearman": 0.8028132513078563,
"eval_stsb_spearman": 0.8514262317064436,
"step": 200
},
{
"epoch": 0.22,
"eval_avg_sts": 0.8285051091857007,
"eval_sickr_spearman": 0.8064033359848481,
"eval_stsb_spearman": 0.8506068823865535,
"step": 225
},
{
"epoch": 0.24,
"eval_avg_sts": 0.8308924909456856,
"eval_sickr_spearman": 0.8108744071244177,
"eval_stsb_spearman": 0.8509105747669534,
"step": 250
},
{
"epoch": 0.27,
"eval_avg_sts": 0.8292742145946509,
"eval_sickr_spearman": 0.8081889402119113,
"eval_stsb_spearman": 0.8503594889773904,
"step": 275
},
{
"epoch": 0.29,
"eval_avg_sts": 0.8302783515064169,
"eval_sickr_spearman": 0.8108542340618137,
"eval_stsb_spearman": 0.8497024689510201,
"step": 300
},
{
"epoch": 0.32,
"eval_avg_sts": 0.8354548973044524,
"eval_sickr_spearman": 0.8162711816820041,
"eval_stsb_spearman": 0.8546386129269009,
"step": 325
},
{
"epoch": 0.34,
"eval_avg_sts": 0.8376245074641093,
"eval_sickr_spearman": 0.820640234762119,
"eval_stsb_spearman": 0.8546087801660995,
"step": 350
},
{
"epoch": 0.37,
"eval_avg_sts": 0.842346577377938,
"eval_sickr_spearman": 0.8251871470108594,
"eval_stsb_spearman": 0.8595060077450167,
"step": 375
},
{
"epoch": 0.39,
"eval_avg_sts": 0.8392487017993179,
"eval_sickr_spearman": 0.8222254052028811,
"eval_stsb_spearman": 0.8562719983957546,
"step": 400
},
{
"epoch": 0.41,
"eval_avg_sts": 0.836585408133989,
"eval_sickr_spearman": 0.8178774858073988,
"eval_stsb_spearman": 0.855293330460579,
"step": 425
},
{
"epoch": 0.44,
"eval_avg_sts": 0.8377417996341128,
"eval_sickr_spearman": 0.8186622659737961,
"eval_stsb_spearman": 0.8568213332944294,
"step": 450
},
{
"epoch": 0.46,
"eval_avg_sts": 0.8409718734645293,
"eval_sickr_spearman": 0.8244389665437579,
"eval_stsb_spearman": 0.8575047803853006,
"step": 475
},
{
"epoch": 0.49,
"learning_rate": 8.377150275884453e-06,
"loss": 0.5144,
"step": 500
},
{
"epoch": 0.49,
"eval_avg_sts": 0.8409672497360382,
"eval_sickr_spearman": 0.8242925677465746,
"eval_stsb_spearman": 0.8576419317255018,
"step": 500
},
{
"epoch": 0.51,
"eval_avg_sts": 0.8413119218825833,
"eval_sickr_spearman": 0.8241660538253865,
"eval_stsb_spearman": 0.85845778993978,
"step": 525
},
{
"epoch": 0.54,
"eval_avg_sts": 0.8405090163812534,
"eval_sickr_spearman": 0.8231903980618742,
"eval_stsb_spearman": 0.8578276347006326,
"step": 550
},
{
"epoch": 0.56,
"eval_avg_sts": 0.8461025764167975,
"eval_sickr_spearman": 0.8310040496127249,
"eval_stsb_spearman": 0.8612011032208701,
"step": 575
},
{
"epoch": 0.58,
"eval_avg_sts": 0.8447104900811846,
"eval_sickr_spearman": 0.8284478343941886,
"eval_stsb_spearman": 0.8609731457681805,
"step": 600
},
{
"epoch": 0.61,
"eval_avg_sts": 0.8462395445603483,
"eval_sickr_spearman": 0.8308051047905681,
"eval_stsb_spearman": 0.8616739843301284,
"step": 625
},
{
"epoch": 0.63,
"eval_avg_sts": 0.8436677522914944,
"eval_sickr_spearman": 0.8276286639591616,
"eval_stsb_spearman": 0.8597068406238272,
"step": 650
},
{
"epoch": 0.66,
"eval_avg_sts": 0.8447115186169327,
"eval_sickr_spearman": 0.8297105720509965,
"eval_stsb_spearman": 0.8597124651828688,
"step": 675
},
{
"epoch": 0.68,
"eval_avg_sts": 0.8434972279862564,
"eval_sickr_spearman": 0.8294735385653995,
"eval_stsb_spearman": 0.8575209174071132,
"step": 700
},
{
"epoch": 0.71,
"eval_avg_sts": 0.8440935405127372,
"eval_sickr_spearman": 0.8307528469522036,
"eval_stsb_spearman": 0.8574342340732707,
"step": 725
},
{
"epoch": 0.73,
"eval_avg_sts": 0.8430030266304707,
"eval_sickr_spearman": 0.8273284695751733,
"eval_stsb_spearman": 0.858677583685768,
"step": 750
},
{
"epoch": 0.75,
"eval_avg_sts": 0.8459169389588843,
"eval_sickr_spearman": 0.8317631811709543,
"eval_stsb_spearman": 0.8600706967468144,
"step": 775
},
{
"epoch": 0.78,
"eval_avg_sts": 0.8451542594549106,
"eval_sickr_spearman": 0.8302367527672511,
"eval_stsb_spearman": 0.8600717661425702,
"step": 800
},
{
"epoch": 0.8,
"eval_avg_sts": 0.8441819324586433,
"eval_sickr_spearman": 0.8280832303031719,
"eval_stsb_spearman": 0.8602806346141146,
"step": 825
},
{
"epoch": 0.83,
"eval_avg_sts": 0.84041329364274,
"eval_sickr_spearman": 0.8234209671109596,
"eval_stsb_spearman": 0.8574056201745204,
"step": 850
},
{
"epoch": 0.85,
"eval_avg_sts": 0.8463098863081795,
"eval_sickr_spearman": 0.8311718222500483,
"eval_stsb_spearman": 0.8614479503663108,
"step": 875
},
{
"epoch": 0.88,
"eval_avg_sts": 0.8489707536403015,
"eval_sickr_spearman": 0.8359545191757484,
"eval_stsb_spearman": 0.8619869881048546,
"step": 900
},
{
"epoch": 0.9,
"eval_avg_sts": 0.8459381219997153,
"eval_sickr_spearman": 0.8324996900804063,
"eval_stsb_spearman": 0.8593765539190245,
"step": 925
},
{
"epoch": 0.93,
"eval_avg_sts": 0.8441563920982813,
"eval_sickr_spearman": 0.8308032796087136,
"eval_stsb_spearman": 0.8575095045878491,
"step": 950
},
{
"epoch": 0.95,
"eval_avg_sts": 0.8417274944195297,
"eval_sickr_spearman": 0.8286961551886236,
"eval_stsb_spearman": 0.8547588336504358,
"step": 975
},
{
"epoch": 0.97,
"learning_rate": 6.754300551768907e-06,
"loss": 0.338,
"step": 1000
},
{
"epoch": 0.97,
"eval_avg_sts": 0.8439797180911035,
"eval_sickr_spearman": 0.8322901784159331,
"eval_stsb_spearman": 0.8556692577662738,
"step": 1000
},
{
"epoch": 1.0,
"eval_avg_sts": 0.846580279698808,
"eval_sickr_spearman": 0.8351822751268263,
"eval_stsb_spearman": 0.8579782842707896,
"step": 1025
},
{
"epoch": 1.02,
"eval_avg_sts": 0.8444154454958996,
"eval_sickr_spearman": 0.8319871021658588,
"eval_stsb_spearman": 0.8568437888259406,
"step": 1050
},
{
"epoch": 1.05,
"eval_avg_sts": 0.8432409670453203,
"eval_sickr_spearman": 0.8314499703584763,
"eval_stsb_spearman": 0.8550319637321643,
"step": 1075
},
{
"epoch": 1.07,
"eval_avg_sts": 0.8446753892080279,
"eval_sickr_spearman": 0.8331656893329471,
"eval_stsb_spearman": 0.8561850890831085,
"step": 1100
},
{
"epoch": 1.1,
"eval_avg_sts": 0.8474510190292008,
"eval_sickr_spearman": 0.8356278596548676,
"eval_stsb_spearman": 0.8592741784035342,
"step": 1125
},
{
"epoch": 1.12,
"eval_avg_sts": 0.8505734569059473,
"eval_sickr_spearman": 0.8389641479918606,
"eval_stsb_spearman": 0.862182765820034,
"step": 1150
},
{
"epoch": 1.14,
"eval_avg_sts": 0.8521021908496921,
"eval_sickr_spearman": 0.8412426954129831,
"eval_stsb_spearman": 0.862961686286401,
"step": 1175
},
{
"epoch": 1.17,
"eval_avg_sts": 0.8514560490494238,
"eval_sickr_spearman": 0.840301718104709,
"eval_stsb_spearman": 0.8626103799941387,
"step": 1200
},
{
"epoch": 1.19,
"eval_avg_sts": 0.8486972541916555,
"eval_sickr_spearman": 0.8367856973861348,
"eval_stsb_spearman": 0.8606088109971762,
"step": 1225
},
{
"epoch": 1.22,
"eval_avg_sts": 0.848898608926278,
"eval_sickr_spearman": 0.8370826736863266,
"eval_stsb_spearman": 0.8607145441662293,
"step": 1250
},
{
"epoch": 1.24,
"eval_avg_sts": 0.8454701656945296,
"eval_sickr_spearman": 0.8321730305595257,
"eval_stsb_spearman": 0.8587673008295333,
"step": 1275
},
{
"epoch": 1.27,
"eval_avg_sts": 0.8452672490522616,
"eval_sickr_spearman": 0.833004064676608,
"eval_stsb_spearman": 0.8575304334279151,
"step": 1300
},
{
"epoch": 1.29,
"eval_avg_sts": 0.8489039116599046,
"eval_sickr_spearman": 0.8371614927237867,
"eval_stsb_spearman": 0.8606463305960226,
"step": 1325
},
{
"epoch": 1.31,
"eval_avg_sts": 0.8467466937976185,
"eval_sickr_spearman": 0.8343573409596268,
"eval_stsb_spearman": 0.85913604663561,
"step": 1350
},
{
"epoch": 1.34,
"eval_avg_sts": 0.8479786014484607,
"eval_sickr_spearman": 0.8356114810492773,
"eval_stsb_spearman": 0.8603457218476441,
"step": 1375
},
{
"epoch": 1.36,
"eval_avg_sts": 0.8481320629670138,
"eval_sickr_spearman": 0.8365469828119875,
"eval_stsb_spearman": 0.8597171431220402,
"step": 1400
},
{
"epoch": 1.39,
"eval_avg_sts": 0.8493017107452288,
"eval_sickr_spearman": 0.8375811404570515,
"eval_stsb_spearman": 0.8610222810334061,
"step": 1425
},
{
"epoch": 1.41,
"eval_avg_sts": 0.8515707185583519,
"eval_sickr_spearman": 0.8413120523234598,
"eval_stsb_spearman": 0.8618293847932439,
"step": 1450
},
{
"epoch": 1.44,
"eval_avg_sts": 0.8491061717045717,
"eval_sickr_spearman": 0.8386661630385385,
"eval_stsb_spearman": 0.8595461803706049,
"step": 1475
},
{
"epoch": 1.46,
"learning_rate": 5.131450827653359e-06,
"loss": 0.2965,
"step": 1500
},
{
"epoch": 1.46,
"eval_avg_sts": 0.849951123911407,
"eval_sickr_spearman": 0.8403214588874001,
"eval_stsb_spearman": 0.859580788935414,
"step": 1500
},
{
"epoch": 1.48,
"eval_avg_sts": 0.8462728434267617,
"eval_sickr_spearman": 0.8349335220524785,
"eval_stsb_spearman": 0.8576121648010449,
"step": 1525
},
{
"epoch": 1.51,
"eval_avg_sts": 0.8478142980726532,
"eval_sickr_spearman": 0.8355811253931684,
"eval_stsb_spearman": 0.8600474707521379,
"step": 1550
},
{
"epoch": 1.53,
"eval_avg_sts": 0.8506859270446779,
"eval_sickr_spearman": 0.8387632819256463,
"eval_stsb_spearman": 0.8626085721637096,
"step": 1575
},
{
"epoch": 1.56,
"eval_avg_sts": 0.8491205822275252,
"eval_sickr_spearman": 0.8368930468978489,
"eval_stsb_spearman": 0.8613481175572015,
"step": 1600
},
{
"epoch": 1.58,
"eval_avg_sts": 0.8460304537726628,
"eval_sickr_spearman": 0.8335511389219881,
"eval_stsb_spearman": 0.8585097686233377,
"step": 1625
},
{
"epoch": 1.61,
"eval_avg_sts": 0.8488092782108085,
"eval_sickr_spearman": 0.8360739244939235,
"eval_stsb_spearman": 0.8615446319276937,
"step": 1650
},
{
"epoch": 1.63,
"eval_avg_sts": 0.8483771836085118,
"eval_sickr_spearman": 0.8353614791662919,
"eval_stsb_spearman": 0.8613928880507317,
"step": 1675
},
{
"epoch": 1.66,
"eval_avg_sts": 0.8482633646541247,
"eval_sickr_spearman": 0.835166232738946,
"eval_stsb_spearman": 0.8613604965693032,
"step": 1700
},
{
"epoch": 1.68,
"eval_avg_sts": 0.8494820125153382,
"eval_sickr_spearman": 0.8363321877263562,
"eval_stsb_spearman": 0.8626318373043202,
"step": 1725
},
{
"epoch": 1.7,
"eval_avg_sts": 0.84774811911999,
"eval_sickr_spearman": 0.8350676729187949,
"eval_stsb_spearman": 0.8604285653211853,
"step": 1750
},
{
"epoch": 1.73,
"eval_avg_sts": 0.8508953589183318,
"eval_sickr_spearman": 0.8393342276284411,
"eval_stsb_spearman": 0.8624564902082225,
"step": 1775
},
{
"epoch": 1.75,
"eval_avg_sts": 0.8497877526052855,
"eval_sickr_spearman": 0.8380021810922581,
"eval_stsb_spearman": 0.861573324118313,
"step": 1800
},
{
"epoch": 1.78,
"eval_avg_sts": 0.847915612163006,
"eval_sickr_spearman": 0.8351774720166826,
"eval_stsb_spearman": 0.8606537523093295,
"step": 1825
},
{
"epoch": 1.8,
"eval_avg_sts": 0.8496201121858785,
"eval_sickr_spearman": 0.8377723042407751,
"eval_stsb_spearman": 0.861467920130982,
"step": 1850
},
{
"epoch": 1.83,
"eval_avg_sts": 0.8506282266864784,
"eval_sickr_spearman": 0.8396311078664301,
"eval_stsb_spearman": 0.8616253455065267,
"step": 1875
},
{
"epoch": 1.85,
"eval_avg_sts": 0.8507148324349076,
"eval_sickr_spearman": 0.8398456147654526,
"eval_stsb_spearman": 0.8615840501043628,
"step": 1900
},
{
"epoch": 1.87,
"eval_avg_sts": 0.8528364235468135,
"eval_sickr_spearman": 0.8424179684340722,
"eval_stsb_spearman": 0.8632548786595547,
"step": 1925
},
{
"epoch": 1.9,
"eval_avg_sts": 0.8505338171378869,
"eval_sickr_spearman": 0.8398606965313044,
"eval_stsb_spearman": 0.8612069377444695,
"step": 1950
},
{
"epoch": 1.92,
"eval_avg_sts": 0.8481722210917726,
"eval_sickr_spearman": 0.8373791216444029,
"eval_stsb_spearman": 0.8589653205391424,
"step": 1975
},
{
"epoch": 1.95,
"learning_rate": 3.5086011035378126e-06,
"loss": 0.284,
"step": 2000
},
{
"epoch": 1.95,
"eval_avg_sts": 0.8482272752573701,
"eval_sickr_spearman": 0.8377695664679932,
"eval_stsb_spearman": 0.858684984046747,
"step": 2000
},
{
"epoch": 1.97,
"eval_avg_sts": 0.8480501028062337,
"eval_sickr_spearman": 0.837576385378009,
"eval_stsb_spearman": 0.8585238202344584,
"step": 2025
},
{
"epoch": 2.0,
"eval_avg_sts": 0.8480832424004543,
"eval_sickr_spearman": 0.8374597658637174,
"eval_stsb_spearman": 0.8587067189371913,
"step": 2050
},
{
"epoch": 2.02,
"eval_avg_sts": 0.8499478012984727,
"eval_sickr_spearman": 0.8390217853135862,
"eval_stsb_spearman": 0.8608738172833591,
"step": 2075
},
{
"epoch": 2.04,
"eval_avg_sts": 0.8491869466527012,
"eval_sickr_spearman": 0.8378290289715736,
"eval_stsb_spearman": 0.8605448643338288,
"step": 2100
},
{
"epoch": 2.07,
"eval_avg_sts": 0.8477584257424788,
"eval_sickr_spearman": 0.8359002920622246,
"eval_stsb_spearman": 0.8596165594227332,
"step": 2125
},
{
"epoch": 2.09,
"eval_avg_sts": 0.848914705769936,
"eval_sickr_spearman": 0.837553906822536,
"eval_stsb_spearman": 0.860275504717336,
"step": 2150
},
{
"epoch": 2.12,
"eval_avg_sts": 0.849736568959095,
"eval_sickr_spearman": 0.8393637187247242,
"eval_stsb_spearman": 0.860109419193466,
"step": 2175
},
{
"epoch": 2.14,
"eval_avg_sts": 0.8495688115163362,
"eval_sickr_spearman": 0.8389394600057214,
"eval_stsb_spearman": 0.860198163026951,
"step": 2200
},
{
"epoch": 2.17,
"eval_avg_sts": 0.8483895280681955,
"eval_sickr_spearman": 0.8374167780279301,
"eval_stsb_spearman": 0.8593622781084608,
"step": 2225
},
{
"epoch": 2.19,
"eval_avg_sts": 0.8490834154561102,
"eval_sickr_spearman": 0.8387396506237387,
"eval_stsb_spearman": 0.8594271802884818,
"step": 2250
},
{
"epoch": 2.22,
"eval_avg_sts": 0.8485035624729105,
"eval_sickr_spearman": 0.8381763418660725,
"eval_stsb_spearman": 0.8588307830797486,
"step": 2275
},
{
"epoch": 2.24,
"eval_avg_sts": 0.8476220200458998,
"eval_sickr_spearman": 0.8364356947499554,
"eval_stsb_spearman": 0.8588083453418442,
"step": 2300
},
{
"epoch": 2.26,
"eval_avg_sts": 0.8471502937152022,
"eval_sickr_spearman": 0.8358850662030688,
"eval_stsb_spearman": 0.8584155212273358,
"step": 2325
},
{
"epoch": 2.29,
"eval_avg_sts": 0.8481508305259742,
"eval_sickr_spearman": 0.8369382921954037,
"eval_stsb_spearman": 0.8593633688565446,
"step": 2350
},
{
"epoch": 2.31,
"eval_avg_sts": 0.8478439833733975,
"eval_sickr_spearman": 0.8367764273835573,
"eval_stsb_spearman": 0.8589115393632376,
"step": 2375
},
{
"epoch": 2.34,
"eval_avg_sts": 0.8466942437126351,
"eval_sickr_spearman": 0.8354506248905611,
"eval_stsb_spearman": 0.8579378625347092,
"step": 2400
},
{
"epoch": 2.36,
"eval_avg_sts": 0.8477441088420843,
"eval_sickr_spearman": 0.8366948705733154,
"eval_stsb_spearman": 0.8587933471108533,
"step": 2425
},
{
"epoch": 2.39,
"eval_avg_sts": 0.8488516946426614,
"eval_sickr_spearman": 0.8377335431419145,
"eval_stsb_spearman": 0.8599698461434083,
"step": 2450
},
{
"epoch": 2.41,
"eval_avg_sts": 0.8480771808294114,
"eval_sickr_spearman": 0.8370132207136473,
"eval_stsb_spearman": 0.8591411409451756,
"step": 2475
},
{
"epoch": 2.43,
"learning_rate": 1.8857513794222658e-06,
"loss": 0.2655,
"step": 2500
},
{
"epoch": 2.43,
"eval_avg_sts": 0.8487999481558521,
"eval_sickr_spearman": 0.8377923812411763,
"eval_stsb_spearman": 0.8598075150705279,
"step": 2500
},
{
"epoch": 2.46,
"eval_avg_sts": 0.848399750999945,
"eval_sickr_spearman": 0.8369205206878717,
"eval_stsb_spearman": 0.8598789813120182,
"step": 2525
},
{
"epoch": 2.48,
"eval_avg_sts": 0.8485584973593749,
"eval_sickr_spearman": 0.8373407447943537,
"eval_stsb_spearman": 0.8597762499243962,
"step": 2550
},
{
"epoch": 2.51,
"eval_avg_sts": 0.8484553378772859,
"eval_sickr_spearman": 0.8371878137673748,
"eval_stsb_spearman": 0.8597228619871968,
"step": 2575
},
{
"epoch": 2.53,
"eval_avg_sts": 0.8480636244098692,
"eval_sickr_spearman": 0.8368399244996585,
"eval_stsb_spearman": 0.8592873243200797,
"step": 2600
},
{
"epoch": 2.56,
"eval_avg_sts": 0.8487639345972604,
"eval_sickr_spearman": 0.8379995874127802,
"eval_stsb_spearman": 0.8595282817817406,
"step": 2625
},
{
"epoch": 2.58,
"eval_avg_sts": 0.8484073121905233,
"eval_sickr_spearman": 0.8373334920980365,
"eval_stsb_spearman": 0.85948113228301,
"step": 2650
},
{
"epoch": 2.6,
"eval_avg_sts": 0.8495353514397407,
"eval_sickr_spearman": 0.8388814384351839,
"eval_stsb_spearman": 0.8601892644442974,
"step": 2675
},
{
"epoch": 2.63,
"eval_avg_sts": 0.8488734860883285,
"eval_sickr_spearman": 0.8376559248819906,
"eval_stsb_spearman": 0.8600910472946663,
"step": 2700
},
{
"epoch": 2.65,
"eval_avg_sts": 0.8485291479370792,
"eval_sickr_spearman": 0.8370302717546578,
"eval_stsb_spearman": 0.8600280241195006,
"step": 2725
},
{
"epoch": 2.68,
"eval_avg_sts": 0.8484609936724099,
"eval_sickr_spearman": 0.8370401181304525,
"eval_stsb_spearman": 0.8598818692143673,
"step": 2750
},
{
"epoch": 2.7,
"eval_avg_sts": 0.8487467947632423,
"eval_sickr_spearman": 0.8374640886628467,
"eval_stsb_spearman": 0.8600295008636379,
"step": 2775
},
{
"epoch": 2.73,
"eval_avg_sts": 0.8487549703295775,
"eval_sickr_spearman": 0.8377412761492462,
"eval_stsb_spearman": 0.8597686645099087,
"step": 2800
},
{
"epoch": 2.75,
"eval_avg_sts": 0.8483512050356906,
"eval_sickr_spearman": 0.8371601478529463,
"eval_stsb_spearman": 0.8595422622184349,
"step": 2825
},
{
"epoch": 2.78,
"eval_avg_sts": 0.8487416863586705,
"eval_sickr_spearman": 0.8376103433667258,
"eval_stsb_spearman": 0.8598730293506154,
"step": 2850
},
{
"epoch": 2.8,
"eval_avg_sts": 0.8486695192263061,
"eval_sickr_spearman": 0.8374840215699435,
"eval_stsb_spearman": 0.8598550168826687,
"step": 2875
},
{
"epoch": 2.82,
"eval_avg_sts": 0.8490062168713867,
"eval_sickr_spearman": 0.8380430075284804,
"eval_stsb_spearman": 0.859969426214293,
"step": 2900
},
{
"epoch": 2.85,
"eval_avg_sts": 0.8488936976734611,
"eval_sickr_spearman": 0.8378850332358503,
"eval_stsb_spearman": 0.859902362111072,
"step": 2925
},
{
"epoch": 2.87,
"eval_avg_sts": 0.8489709020581676,
"eval_sickr_spearman": 0.8379462248590827,
"eval_stsb_spearman": 0.8599955792572526,
"step": 2950
},
{
"epoch": 2.9,
"eval_avg_sts": 0.8487957508450565,
"eval_sickr_spearman": 0.8376585185614683,
"eval_stsb_spearman": 0.8599329831286449,
"step": 2975
},
{
"epoch": 2.92,
"learning_rate": 2.6290165530671865e-07,
"loss": 0.263,
"step": 3000
},
{
"epoch": 2.92,
"eval_avg_sts": 0.8485199174178477,
"eval_sickr_spearman": 0.837266008400516,
"eval_stsb_spearman": 0.8597738264351793,
"step": 3000
},
{
"epoch": 2.95,
"eval_avg_sts": 0.8483285540592784,
"eval_sickr_spearman": 0.837077006016357,
"eval_stsb_spearman": 0.8595801021021999,
"step": 3025
},
{
"epoch": 2.97,
"eval_avg_sts": 0.8483039392081567,
"eval_sickr_spearman": 0.8370466464338976,
"eval_stsb_spearman": 0.8595612319824159,
"step": 3050
},
{
"epoch": 2.99,
"eval_avg_sts": 0.8482931559093356,
"eval_sickr_spearman": 0.837029215070426,
"eval_stsb_spearman": 0.8595570967482453,
"step": 3075
},
{
"epoch": 3.0,
"step": 3081,
"train_runtime": 8699.7484,
"train_samples_per_second": 0.354
}
],
"max_steps": 3081,
"num_train_epochs": 3,
"total_flos": 333879495592513536,
"trial_name": null,
"trial_params": null
}