HA_Model / history.json
s672's picture
Upload 349 files
6517100 verified
[
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7139888211265206,
"ce": 2.173877529203892,
"ppl": 60.757540481090544,
"ce_q1": 2.1838535536527632,
"ppl_q1": 115.62192355263234,
"ce_q2": 2.1138189733922483,
"ppl_q2": 48.1492883554697,
"ce_q3": 2.1145093555152417,
"ppl_q3": 46.6759974821806,
"ce_q4": 2.283328231215477,
"ppl_q4": 55.76164192140102,
"duration": 9990.135685920715
},
"valid": {
"ce": 1.0578475564341001,
"ppl": 2.893735858458507,
"ce_q1": 0.8746125328389904,
"ppl_q1": 2.4088701175737985,
"ce_q2": 1.0117945640901975,
"ppl_q2": 2.7619081660162044,
"ce_q3": 1.1037901828560648,
"ppl_q3": 3.0297150551518306,
"ce_q4": 1.2411929655678664,
"ppl_q4": 3.4810384315780447,
"duration": 407.02404022216797
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8952568171471358,
"ce": 0.7622833101004363,
"ppl": 2.1785739208459853,
"ce_q1": 0.6102545861527324,
"ppl_q1": 1.8633524129390717,
"ce_q2": 0.7152881208211184,
"ppl_q2": 2.0762058873176574,
"ce_q3": 0.8027887784391642,
"ppl_q3": 2.2717719178795814,
"ce_q4": 0.9208017558455467,
"ppl_q4": 2.5662533673644066,
"duration": 9709.127085208893
},
"valid": {
"ce": 0.5298309620422653,
"ppl": 1.7057806615588031,
"ce_q1": 0.4215273404423195,
"ppl_q1": 1.5294293919696083,
"ce_q2": 0.4916270382796662,
"ppl_q2": 1.6408522943907147,
"ce_q3": 0.556915718166134,
"ppl_q3": 1.7529149945778182,
"ce_q4": 0.6492537422270714,
"ppl_q4": 1.9257941849624054,
"duration": 364.33030819892883
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 1.658758140772581,
"ce": 0.458900987342,
"ppl": 1.5914587651491165,
"ce_q1": 0.3663528805151582,
"ppl_q1": 1.4481512227654456,
"ce_q2": 0.42124617391079666,
"ppl_q2": 1.5312033806443215,
"ce_q3": 0.483467122554779,
"ppl_q3": 1.6320633321404456,
"ce_q4": 0.5645377744883299,
"ppl_q4": 1.774294057071209,
"duration": 9646.101248264313
},
"valid": {
"ce": 0.38792591796645637,
"ppl": 1.4795975096618073,
"ce_q1": 0.30983398270003404,
"ppl_q1": 1.3670947385739676,
"ce_q2": 0.3550876360150832,
"ppl_q2": 1.4309432476381712,
"ce_q3": 0.40832054332087314,
"ppl_q3": 1.5104784844796868,
"ce_q4": 0.47846151039570195,
"ppl_q4": 1.623000833052623,
"duration": 363.99295449256897
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 1.3027846738621593,
"ce": 0.3782431591376662,
"ppl": 1.4659199578762054,
"ce_q1": 0.2969039410613477,
"ppl_q1": 1.3493805121183395,
"ce_q2": 0.34252556386962535,
"ppl_q2": 1.4133179208040239,
"ce_q3": 0.4013441359847784,
"ppl_q3": 1.501078657746315,
"ce_q4": 0.47219899725914,
"ppl_q4": 1.6146215254068375,
"duration": 9648.554844141006
},
"valid": {
"ce": 0.34699366515195823,
"ppl": 1.4197162238857415,
"ce_q1": 0.26978387730785564,
"ppl_q1": 1.3128716945648193,
"ce_q2": 0.31475139550770387,
"ppl_q2": 1.3738903229749655,
"ce_q3": 0.3679725367434417,
"ppl_q3": 1.4502526084079017,
"ce_q4": 0.43546685236918775,
"ppl_q4": 1.5540713524516625,
"duration": 363.93863797187805
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 1.0682765308991073,
"ce": 0.35051629208773377,
"ppl": 1.4252898921966553,
"ce_q1": 0.2686901425383985,
"ppl_q1": 1.3113990955948829,
"ce_q2": 0.31552755162119867,
"ppl_q2": 1.3753161788582802,
"ce_q3": 0.37402332600206134,
"ppl_q3": 1.4600041140317916,
"ce_q4": 0.4438241482302546,
"ppl_q4": 1.5685892715454102,
"duration": 9649.992606163025
},
"valid": {
"ce": 0.32724237743812273,
"ppl": 1.3915840145907825,
"ce_q1": 0.24782562444481668,
"ppl_q1": 1.2839867570732213,
"ce_q2": 0.2951959688452226,
"ppl_q2": 1.3469665367392045,
"ce_q3": 0.34943927484977094,
"ppl_q3": 1.423286943496028,
"ce_q4": 0.41650864557374884,
"ppl_q4": 1.5244485185116152,
"duration": 364.2623555660248
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9062350554391742,
"ce": 0.33277938460931183,
"ppl": 1.3996739456653595,
"ce_q1": 0.2489357072636485,
"ppl_q1": 1.2853037230372428,
"ce_q2": 0.29807595055550334,
"ppl_q2": 1.3510140706300735,
"ce_q3": 0.3579772567413747,
"ppl_q3": 1.4362133738994598,
"ce_q4": 0.4261286235898733,
"ppl_q4": 1.5402889256477357,
"duration": 9648.130340576172
},
"valid": {
"ce": 0.3147100759080694,
"ppl": 1.3739739233934427,
"ce_q1": 0.2329047514667994,
"ppl_q1": 1.2647000173979168,
"ce_q2": 0.2826218190072458,
"ppl_q2": 1.3298912576482267,
"ce_q3": 0.3380027720822564,
"ppl_q3": 1.406846349752402,
"ce_q4": 0.4053109520221058,
"ppl_q4": 1.5071273800692981,
"duration": 364.70765686035156
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8160633453838527,
"ce": 0.32220307441055773,
"ppl": 1.3845142503976822,
"ce_q1": 0.23596069633774458,
"ppl_q1": 1.2684047619104386,
"ce_q2": 0.28701483193412425,
"ppl_q2": 1.3358310987353326,
"ce_q3": 0.34841247890517113,
"ppl_q3": 1.4220430172085763,
"ce_q4": 0.41742429112270474,
"ppl_q4": 1.5263461983203888,
"duration": 9692.624699831009
},
"valid": {
"ce": 0.30420554778243925,
"ppl": 1.3594117843652074,
"ce_q1": 0.22103732060405273,
"ppl_q1": 1.2495773110208632,
"ce_q2": 0.27224719845041445,
"ppl_q2": 1.3159875794302058,
"ce_q3": 0.3283630643464342,
"ppl_q3": 1.3931568830828123,
"ce_q4": 0.3951746132932132,
"ppl_q4": 1.4916874834253817,
"duration": 369.0870785713196
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7958583693131804,
"ce": 0.3171371899656951,
"ppl": 1.3774234347939491,
"ce_q1": 0.22851442461833357,
"ppl_q1": 1.2588756356835364,
"ce_q2": 0.28210394644364717,
"ppl_q2": 1.3291933022141456,
"ce_q3": 0.3442181306555867,
"ppl_q3": 1.416022645831108,
"ce_q4": 0.41371225610747936,
"ppl_q4": 1.5206376270651818,
"duration": 9762.89295744896
},
"valid": {
"ce": 0.2970876716360261,
"ppl": 1.34960645059996,
"ce_q1": 0.21255999331987357,
"ppl_q1": 1.2388748156873486,
"ce_q2": 0.26519824168350126,
"ppl_q2": 1.3066016707239272,
"ce_q3": 0.3218034285156033,
"ppl_q3": 1.383894911295251,
"ce_q4": 0.38878902377961555,
"ppl_q4": 1.4819832376286954,
"duration": 367.2382125854492
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6960099772140383,
"ce": 0.30420715733245013,
"ppl": 1.3594656380414962,
"ce_q1": 0.21638601769134402,
"ppl_q1": 1.2435167224407195,
"ce_q2": 0.2696109323315322,
"ppl_q2": 1.312455210864544,
"ce_q3": 0.3314019359536469,
"ppl_q3": 1.3977243483662605,
"ce_q4": 0.3994297444149852,
"ppl_q4": 1.4986227390766145,
"duration": 9715.029719114304
},
"valid": {
"ce": 0.2905795821283437,
"ppl": 1.3407156723964064,
"ce_q1": 0.20514852742228326,
"ppl_q1": 1.2296004612234575,
"ce_q2": 0.258691531004785,
"ppl_q2": 1.2980141745337956,
"ce_q3": 0.3158856319098533,
"ppl_q3": 1.3756032654001742,
"ce_q4": 0.3825926384593867,
"ppl_q4": 1.472645480421525,
"duration": 367.7969195842743
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6388504648953677,
"ce": 0.30012047858908775,
"ppl": 1.353954707980156,
"ce_q1": 0.2106539978440851,
"ppl_q1": 1.2363694159984588,
"ce_q2": 0.26583316499739884,
"ppl_q2": 1.307574811577797,
"ce_q3": 0.3279107775203884,
"ppl_q3": 1.3928812025785446,
"ce_q4": 0.39608397559076547,
"ppl_q4": 1.4937362524867057,
"duration": 9720.47579050064
},
"valid": {
"ce": 0.28552053642423847,
"ppl": 1.3338418565218961,
"ce_q1": 0.19924037516871584,
"ppl_q1": 1.2222560070738007,
"ce_q2": 0.25374761110619654,
"ppl_q2": 1.2915204989759228,
"ce_q3": 0.3112158682904666,
"ppl_q3": 1.369094812417332,
"ce_q4": 0.37787828585015065,
"ppl_q4": 1.4655752000929434,
"duration": 367.7100245952606
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6235386055484414,
"ce": 0.2924809884876013,
"ppl": 1.3434701552391053,
"ce_q1": 0.20310996603965759,
"ppl_q1": 1.22693498057127,
"ce_q2": 0.2580702159292996,
"ppl_q2": 1.2972542500495912,
"ce_q3": 0.32043501345813274,
"ppl_q3": 1.3823249989748,
"ce_q4": 0.3883087599426508,
"ppl_q4": 1.4819999898076057,
"duration": 9698.74122428894
},
"valid": {
"ce": 0.28094224386577366,
"ppl": 1.3276541912103001,
"ce_q1": 0.1938464087964613,
"ppl_q1": 1.2155920493451855,
"ce_q2": 0.2491917037699796,
"ppl_q2": 1.285567599006846,
"ce_q3": 0.30707791108119337,
"ppl_q3": 1.3633532614647588,
"ce_q4": 0.37365295822861827,
"ppl_q4": 1.4592749212361589,
"duration": 367.3377423286438
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5876407694742084,
"ce": 0.2887481169402599,
"ppl": 1.3383552740216256,
"ce_q1": 0.19843788331374526,
"ppl_q1": 1.2211602177619933,
"ce_q2": 0.25461827327869835,
"ppl_q2": 1.2926731531620026,
"ce_q3": 0.3171204995252192,
"ppl_q3": 1.377650060415268,
"ce_q4": 0.38481581097096207,
"ppl_q4": 1.4766370559334754,
"duration": 9717.98500752449
},
"valid": {
"ce": 0.2786048092419588,
"ppl": 1.324477858181241,
"ce_q1": 0.19018569767852372,
"ppl_q1": 1.2110804108124744,
"ce_q2": 0.2471336680877058,
"ppl_q2": 1.2828661927694007,
"ce_q3": 0.305224463154998,
"ppl_q3": 1.3607573494126526,
"ce_q4": 0.3718754134223431,
"ppl_q4": 1.456569484517544,
"duration": 370.4252426624298
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5885659677907824,
"ce": 0.28598406685143707,
"ppl": 1.334572199881077,
"ce_q1": 0.19475941846705974,
"ppl_q1": 1.216597157895565,
"ce_q2": 0.2518067127354443,
"ppl_q2": 1.288983304440975,
"ce_q3": 0.31456935868039726,
"ppl_q3": 1.3740696684718132,
"ce_q4": 0.38280077784135935,
"ppl_q4": 1.473509496152401,
"duration": 9734.229039430618
},
"valid": {
"ce": 0.273724911710884,
"ppl": 1.317958207070073,
"ce_q1": 0.1852767831539806,
"ppl_q1": 1.2050870928583266,
"ce_q2": 0.2420956643321846,
"ppl_q2": 1.2763538405865054,
"ce_q3": 0.3005852057963987,
"ppl_q3": 1.3543842412248444,
"ce_q4": 0.36694199771066255,
"ppl_q4": 1.4493156083022491,
"duration": 368.0145206451416
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5636666735336184,
"ce": 0.28117746782302855,
"ppl": 1.327986912548542,
"ce_q1": 0.19029672830551864,
"ppl_q1": 1.211112559556961,
"ce_q2": 0.247117908898741,
"ppl_q2": 1.2828307807445527,
"ce_q3": 0.30988553999736906,
"ppl_q3": 1.3673929714560509,
"ce_q4": 0.3774096945002675,
"ppl_q4": 1.4651751166582108,
"duration": 9727.160143852234
},
"valid": {
"ce": 0.27079825291905224,
"ppl": 1.3140449931349936,
"ce_q1": 0.1818210709887215,
"ppl_q1": 1.2008746877501282,
"ce_q2": 0.23923172339608398,
"ppl_q2": 1.2726502795762653,
"ce_q3": 0.29776253372053557,
"ppl_q3": 1.3505052675174762,
"ce_q4": 0.3643776838538013,
"ppl_q4": 1.4455288286450543,
"duration": 369.49280071258545
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5610072636976838,
"ce": 0.2791029617264867,
"ppl": 1.324917121231556,
"ce_q1": 0.18736792962439358,
"ppl_q1": 1.2074093613624572,
"ce_q2": 0.24472872881032526,
"ppl_q2": 1.2795293309092521,
"ce_q3": 0.30828770226985214,
"ppl_q3": 1.364835150539875,
"ce_q4": 0.3760274866335094,
"ppl_q4": 1.4625834981799126,
"duration": 9589.747070789337
},
"valid": {
"ce": 0.26752446007124986,
"ppl": 1.3096886646898487,
"ce_q1": 0.17828437308721903,
"ppl_q1": 1.1965842382817329,
"ce_q2": 0.2359432058432434,
"ppl_q2": 1.2684225462660004,
"ce_q3": 0.29481099376195596,
"ppl_q3": 1.3464636576326587,
"ce_q4": 0.3610592697617374,
"ppl_q4": 1.440651973591575,
"duration": 362.9212381839752
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5372919216901064,
"ce": 0.27363305720314385,
"ppl": 1.3180202004313468,
"ce_q1": 0.18223593309149147,
"ppl_q1": 1.2013322665691375,
"ce_q2": 0.23964484233036637,
"ppl_q2": 1.2732633963823319,
"ce_q3": 0.30300518334284426,
"ppl_q3": 1.35809545814991,
"ce_q4": 0.36964626945927737,
"ppl_q4": 1.4539588932394982,
"duration": 9552.291424036026
},
"valid": {
"ce": 0.2650467896763283,
"ppl": 1.3063968676555007,
"ce_q1": 0.17553420921292487,
"ppl_q1": 1.193257446530499,
"ce_q2": 0.23342637029252475,
"ppl_q2": 1.2651877810683432,
"ce_q3": 0.29254751360114617,
"ppl_q3": 1.3433695699595198,
"ce_q4": 0.3586790639011166,
"ppl_q4": 1.4371557311166692,
"duration": 362.29028248786926
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5495444314219058,
"ce": 0.27388937419652937,
"ppl": 1.3182142223715783,
"ce_q1": 0.1811916080005467,
"ppl_q1": 1.200001169502735,
"ce_q2": 0.23959608913213015,
"ppl_q2": 1.2730867872834206,
"ce_q3": 0.3036364871356636,
"ppl_q3": 1.3587735990285874,
"ce_q4": 0.3711333122625947,
"ppl_q4": 1.455910117983818,
"duration": 9593.252102851868
},
"valid": {
"ce": 0.26282770837409586,
"ppl": 1.3034598193591154,
"ce_q1": 0.17277015226928494,
"ppl_q1": 1.1899251273915739,
"ce_q2": 0.2312564604644534,
"ppl_q2": 1.2624108082131495,
"ce_q3": 0.2905317946702619,
"ppl_q3": 1.3406218637394,
"ce_q4": 0.35675242920465106,
"ppl_q4": 1.4343435643594475,
"duration": 361.60309290885925
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5303192440792919,
"ce": 0.27048247469216585,
"ppl": 1.3137510415911675,
"ce_q1": 0.17822546218335628,
"ppl_q1": 1.1964569752216339,
"ce_q2": 0.23647218051552774,
"ppl_q2": 1.2691548042297363,
"ce_q3": 0.2999941988699138,
"ppl_q3": 1.3538470923900605,
"ce_q4": 0.36723805651068686,
"ppl_q4": 1.4502512238621712,
"duration": 9601.733191490173
},
"valid": {
"ce": 0.2607708179120776,
"ppl": 1.300733493853219,
"ce_q1": 0.17010203711216962,
"ppl_q1": 1.186716251735446,
"ce_q2": 0.22927546699213075,
"ppl_q2": 1.2598709954491145,
"ce_q3": 0.2884308844804764,
"ppl_q3": 1.3377633547481103,
"ce_q4": 0.35527488268628904,
"ppl_q4": 1.4321544864509679,
"duration": 362.8330523967743
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5436296821683645,
"ce": 0.27080439947731794,
"ppl": 1.3140050785541535,
"ce_q1": 0.17712718484923243,
"ppl_q1": 1.1950417374372482,
"ce_q2": 0.2365416384395212,
"ppl_q2": 1.2691017340421678,
"ce_q3": 0.30075699695944785,
"ppl_q3": 1.3546714680194856,
"ce_q4": 0.36879177782684563,
"ppl_q4": 1.4522535247206687,
"duration": 9603.792863368988
},
"valid": {
"ce": 0.25855125034157234,
"ppl": 1.2978112154369112,
"ce_q1": 0.16785943555303767,
"ppl_q1": 1.1840270546418201,
"ce_q2": 0.22702152498915226,
"ppl_q2": 1.2570037253295319,
"ce_q3": 0.28658432390870925,
"ppl_q3": 1.3352524117578435,
"ce_q4": 0.3527397136145,
"ppl_q4": 1.4284764648992805,
"duration": 362.80742144584656
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5256168953180314,
"ce": 0.26701043706387284,
"ppl": 1.309049612879753,
"ce_q1": 0.17353531206399203,
"ppl_q1": 1.1907625480890274,
"ce_q2": 0.2330456952676177,
"ppl_q2": 1.264704429924488,
"ce_q3": 0.29685995550081135,
"ppl_q3": 1.3494563950300216,
"ce_q4": 0.3646007853522897,
"ppl_q4": 1.4461578189730644,
"duration": 9513.590850114822
},
"valid": {
"ce": 0.2564406213881094,
"ppl": 1.29503724695761,
"ce_q1": 0.1656135074511359,
"ppl_q1": 1.181341039983532,
"ce_q2": 0.22491439733701415,
"ppl_q2": 1.2543214182310467,
"ce_q3": 0.2845413771611226,
"ppl_q3": 1.3324900020526935,
"ce_q4": 0.3506932043576542,
"ppl_q4": 1.4255086832408663,
"duration": 359.1641058921814
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5397710645273328,
"ce": 0.2670633195117116,
"ppl": 1.3092050889134408,
"ce_q1": 0.1732292026989162,
"ppl_q1": 1.1904190055131911,
"ce_q2": 0.23342717848345637,
"ppl_q2": 1.265246787428856,
"ce_q3": 0.2967667815387249,
"ppl_q3": 1.3493901955485343,
"ce_q4": 0.3648301157876849,
"ppl_q4": 1.4467548802495003,
"duration": 9521.433192968369
},
"valid": {
"ce": 0.2550391122887406,
"ppl": 1.2931905924519407,
"ce_q1": 0.16405439093897614,
"ppl_q1": 1.1794758657865887,
"ce_q2": 0.223558688465553,
"ppl_q2": 1.252597516096091,
"ce_q3": 0.2832572328138955,
"ppl_q3": 1.3307468830784666,
"ce_q4": 0.3492861380682716,
"ppl_q4": 1.4234507581855678,
"duration": 359.73581171035767
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5273035378232598,
"ce": 0.26412027855589987,
"ppl": 1.3050647683739662,
"ce_q1": 0.17033208943344652,
"ppl_q1": 1.1868622980713843,
"ce_q2": 0.23045820822194218,
"ppl_q2": 1.2612539411187171,
"ce_q3": 0.2938903398439288,
"ppl_q3": 1.345190036058426,
"ce_q4": 0.3618004768565297,
"ppl_q4": 1.4417528423070907,
"duration": 9522.932149648666
},
"valid": {
"ce": 0.2535136636299423,
"ppl": 1.2911919325212888,
"ce_q1": 0.16210570789967912,
"ppl_q1": 1.177155189876315,
"ce_q2": 0.22193231075247632,
"ppl_q2": 1.2505319556103478,
"ce_q3": 0.2818804366301887,
"ppl_q3": 1.328893451751033,
"ce_q4": 0.34813620074640345,
"ppl_q4": 1.4217831047275398,
"duration": 359.9517922401428
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5358553732335567,
"ce": 0.26297346629202367,
"ppl": 1.3035757108926773,
"ce_q1": 0.16872410270012916,
"ppl_q1": 1.1849369418025018,
"ce_q2": 0.22899346644431354,
"ppl_q2": 1.25940067589283,
"ce_q3": 0.29335827129706743,
"ppl_q3": 1.3444820920825005,
"ce_q4": 0.36081802381575107,
"ppl_q4": 1.440412820994854,
"duration": 9520.848494291306
},
"valid": {
"ce": 0.2524017829306518,
"ppl": 1.2897216911557354,
"ce_q1": 0.16064767765847943,
"ppl_q1": 1.1754137911374056,
"ce_q2": 0.2205624820876725,
"ppl_q2": 1.2487894251376768,
"ce_q3": 0.2810051771281641,
"ppl_q3": 1.3276908382584778,
"ce_q4": 0.34739179758331445,
"ppl_q4": 1.4206779757632484,
"duration": 359.9456934928894
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5356026580929756,
"ce": 0.2597531125359237,
"ppl": 1.299555616736412,
"ce_q1": 0.16579502180311828,
"ppl_q1": 1.1815283535718917,
"ce_q2": 0.22548220401629807,
"ppl_q2": 1.2551070806384086,
"ce_q3": 0.29003081101924183,
"ppl_q3": 1.3402505736351014,
"ce_q4": 0.35770441375114026,
"ppl_q4": 1.4363294315338135,
"duration": 9517.163825035095
},
"valid": {
"ce": 0.25014522898046276,
"ppl": 1.2867922284935094,
"ce_q1": 0.1584996507514881,
"ppl_q1": 1.1728712320327759,
"ce_q2": 0.21853658047657978,
"ppl_q2": 1.2462464389921744,
"ce_q3": 0.2786373801623719,
"ppl_q3": 1.3245291151577914,
"ce_q4": 0.34490730641763423,
"ppl_q4": 1.417119739930841,
"duration": 360.22341680526733
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5350262980908156,
"ce": 0.25812198682129384,
"ppl": 1.2972108287215234,
"ce_q1": 0.1639258794002235,
"ppl_q1": 1.1792037620544433,
"ce_q2": 0.2241402559094131,
"ppl_q2": 1.2532524604201316,
"ce_q3": 0.2885113680884242,
"ppl_q3": 1.3379627665281295,
"ce_q4": 0.3559104430042207,
"ppl_q4": 1.4333122403025627,
"duration": 9526.316365480423
},
"valid": {
"ce": 0.2493405983417849,
"ppl": 1.285740259327466,
"ce_q1": 0.15726630408552628,
"ppl_q1": 1.1714072031310843,
"ce_q2": 0.21789310561327996,
"ppl_q2": 1.2454326590405236,
"ce_q3": 0.2779476395513438,
"ppl_q3": 1.323596076120304,
"ce_q4": 0.3442553402502326,
"ppl_q4": 1.4161833720871164,
"duration": 359.8578016757965
},
"evaluate": {
"duration": 0.00048089027404785156
},
"generate": {
"rtf": 0.1425724983215332,
"duration": 7.397846221923828
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5344072869345545,
"ce": 0.25534614687785506,
"ppl": 1.2935579895377158,
"ce_q1": 0.16182335501164197,
"ppl_q1": 1.1767336027622224,
"ce_q2": 0.2219313066508621,
"ppl_q2": 1.2504770302176476,
"ce_q3": 0.2851938751935959,
"ppl_q3": 1.3333959483504296,
"ce_q4": 0.3524360497109592,
"ppl_q4": 1.428145908176899,
"duration": 9505.303801774979
},
"valid": {
"ce": 0.24762491240531584,
"ppl": 1.2835041028034837,
"ce_q1": 0.15565845558914956,
"ppl_q1": 1.169505753094637,
"ce_q2": 0.2159623706453963,
"ppl_q2": 1.2429962746704681,
"ce_q3": 0.2763731054301503,
"ppl_q3": 1.321482249453098,
"ce_q4": 0.3425057111661645,
"ppl_q4": 1.4136614105369472,
"duration": 359.8410291671753
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5475789905637503,
"ce": 0.2557172976210713,
"ppl": 1.2941320454478265,
"ce_q1": 0.1614206156115979,
"ppl_q1": 1.1762497451901437,
"ce_q2": 0.22231142236292362,
"ppl_q2": 1.250964602291584,
"ce_q3": 0.2860571291409433,
"ppl_q3": 1.3347246972322464,
"ce_q4": 0.35308002268895505,
"ppl_q4": 1.4293945796489715,
"duration": 9515.96857047081
},
"valid": {
"ce": 0.24678222052281415,
"ppl": 1.2824011497859713,
"ce_q1": 0.1545967455906204,
"ppl_q1": 1.168249379230451,
"ce_q2": 0.21509166854091838,
"ppl_q2": 1.2418932673297352,
"ce_q3": 0.27556955597445937,
"ppl_q3": 1.3203984076463724,
"ce_q4": 0.3418709149089041,
"ppl_q4": 1.4127335910555683,
"duration": 359.51284098625183
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.544369428113103,
"ce": 0.25431034310162065,
"ppl": 1.292094294011593,
"ce_q1": 0.15954916645772754,
"ppl_q1": 1.1739847147464753,
"ce_q2": 0.22019167565554382,
"ppl_q2": 1.2481818380951881,
"ce_q3": 0.2850243282802403,
"ppl_q3": 1.3330603014230729,
"ce_q4": 0.3524762026928365,
"ppl_q4": 1.4280194517970086,
"duration": 9521.965310811996
},
"valid": {
"ce": 0.24541866647291788,
"ppl": 1.2806246129772332,
"ce_q1": 0.15318822115659714,
"ppl_q1": 1.166583023493803,
"ce_q2": 0.2138220927194704,
"ppl_q2": 1.2402959367896937,
"ce_q3": 0.274175078902818,
"ppl_q3": 1.3185257338270355,
"ce_q4": 0.3404892788657659,
"ppl_q4": 1.410742003706437,
"duration": 360.1158468723297
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5704672664999962,
"ce": 0.2547891466207802,
"ppl": 1.292769466817379,
"ce_q1": 0.15965367713570594,
"ppl_q1": 1.174122365295887,
"ce_q2": 0.22078421056643127,
"ppl_q2": 1.2489683644771576,
"ce_q3": 0.28512962044030427,
"ppl_q3": 1.3332771819233895,
"ce_q4": 0.35358907787129285,
"ppl_q4": 1.4297208489179611,
"duration": 9536.582916736603
},
"valid": {
"ce": 0.2451463624646392,
"ppl": 1.2802674423290203,
"ce_q1": 0.1526368566894833,
"ppl_q1": 1.1659329571301424,
"ce_q2": 0.21365947417820555,
"ppl_q2": 1.240086910090869,
"ce_q3": 0.27400606361371055,
"ppl_q3": 1.318293100670923,
"ce_q4": 0.34028305924391444,
"ppl_q4": 1.4104415902608558,
"duration": 361.07709193229675
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5519527767598629,
"ce": 0.25307825837656855,
"ppl": 1.290546900510788,
"ce_q1": 0.15773487233929337,
"ppl_q1": 1.17184512424469,
"ce_q2": 0.21900815995037556,
"ppl_q2": 1.2467407024502755,
"ce_q3": 0.28379577936604616,
"ppl_q3": 1.3314958873391152,
"ce_q4": 0.3517742223292589,
"ppl_q4": 1.4271460437178611,
"duration": 9517.157433271408
},
"valid": {
"ce": 0.2433236206445513,
"ppl": 1.2779125956040394,
"ce_q1": 0.15054505723941175,
"ppl_q1": 1.1634739486477044,
"ce_q2": 0.2116720311437981,
"ppl_q2": 1.2376048549821106,
"ce_q3": 0.27243701198810266,
"ppl_q3": 1.3162088952487028,
"ce_q4": 0.338640377302713,
"ppl_q4": 1.408096657523626,
"duration": 360.1750862598419
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5535622903853655,
"ce": 0.25230341647937893,
"ppl": 1.2895389752984048,
"ce_q1": 0.15685477450862526,
"ppl_q1": 1.1707977665662765,
"ce_q2": 0.21831004438921808,
"ppl_q2": 1.2458406186699866,
"ce_q3": 0.28324105164036156,
"ppl_q3": 1.3307670249938965,
"ce_q4": 0.35080779671669005,
"ppl_q4": 1.4258026565909385,
"duration": 9515.998623132706
},
"valid": {
"ce": 0.24243429538947117,
"ppl": 1.276759606373461,
"ce_q1": 0.14961987177405175,
"ppl_q1": 1.162385119667536,
"ce_q2": 0.21068576440403733,
"ppl_q2": 1.2363704563696174,
"ce_q3": 0.2715654976760285,
"ppl_q3": 1.3150421818600426,
"ce_q4": 0.33786605600314806,
"ppl_q4": 1.406982400749303,
"duration": 359.7568485736847
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5734196212291718,
"ce": 0.2512887836024165,
"ppl": 1.2882268325686455,
"ce_q1": 0.1558698156978935,
"ppl_q1": 1.1696524586081505,
"ce_q2": 0.21735065659880637,
"ppl_q2": 1.2446533225774765,
"ce_q3": 0.28217829593643545,
"ppl_q3": 1.3293246050477028,
"ce_q4": 0.34975636619329453,
"ppl_q4": 1.4242641864418983,
"duration": 9525.4554002285
},
"valid": {
"ce": 0.24138385312089436,
"ppl": 1.2753967393802692,
"ce_q1": 0.14845384346156182,
"ppl_q1": 1.1610137782519376,
"ce_q2": 0.2096489432114589,
"ppl_q2": 1.235067696510991,
"ce_q3": 0.27045898733637,
"ppl_q3": 1.3135651199123528,
"ce_q4": 0.33697363771969757,
"ppl_q4": 1.4057027840916114,
"duration": 359.8495628833771
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5840627053380012,
"ce": 0.2517865260466933,
"ppl": 1.2890241292715072,
"ce_q1": 0.15549812090583146,
"ppl_q1": 1.169280726313591,
"ce_q2": 0.217613572595641,
"ppl_q2": 1.2451145648956299,
"ce_q3": 0.2828731698282063,
"ppl_q3": 1.3304364619255067,
"ce_q4": 0.3511612404361367,
"ppl_q4": 1.426550364792347,
"duration": 9522.250625610352
},
"valid": {
"ce": 0.24041013872321648,
"ppl": 1.2741427768634845,
"ce_q1": 0.14732468778951258,
"ppl_q1": 1.159694943246962,
"ce_q2": 0.20880817546497418,
"ppl_q2": 1.234016806264467,
"ce_q3": 0.2696859886563277,
"ppl_q3": 1.3125430752959433,
"ce_q4": 0.3358217015673843,
"ppl_q4": 1.4040598190283473,
"duration": 360.85492873191833
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5932098316699267,
"ce": 0.24997816063836217,
"ppl": 1.2865897563099862,
"ce_q1": 0.1538148140460253,
"ppl_q1": 1.1672510678768158,
"ce_q2": 0.21599062044918538,
"ppl_q2": 1.24297774964571,
"ce_q3": 0.2811757633052766,
"ppl_q3": 1.328074213206768,
"ce_q4": 0.3489314452596009,
"ppl_q4": 1.4232663878798484,
"duration": 9530.121540307999
},
"valid": {
"ce": 0.2395599106255966,
"ppl": 1.2730484069148196,
"ce_q1": 0.1465721991431864,
"ppl_q1": 1.1588151590733589,
"ce_q2": 0.2078702820441391,
"ppl_q2": 1.2328497261940679,
"ce_q3": 0.2687099756130689,
"ppl_q3": 1.3112452694132357,
"ce_q4": 0.3350871848531916,
"ppl_q4": 1.4030167573614964,
"duration": 360.1522071361542
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.5956792443618179,
"ce": 0.24838823240995406,
"ppl": 1.2844244130253792,
"ce_q1": 0.1525679118419066,
"ppl_q1": 1.165747564971447,
"ce_q2": 0.21478954068757594,
"ppl_q2": 1.241436672747135,
"ce_q3": 0.2792185950372368,
"ppl_q3": 1.325300565481186,
"ce_q4": 0.3469768827762455,
"ppl_q4": 1.4201808007359504,
"duration": 9524.631300210953
},
"valid": {
"ce": 0.23872524367857584,
"ppl": 1.2719671816765508,
"ce_q1": 0.14549196266298053,
"ppl_q1": 1.157549474812761,
"ce_q2": 0.20708231590216672,
"ppl_q2": 1.2318618765360192,
"ce_q3": 0.2680366391999812,
"ppl_q3": 1.3103452996362615,
"ce_q4": 0.33429006496562236,
"ppl_q4": 1.401870223540294,
"duration": 359.5872597694397
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6259121421352029,
"ce": 0.2509105849824846,
"ppl": 1.2876138908863068,
"ce_q1": 0.15371049094200134,
"ppl_q1": 1.1670769104957581,
"ce_q2": 0.21673321747034788,
"ppl_q2": 1.2437935125231743,
"ce_q3": 0.2821627798490226,
"ppl_q3": 1.3291475368738175,
"ce_q4": 0.3510358522422612,
"ppl_q4": 1.4258298891782761,
"duration": 9531.088446617126
},
"valid": {
"ce": 0.23873222949384135,
"ppl": 1.2719656938238988,
"ce_q1": 0.1450868081065673,
"ppl_q1": 1.157067700277401,
"ce_q2": 0.2068327178683462,
"ppl_q2": 1.2315466162524646,
"ce_q3": 0.26822042418054387,
"ppl_q3": 1.310575492774384,
"ce_q4": 0.3347889731956434,
"ppl_q4": 1.4025674107708508,
"duration": 360.09592270851135
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6269686085805297,
"ce": 0.24783911228738725,
"ppl": 1.2838349602222443,
"ce_q1": 0.1516694893669337,
"ppl_q1": 1.1647503933906556,
"ce_q2": 0.21395725398883222,
"ppl_q2": 1.2404760385155678,
"ce_q3": 0.27887285071611406,
"ppl_q3": 1.324999911546707,
"ce_q4": 0.34685685462504623,
"ppl_q4": 1.420261112689972,
"duration": 9533.307350635529
},
"valid": {
"ce": 0.23706307743169083,
"ppl": 1.269828897488268,
"ce_q1": 0.1434131178863441,
"ppl_q1": 1.155119308942481,
"ce_q2": 0.20534558792280244,
"ppl_q2": 1.2297039650663544,
"ce_q3": 0.2666156414566161,
"ppl_q3": 1.3084602506854865,
"ce_q4": 0.33287796566757977,
"ppl_q4": 1.399867706660983,
"duration": 360.5455119609833
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6271612166985869,
"ce": 0.24786986844241618,
"ppl": 1.283757869064808,
"ce_q1": 0.15094023028761147,
"ppl_q1": 1.1638670492768288,
"ce_q2": 0.21374938612803818,
"ppl_q2": 1.240128959774971,
"ce_q3": 0.2793254300914705,
"ppl_q3": 1.3254130818247796,
"ce_q4": 0.3474644286036491,
"ppl_q4": 1.42090361058712,
"duration": 9529.41432762146
},
"valid": {
"ce": 0.2368563413619995,
"ppl": 1.269559409044966,
"ce_q1": 0.14331292964612383,
"ppl_q1": 1.1550041120263594,
"ce_q2": 0.20511469556183753,
"ppl_q2": 1.2294130943998505,
"ce_q3": 0.2663348641576646,
"ppl_q3": 1.3080807260320158,
"ce_q4": 0.3326628698578364,
"ppl_q4": 1.3995511727997019,
"duration": 360.76744651794434
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6385511268824339,
"ce": 0.24584784270077945,
"ppl": 1.2811622342467308,
"ce_q1": 0.1497510178461671,
"ppl_q1": 1.1624547756314279,
"ce_q2": 0.21202525600045918,
"ppl_q2": 1.237964022397995,
"ce_q3": 0.2768012195788324,
"ppl_q3": 1.3221359432935715,
"ce_q4": 0.3448138787560165,
"ppl_q4": 1.4171970781087875,
"duration": 9524.562409877777
},
"valid": {
"ce": 0.23563965966429892,
"ppl": 1.2679976028732107,
"ce_q1": 0.1418514523325087,
"ppl_q1": 1.1533005026322376,
"ce_q2": 0.20397380305619178,
"ppl_q2": 1.2279938942269435,
"ce_q3": 0.26519738232033163,
"ppl_q3": 1.306580148165739,
"ce_q4": 0.3315360000993632,
"ppl_q4": 1.397956037823158,
"duration": 360.3846733570099
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6360174294635653,
"ce": 0.24407700955867767,
"ppl": 1.2787973175644876,
"ce_q1": 0.1479816423766315,
"ppl_q1": 1.1603798078298568,
"ce_q2": 0.21035069748945534,
"ppl_q2": 1.2358509694933892,
"ce_q3": 0.2752209755368531,
"ppl_q3": 1.3198883423805237,
"ce_q4": 0.3427547232396901,
"ppl_q4": 1.414001984000206,
"duration": 9642.434718847275
},
"valid": {
"ce": 0.23524645197240612,
"ppl": 1.2674962236911436,
"ce_q1": 0.14150380003678648,
"ppl_q1": 1.1528948122941995,
"ce_q2": 0.2034214210661152,
"ppl_q2": 1.2273095393482643,
"ce_q3": 0.26484976482542255,
"ppl_q3": 1.3061266865911363,
"ce_q4": 0.3312108271484134,
"ppl_q4": 1.3975031707860246,
"duration": 385.52757596969604
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6409649724066258,
"ce": 0.2456396240890026,
"ppl": 1.2808832069635392,
"ce_q1": 0.14883658679947256,
"ppl_q1": 1.1613854657411575,
"ce_q2": 0.21165752100199461,
"ppl_q2": 1.2375192747712136,
"ce_q3": 0.27659394700825213,
"ppl_q3": 1.3218081101179122,
"ce_q4": 0.3454704398550093,
"ppl_q4": 1.4180844410657882,
"duration": 9668.847463130951
},
"valid": {
"ce": 0.23525820766823202,
"ppl": 1.2674960909010489,
"ce_q1": 0.14089244924768618,
"ppl_q1": 1.1521821595445465,
"ce_q2": 0.20362399593938754,
"ppl_q2": 1.2275536452667624,
"ce_q3": 0.26465610311001164,
"ppl_q3": 1.3058527406257918,
"ce_q4": 0.33186028124410893,
"ppl_q4": 1.3983763637422006,
"duration": 363.28456354141235
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.664245718382299,
"ce": 0.243544303458184,
"ppl": 1.2781934062242508,
"ce_q1": 0.14736363627016544,
"ppl_q1": 1.1596874266862869,
"ce_q2": 0.21001652750186622,
"ppl_q2": 1.235504131793976,
"ce_q3": 0.2746094092391431,
"ppl_q3": 1.319182243347168,
"ce_q4": 0.34218764064088464,
"ppl_q4": 1.4133317279219628,
"duration": 9572.143107414246
},
"valid": {
"ce": 0.23389616495446314,
"ppl": 1.2657610811764681,
"ce_q1": 0.139870255148109,
"ppl_q1": 1.1509948078590104,
"ce_q2": 0.2021081698468969,
"ppl_q2": 1.2256792979904367,
"ce_q3": 0.2635032166785832,
"ppl_q3": 1.3043419137785706,
"ce_q4": 0.3301030240858657,
"ppl_q4": 1.3959188385854793,
"duration": 362.07116055488586
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6577543443962932,
"ce": 0.24355571600049733,
"ppl": 1.2783152058720588,
"ce_q1": 0.14672903286665678,
"ppl_q1": 1.1589760918021201,
"ce_q2": 0.2094849065374583,
"ppl_q2": 1.234888660490513,
"ce_q3": 0.2749556212387979,
"ppl_q3": 1.3197916320562362,
"ce_q4": 0.34305330453068017,
"ppl_q4": 1.4148812156915664,
"duration": 9564.110896110535
},
"valid": {
"ce": 0.23368493410982663,
"ppl": 1.265483186214785,
"ce_q1": 0.13961451047960716,
"ppl_q1": 1.1506915846957435,
"ce_q2": 0.20201391208020947,
"ppl_q2": 1.2255540346797509,
"ce_q3": 0.26324535349879086,
"ppl_q3": 1.3039913298208503,
"ce_q4": 0.3298659656621233,
"ppl_q4": 1.395579461809955,
"duration": 362.3992705345154
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6778192021995783,
"ce": 0.2440447256192565,
"ppl": 1.2787858218550683,
"ce_q1": 0.14691940317675473,
"ppl_q1": 1.1591414462924003,
"ce_q2": 0.2097668897304684,
"ppl_q2": 1.2351483046412468,
"ce_q3": 0.2754211965985596,
"ppl_q3": 1.3201775425076485,
"ce_q4": 0.3440714124441147,
"ppl_q4": 1.4159864671826363,
"duration": 9545.63279247284
},
"valid": {
"ce": 0.2326044343128989,
"ppl": 1.2641042229495472,
"ce_q1": 0.1384782603458513,
"ppl_q1": 1.1493786392332632,
"ce_q2": 0.20091355592012405,
"ppl_q2": 1.2241957821423495,
"ce_q3": 0.26224804509289656,
"ppl_q3": 1.3026782787298854,
"ce_q4": 0.3287778823058816,
"ppl_q4": 1.3940396927580048,
"duration": 360.22646832466125
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6707401871681213,
"ce": 0.23956566899642348,
"ppl": 1.2730193123817444,
"ce_q1": 0.14374634724669158,
"ppl_q1": 1.155434732079506,
"ce_q2": 0.20624254284799098,
"ppl_q2": 1.230749096930027,
"ce_q3": 0.27056824281439185,
"ppl_q3": 1.3137432911396028,
"ce_q4": 0.3377055443301797,
"ppl_q4": 1.4069183074235916,
"duration": 9558.510349750519
},
"valid": {
"ce": 0.23204161217318306,
"ppl": 1.263381180883963,
"ce_q1": 0.13786554034752183,
"ppl_q1": 1.14866596837587,
"ce_q2": 0.20020800065013428,
"ppl_q2": 1.2233191140090363,
"ce_q3": 0.2617034689535069,
"ppl_q3": 1.3019578411609312,
"ce_q4": 0.32838943808139126,
"ppl_q4": 1.393486988695362,
"duration": 361.29156398773193
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7080844983011484,
"ce": 0.24309088224731384,
"ppl": 1.2774566966295242,
"ce_q1": 0.14555208410322668,
"ppl_q1": 1.1574990980625153,
"ce_q2": 0.20890174414776266,
"ppl_q2": 1.2339593514800071,
"ce_q3": 0.2747854264099151,
"ppl_q3": 1.3192665134072303,
"ce_q4": 0.34312427481636404,
"ppl_q4": 1.4144429289698601,
"duration": 9549.453770637512
},
"valid": {
"ce": 0.23211610722768156,
"ppl": 1.2634691739384132,
"ce_q1": 0.1376931574902957,
"ppl_q1": 1.1484606069854544,
"ce_q2": 0.20021181723362283,
"ppl_q2": 1.2233177861080895,
"ce_q3": 0.26189691724279257,
"ppl_q3": 1.3022053286999087,
"ce_q4": 0.3286625397733495,
"ppl_q4": 1.3938617298874674,
"duration": 361.47618532180786
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.6983074579387903,
"ce": 0.24082991381548344,
"ppl": 1.274703004717827,
"ce_q1": 0.14447409295849503,
"ppl_q1": 1.156317334473133,
"ce_q2": 0.2070563982259482,
"ppl_q2": 1.2318231120705605,
"ce_q3": 0.27201961440220473,
"ppl_q3": 1.3157302103042603,
"ce_q4": 0.3397695492412895,
"ppl_q4": 1.4099344087839127,
"duration": 9994.90785908699
},
"valid": {
"ce": 0.2309750067659571,
"ppl": 1.262012537521652,
"ce_q1": 0.13666374311794208,
"ppl_q1": 1.1472711864906022,
"ce_q2": 0.19922688490227808,
"ppl_q2": 1.2221039578884463,
"ce_q3": 0.2607280557291417,
"ppl_q3": 1.300660655468325,
"ce_q4": 0.327281353217137,
"ppl_q4": 1.3919113964974126,
"duration": 380.41486859321594
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7071668354123831,
"ce": 0.24068747078999878,
"ppl": 1.2744610707759858,
"ce_q1": 0.14407572587020695,
"ppl_q1": 1.15583081138134,
"ce_q2": 0.2071608739681542,
"ppl_q2": 1.2319029974341393,
"ce_q3": 0.2718148806579411,
"ppl_q3": 1.3153884276747703,
"ce_q4": 0.3396984034702182,
"ppl_q4": 1.409703156709671,
"duration": 9756.736243486404
},
"valid": {
"ce": 0.2309223112614849,
"ppl": 1.2619432995590982,
"ce_q1": 0.13653600805356533,
"ppl_q1": 1.1471215999579127,
"ce_q2": 0.19912380149847345,
"ppl_q2": 1.2219740876668617,
"ce_q3": 0.26079627569717695,
"ppl_q3": 1.3007519863828827,
"ce_q4": 0.3272331573917896,
"ppl_q4": 1.3918390243868284,
"duration": 368.5292272567749
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7122122403234243,
"ce": 0.23930577029660344,
"ppl": 1.272752983033657,
"ce_q1": 0.14276826794631778,
"ppl_q1": 1.1543263272047042,
"ce_q2": 0.20552064482867718,
"ppl_q2": 1.2299229969978334,
"ce_q3": 0.2703877854980528,
"ppl_q3": 1.3135577340126037,
"ce_q4": 0.3385463819168508,
"ppl_q4": 1.4082771706581116,
"duration": 9719.253911495209
},
"valid": {
"ce": 0.23022525050217593,
"ppl": 1.2610534761525407,
"ce_q1": 0.13569344844244705,
"ppl_q1": 1.1461462823650506,
"ce_q2": 0.19841003465124324,
"ppl_q2": 1.2210852752757977,
"ce_q3": 0.26008117425290844,
"ppl_q3": 1.2998103823842881,
"ce_q4": 0.32671634796299515,
"ppl_q4": 1.3911226504965672,
"duration": 360.2000744342804
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7181495098769665,
"ce": 0.2370236859191209,
"ppl": 1.2696498561501504,
"ce_q1": 0.14120216728560628,
"ppl_q1": 1.1524359884262085,
"ce_q2": 0.20351344673335553,
"ppl_q2": 1.22729424315691,
"ce_q3": 0.2681648657210171,
"ppl_q3": 1.3104434042572974,
"ce_q4": 0.3352142642848194,
"ppl_q4": 1.4031092252135278,
"duration": 9752.171288490295
},
"valid": {
"ce": 0.22986835165868832,
"ppl": 1.2605982324745082,
"ce_q1": 0.13534259253853484,
"ppl_q1": 1.145739893370037,
"ce_q2": 0.1980127974212924,
"ppl_q2": 1.220601871043821,
"ce_q3": 0.25968008356381067,
"ppl_q3": 1.2992816408978234,
"ce_q4": 0.3264379331582709,
"ppl_q4": 1.3907207884366,
"duration": 359.7213315963745
},
"evaluate": {
"duration": 0.0004868507385253906
},
"generate": {
"rtf": 0.13417162895202636,
"duration": 6.3338494300842285
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7458941115438938,
"ce": 0.2425526543110609,
"ppl": 1.276889626443386,
"ce_q1": 0.14413494194485246,
"ppl_q1": 1.1559125598073006,
"ce_q2": 0.2080324027650058,
"ppl_q2": 1.232991351366043,
"ce_q3": 0.2743159428536892,
"ppl_q3": 1.3187612901329995,
"ce_q4": 0.34372732899710534,
"ppl_q4": 1.4155418301820755,
"duration": 9700.450702428818
},
"valid": {
"ce": 0.22964197453818744,
"ppl": 1.2603011267094673,
"ce_q1": 0.13506576305703272,
"ppl_q1": 1.145417666133446,
"ce_q2": 0.19776223552755162,
"ppl_q2": 1.2202835430072834,
"ce_q3": 0.25956722320635106,
"ppl_q3": 1.299124062815799,
"ce_q4": 0.32617267966270447,
"ppl_q4": 1.390332289888889,
"duration": 360.6649878025055
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7595065858215093,
"ce": 0.24065504398941995,
"ppl": 1.2743447959423064,
"ce_q1": 0.1429246997386217,
"ppl_q1": 1.154476759672165,
"ce_q2": 0.20639702497422696,
"ppl_q2": 1.2309041517972945,
"ce_q3": 0.2722774493061006,
"ppl_q3": 1.3158954713344575,
"ce_q4": 0.34102100249379874,
"ppl_q4": 1.4114456915855407,
"duration": 9529.465988874435
},
"valid": {
"ce": 0.22926970090292678,
"ppl": 1.2598293959339963,
"ce_q1": 0.13459759384770936,
"ppl_q1": 1.1448792943471595,
"ce_q2": 0.19739679209416425,
"ppl_q2": 1.2198374814625028,
"ce_q3": 0.2591867259220232,
"ppl_q3": 1.298626478714279,
"ce_q4": 0.32589768571189687,
"ppl_q4": 1.3899421706984314,
"duration": 360.31201362609863
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7351434735059739,
"ce": 0.23938026629015804,
"ppl": 1.2727510742545127,
"ce_q1": 0.14172620253451168,
"ppl_q1": 1.1531024494767188,
"ce_q2": 0.2054664296582341,
"ppl_q2": 1.229805707871914,
"ce_q3": 0.27096363745629787,
"ppl_q3": 1.3142067841291427,
"ce_q4": 0.3393647952750325,
"ppl_q4": 1.4091091482639313,
"duration": 9539.187855243683
},
"valid": {
"ce": 0.22869904395900195,
"ppl": 1.259101620203332,
"ce_q1": 0.13400218126517308,
"ppl_q1": 1.1441895659965804,
"ce_q2": 0.1968119889497757,
"ppl_q2": 1.2191141707987725,
"ce_q3": 0.2585741540865053,
"ppl_q3": 1.2978223396252981,
"ce_q4": 0.3254078481393524,
"ppl_q4": 1.3892581870284262,
"duration": 359.8805067539215
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7548547839820385,
"ce": 0.23899226354435085,
"ppl": 1.2723530584573746,
"ce_q1": 0.14133981161378323,
"ppl_q1": 1.1526711270213128,
"ce_q2": 0.20458472933247684,
"ppl_q2": 1.2287503024339677,
"ce_q3": 0.27068992525339125,
"ppl_q3": 1.3139749676585197,
"ce_q4": 0.3393545893356204,
"ppl_q4": 1.4094223992824555,
"duration": 9542.971844911575
},
"valid": {
"ce": 0.22815483780224113,
"ppl": 1.2584095227567456,
"ce_q1": 0.1335570336897162,
"ppl_q1": 1.1436753031573719,
"ce_q2": 0.19643200320910803,
"ppl_q2": 1.2186425124542624,
"ce_q3": 0.2579797560089751,
"ppl_q3": 1.297049200987514,
"ce_q4": 0.3246505601873881,
"ppl_q4": 1.3881905275055124,
"duration": 368.03865933418274
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7593064209967851,
"ce": 0.23685456682741643,
"ppl": 1.2694467228055,
"ce_q1": 0.13991788394190371,
"ppl_q1": 1.1509653626680374,
"ce_q2": 0.2028427793905139,
"ppl_q2": 1.226467687189579,
"ce_q3": 0.2684141566194594,
"ppl_q3": 1.3107935539484024,
"ce_q4": 0.33624344670772555,
"ppl_q4": 1.4045857654213905,
"duration": 9580.192293643951
},
"valid": {
"ce": 0.2278020052781588,
"ppl": 1.2579596374608293,
"ce_q1": 0.13307934485470194,
"ppl_q1": 1.1431276934056342,
"ce_q2": 0.1959167003065725,
"ppl_q2": 1.2180069096480743,
"ce_q3": 0.25770771767519696,
"ppl_q3": 1.2966860261144517,
"ce_q4": 0.32450425832331936,
"ppl_q4": 1.3879840902135343,
"duration": 380.77603125572205
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7740668349564076,
"ce": 0.23690926843881607,
"ppl": 1.2695665367245674,
"ce_q1": 0.14018416186049582,
"ppl_q1": 1.1512908690571786,
"ce_q2": 0.20302358677983284,
"ppl_q2": 1.2267142446637154,
"ce_q3": 0.26843919563665986,
"ppl_q3": 1.3108944136500358,
"ce_q4": 0.3359901293106377,
"ppl_q4": 1.4043555800914764,
"duration": 10097.089985847473
},
"valid": {
"ce": 0.22762313202212128,
"ppl": 1.2577378719667844,
"ce_q1": 0.1328005560591251,
"ppl_q1": 1.1428058524675007,
"ce_q2": 0.1957149401872973,
"ppl_q2": 1.2177722318262993,
"ce_q3": 0.25755599735281137,
"ppl_q3": 1.2964891391464426,
"ce_q4": 0.3244210440146772,
"ppl_q4": 1.3878784572021872,
"duration": 380.9564025402069
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7629056445807219,
"ce": 0.23759560581296682,
"ppl": 1.2706120741963387,
"ce_q1": 0.14004144414514302,
"ppl_q1": 1.1511869466900826,
"ce_q2": 0.20307460083812476,
"ppl_q2": 1.226931110918522,
"ce_q3": 0.26914824870973825,
"ppl_q3": 1.3120183774232865,
"ce_q4": 0.33811812895536425,
"ppl_q4": 1.4077248179912567,
"duration": 9941.643844366074
},
"valid": {
"ce": 0.22723062015786955,
"ppl": 1.2572285570675814,
"ce_q1": 0.13235989726985556,
"ppl_q1": 1.1422934411447259,
"ce_q2": 0.19538095319950127,
"ppl_q2": 1.217345438426054,
"ce_q3": 0.25713647543629514,
"ppl_q3": 1.2959320469747615,
"ce_q4": 0.32404515505591525,
"ppl_q4": 1.3873321240461325,
"duration": 369.8635036945343
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7822054946124554,
"ce": 0.2374809791147709,
"ppl": 1.2704038944840432,
"ce_q1": 0.13979671021923423,
"ppl_q1": 1.1508849658966065,
"ce_q2": 0.20325931436382233,
"ppl_q2": 1.2271112378239633,
"ce_q3": 0.2688052276149392,
"ppl_q3": 1.311464338541031,
"ce_q4": 0.33806266306340693,
"ppl_q4": 1.4075241394042968,
"duration": 9753.883709430695
},
"valid": {
"ce": 0.22680127262314664,
"ppl": 1.256680597232867,
"ce_q1": 0.13173822007035907,
"ppl_q1": 1.1415773177448707,
"ce_q2": 0.194898527162739,
"ppl_q2": 1.2167490298234964,
"ce_q3": 0.25671091496567183,
"ppl_q3": 1.2953750498687164,
"ce_q4": 0.3238574330565296,
"ppl_q4": 1.3870616789105572,
"duration": 368.7049789428711
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.7903054953366518,
"ce": 0.2367863023430109,
"ppl": 1.2694587385058402,
"ce_q1": 0.1392606132775545,
"ppl_q1": 1.1502389285564423,
"ce_q2": 0.2027334346882999,
"ppl_q2": 1.2264285063147544,
"ce_q3": 0.26826757328025996,
"ppl_q3": 1.3107098459601403,
"ce_q4": 0.3368835870586336,
"ppl_q4": 1.405710391819477,
"duration": 9762.63434791565
},
"valid": {
"ce": 0.22626867682873447,
"ppl": 1.2560096798063833,
"ce_q1": 0.13152918969339963,
"ppl_q1": 1.1413356774969945,
"ce_q2": 0.1943574321420887,
"ppl_q2": 1.2160895730875716,
"ce_q3": 0.25616807226516025,
"ppl_q3": 1.294674186766902,
"ce_q4": 0.32302001345006726,
"ppl_q4": 1.3858960972556584,
"duration": 370.98861265182495
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8007361833155155,
"ce": 0.23663719480857254,
"ppl": 1.269249272108078,
"ce_q1": 0.1388839657269418,
"ppl_q1": 1.1497901789546012,
"ce_q2": 0.20259303681738675,
"ppl_q2": 1.2262300137281419,
"ce_q3": 0.2683315980695188,
"ppl_q3": 1.3107663362026214,
"ce_q4": 0.3367401777282357,
"ppl_q4": 1.4054936626553536,
"duration": 9874.321754693985
},
"valid": {
"ce": 0.2265099391718454,
"ppl": 1.2563036242617835,
"ce_q1": 0.1315399381933333,
"ppl_q1": 1.1413428481621077,
"ce_q2": 0.19479119060914726,
"ppl_q2": 1.2166080565392217,
"ce_q3": 0.25642215451107747,
"ppl_q3": 1.2949935922139808,
"ce_q4": 0.32328647507142416,
"ppl_q4": 1.3862528197373016,
"duration": 375.6848351955414
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8122369261234998,
"ce": 0.23792855026200413,
"ppl": 1.2708076131343842,
"ce_q1": 0.13978421782329678,
"ppl_q1": 1.1508216080665588,
"ce_q2": 0.2037396509498358,
"ppl_q2": 1.227577201128006,
"ce_q3": 0.2696165804602206,
"ppl_q3": 1.312350681900978,
"ce_q4": 0.33857375050336125,
"ppl_q4": 1.407835367023945,
"duration": 9884.318295240402
},
"valid": {
"ce": 0.22572990101349505,
"ppl": 1.2553173182885857,
"ce_q1": 0.13091754215427592,
"ppl_q1": 1.140630971027326,
"ce_q2": 0.19368831605850895,
"ppl_q2": 1.215258945392657,
"ce_q3": 0.2557466396048099,
"ppl_q3": 1.2941076197201693,
"ce_q4": 0.3225671030298064,
"ppl_q4": 1.3852484437483776,
"duration": 372.3847210407257
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.793204349860549,
"ce": 0.23371777066215874,
"ppl": 1.2655342619419099,
"ce_q1": 0.13718466015718878,
"ppl_q1": 1.147833851635456,
"ce_q2": 0.20006070529855788,
"ppl_q2": 1.2231077144742013,
"ce_q3": 0.2650848253462464,
"ppl_q3": 1.306504865348339,
"ce_q4": 0.33254089166224005,
"ppl_q4": 1.3995740624070168,
"duration": 9840.461713790894
},
"valid": {
"ce": 0.22548739687551425,
"ppl": 1.2550196496746209,
"ce_q1": 0.13059186638344691,
"ppl_q1": 1.1402611370328106,
"ce_q2": 0.19367442232898519,
"ppl_q2": 1.2152509855318674,
"ce_q3": 0.25537342813950553,
"ppl_q3": 1.2936262842975086,
"ce_q4": 0.32230987239487563,
"ppl_q4": 1.3849103662032116,
"duration": 371.8497664928436
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8240224216729403,
"ce": 0.23315792963653803,
"ppl": 1.2647923899292945,
"ce_q1": 0.13675606906041504,
"ppl_q1": 1.1473355682492257,
"ce_q2": 0.19954606886580586,
"ppl_q2": 1.2224380002021789,
"ce_q3": 0.2642233612984419,
"ppl_q3": 1.305375330865383,
"ce_q4": 0.33210621976852417,
"ppl_q4": 1.3988679733872413,
"duration": 9806.019900560379
},
"valid": {
"ce": 0.22566265207302721,
"ppl": 1.255235181579107,
"ce_q1": 0.13060598410194432,
"ppl_q1": 1.1402720001679432,
"ce_q2": 0.19378430151109455,
"ppl_q2": 1.2153825624079644,
"ce_q3": 0.255592904324773,
"ppl_q3": 1.2939109334462806,
"ce_q4": 0.3226674191559417,
"ppl_q4": 1.3853962119621566,
"duration": 369.0384819507599
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8544749879091978,
"ce": 0.23668315253779293,
"ppl": 1.269325015425682,
"ce_q1": 0.13880182195454835,
"ppl_q1": 1.1497194021940231,
"ce_q2": 0.20259497648850083,
"ppl_q2": 1.2262280118465423,
"ce_q3": 0.2684658388197422,
"ppl_q3": 1.3109768298268318,
"ce_q4": 0.3368699716813862,
"ppl_q4": 1.405703274011612,
"duration": 9878.42060136795
},
"valid": {
"ce": 0.22485628686373746,
"ppl": 1.2542132893695106,
"ce_q1": 0.12989867049493367,
"ppl_q1": 1.1394610555866096,
"ce_q2": 0.19280013177968278,
"ppl_q2": 1.214174518102332,
"ce_q3": 0.2548665206266355,
"ppl_q3": 1.2929603887509695,
"ce_q4": 0.32185981997960733,
"ppl_q4": 1.384264912786363,
"duration": 370.40525102615356
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8379982327222824,
"ce": 0.23464179111644626,
"ppl": 1.2667320666909219,
"ce_q1": 0.1371321489661932,
"ppl_q1": 1.1477951260209083,
"ce_q2": 0.20063013055175544,
"ppl_q2": 1.2238424528241159,
"ce_q3": 0.2660925634428859,
"ppl_q3": 1.3078379932045936,
"ce_q4": 0.3347123210243881,
"ppl_q4": 1.4026392904520035,
"duration": 9768.114993572235
},
"valid": {
"ce": 0.22464384723313247,
"ppl": 1.2539367404165147,
"ce_q1": 0.12969526610796964,
"ppl_q1": 1.139224242560471,
"ce_q2": 0.19264341051442713,
"ppl_q2": 1.2139757283126251,
"ce_q3": 0.2547223637752895,
"ppl_q3": 1.292766515212723,
"ce_q4": 0.3215143531560898,
"ppl_q4": 1.383761552315724,
"duration": 368.23194789886475
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.86219987000525,
"ce": 0.2342256380915642,
"ppl": 1.266316395699978,
"ce_q1": 0.1369770624432713,
"ppl_q1": 1.1476514223814012,
"ce_q2": 0.20028982244245708,
"ppl_q2": 1.2234873626828193,
"ce_q3": 0.2660375401973724,
"ppl_q3": 1.3079467360973358,
"ce_q4": 0.3335981272011995,
"ppl_q4": 1.4013232781887055,
"duration": 9705.977561950684
},
"valid": {
"ce": 0.22461296155860153,
"ppl": 1.2538884289657013,
"ce_q1": 0.1294288910170899,
"ppl_q1": 1.1389119293116317,
"ce_q2": 0.19257787992305395,
"ppl_q2": 1.2138880461077146,
"ce_q3": 0.25462750090828423,
"ppl_q3": 1.2926320667508282,
"ce_q4": 0.3218175761307342,
"ppl_q4": 1.3841760882848426,
"duration": 368.38805413246155
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8433113096654415,
"ce": 0.23467472491413355,
"ppl": 1.2667657610774041,
"ce_q1": 0.1371600694935769,
"ppl_q1": 1.1478181686997413,
"ce_q2": 0.20055909070000053,
"ppl_q2": 1.223722323358059,
"ce_q3": 0.2663664872609079,
"ppl_q3": 1.3082173136472701,
"ce_q4": 0.33461325147002935,
"ppl_q4": 1.402521133005619,
"duration": 9708.52119755745
},
"valid": {
"ce": 0.2242452059931393,
"ppl": 1.2534274828584888,
"ce_q1": 0.12902310716954968,
"ppl_q1": 1.138451891609385,
"ce_q2": 0.19203658024721507,
"ppl_q2": 1.2132271784770339,
"ce_q3": 0.2544846135792853,
"ppl_q3": 1.2924500884889047,
"ce_q4": 0.3214365185438832,
"ppl_q4": 1.3836491334287426,
"duration": 366.5915756225586
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8657613289952278,
"ce": 0.23252062162570655,
"ppl": 1.2639738714098931,
"ce_q1": 0.13543551043607294,
"ppl_q1": 1.145810266494751,
"ce_q2": 0.19870789982564746,
"ppl_q2": 1.2214089124798775,
"ce_q3": 0.2638619406186044,
"ppl_q3": 1.3048596836328505,
"ce_q4": 0.3320771352984011,
"ppl_q4": 1.3988350221514703,
"duration": 9681.17730140686
},
"valid": {
"ce": 0.2237146500545212,
"ppl": 1.252752418759503,
"ce_q1": 0.12870671661405625,
"ppl_q1": 1.1380892780762684,
"ce_q2": 0.19166359692057477,
"ppl_q2": 1.2127650432948824,
"ce_q3": 0.25372541592090947,
"ppl_q3": 1.291452762446826,
"ce_q4": 0.3207628672258763,
"ppl_q4": 1.382697487179237,
"duration": 366.955242395401
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8897006872445344,
"ce": 0.2343676543449983,
"ppl": 1.2663400563001632,
"ce_q1": 0.13655680075054988,
"ppl_q1": 1.147111685693264,
"ce_q2": 0.20027388502657414,
"ppl_q2": 1.2233549463748932,
"ce_q3": 0.26577890779823066,
"ppl_q3": 1.3073822123408319,
"ce_q4": 0.334861023417674,
"ppl_q4": 1.4028073732852935,
"duration": 9676.316682100296
},
"valid": {
"ce": 0.223639078438282,
"ppl": 1.2526614967780778,
"ce_q1": 0.12824694199275366,
"ppl_q1": 1.1375624590282198,
"ce_q2": 0.1917092931232875,
"ppl_q2": 1.2128265417074855,
"ce_q3": 0.25373853082898296,
"ppl_q3": 1.2914758920669556,
"ce_q4": 0.32086155554161794,
"ppl_q4": 1.3828491953354847,
"duration": 365.9454789161682
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8613627022206783,
"ce": 0.23115612630918622,
"ppl": 1.262145898103714,
"ce_q1": 0.13431656374409795,
"ppl_q1": 1.144490255534649,
"ce_q2": 0.19763093764148654,
"ppl_q2": 1.2200254902243615,
"ce_q3": 0.26261546912789346,
"ppl_q3": 1.3030886825323105,
"ce_q4": 0.3300615347065032,
"ppl_q4": 1.3958034124970435,
"duration": 9693.59753704071
},
"valid": {
"ce": 0.22312146915665157,
"ppl": 1.252003546002545,
"ce_q1": 0.1278508921872966,
"ppl_q1": 1.1371061364306678,
"ce_q2": 0.19106027465077896,
"ppl_q2": 1.212027967730655,
"ce_q3": 0.2531561288463918,
"ppl_q3": 1.2907147467890872,
"ce_q4": 0.3204185841958734,
"ppl_q4": 1.3822253308718717,
"duration": 366.94298481941223
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.908048603400588,
"ce": 0.235454489313066,
"ppl": 1.2677685154080391,
"ce_q1": 0.13675571073405446,
"ppl_q1": 1.14733238530159,
"ce_q2": 0.20070319144427776,
"ppl_q2": 1.2238985011577606,
"ce_q3": 0.26769069029390813,
"ppl_q3": 1.3099823869466782,
"ce_q4": 0.3366683651320636,
"ppl_q4": 1.4055282616615294,
"duration": 9683.2853038311
},
"valid": {
"ce": 0.22287857579656795,
"ppl": 1.251698582987242,
"ce_q1": 0.12748240839831437,
"ppl_q1": 1.1366879064825517,
"ce_q2": 0.19075078394594072,
"ppl_q2": 1.2116518926016893,
"ce_q3": 0.2531034140081345,
"ppl_q3": 1.290647349780119,
"ce_q4": 0.32017770070063917,
"ppl_q4": 1.3818864822387695,
"duration": 368.0078036785126
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.8907943293452263,
"ce": 0.2334776145145297,
"ppl": 1.265300272166729,
"ce_q1": 0.13528298148326576,
"ppl_q1": 1.1456673826575279,
"ce_q2": 0.19886671376228332,
"ppl_q2": 1.221681811749935,
"ce_q3": 0.26553389417007567,
"ppl_q3": 1.307193623483181,
"ce_q4": 0.33422686894610526,
"ppl_q4": 1.4021515442728996,
"duration": 9695.132495880127
},
"valid": {
"ce": 0.22244266816709615,
"ppl": 1.251152749303021,
"ce_q1": 0.12718283983914158,
"ppl_q1": 1.1363440857657903,
"ce_q2": 0.19031281929604615,
"ppl_q2": 1.2111205979238582,
"ce_q3": 0.2524469843770884,
"ppl_q3": 1.289795385131353,
"ce_q4": 0.31982803495624396,
"ppl_q4": 1.381416277040409,
"duration": 366.9203655719757
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9096775303632021,
"ce": 0.23506063682585954,
"ppl": 1.2671895247101783,
"ce_q1": 0.13643693218752742,
"ppl_q1": 1.1469796419143676,
"ce_q2": 0.20069455729424954,
"ppl_q2": 1.2238526966571808,
"ce_q3": 0.26717664779350164,
"ppl_q3": 1.3091547988057137,
"ce_q4": 0.3359344099313021,
"ppl_q4": 1.4042422744631766,
"duration": 9707.760141849518
},
"valid": {
"ce": 0.22256086521510837,
"ppl": 1.2512956631334522,
"ce_q1": 0.12733207147898554,
"ppl_q1": 1.1365127065513707,
"ce_q2": 0.1904381896498837,
"ppl_q2": 1.2112725671333602,
"ce_q3": 0.2526305061352404,
"ppl_q3": 1.2900259404242793,
"ce_q4": 0.3198426975102364,
"ppl_q4": 1.3814161517952062,
"duration": 368.1453652381897
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9211164204627276,
"ce": 0.23423236275464296,
"ppl": 1.2661625984311105,
"ce_q1": 0.135913484364748,
"ppl_q1": 1.146407061636448,
"ce_q2": 0.1996651696469635,
"ppl_q2": 1.2226304235458374,
"ce_q3": 0.26611007867753506,
"ppl_q3": 1.3077730984091758,
"ce_q4": 0.3352407186329365,
"ppl_q4": 1.4032266647219658,
"duration": 9650.361552000046
},
"valid": {
"ce": 0.22240206665253337,
"ppl": 1.251096153561073,
"ce_q1": 0.12683537272335607,
"ppl_q1": 1.135945184321343,
"ce_q2": 0.19016662504099593,
"ppl_q2": 1.2109397468687613,
"ce_q3": 0.25264612217492693,
"ppl_q3": 1.2900513621825207,
"ce_q4": 0.3199601495945001,
"ppl_q4": 1.3815833918655975,
"duration": 361.4666290283203
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9272204228788614,
"ce": 0.23298123812116683,
"ppl": 1.264630047082901,
"ce_q1": 0.13471630371920765,
"ppl_q1": 1.145032915711403,
"ce_q2": 0.19840975393727422,
"ppl_q2": 1.2211361768841744,
"ce_q3": 0.26513129886984826,
"ppl_q3": 1.3065884143710136,
"ce_q4": 0.3336675958223641,
"ppl_q4": 1.4011370757818222,
"duration": 9633.943640232086
},
"valid": {
"ce": 0.22227797270575655,
"ppl": 1.2509393692016602,
"ce_q1": 0.12701940819432464,
"ppl_q1": 1.1361545852467985,
"ce_q2": 0.19031501438798784,
"ppl_q2": 1.211118766024143,
"ce_q3": 0.2521979266518279,
"ppl_q3": 1.2894670570952982,
"ce_q4": 0.31957953791075117,
"ppl_q4": 1.381051922146278,
"duration": 367.50013637542725
},
"evaluate": {
"duration": 0.00047206878662109375
},
"generate": {
"rtf": 0.14413857460021973,
"duration": 6.499833822250366
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9470209015160799,
"ce": 0.23201891387626528,
"ppl": 1.2634971190094948,
"ce_q1": 0.13434666631557046,
"ppl_q1": 1.1446369975805282,
"ce_q2": 0.19790984624996782,
"ppl_q2": 1.2205443491339683,
"ce_q3": 0.2639150283038616,
"ppl_q3": 1.305118322134018,
"ce_q4": 0.33190411560982463,
"ppl_q4": 1.3989235188364983,
"duration": 9666.763538837433
},
"valid": {
"ce": 0.2217031944590279,
"ppl": 1.2502088878728166,
"ce_q1": 0.12630884429510636,
"ppl_q1": 1.1353401156920422,
"ce_q2": 0.18956488606673252,
"ppl_q2": 1.210199915910069,
"ce_q3": 0.2519025809214085,
"ppl_q3": 1.2890822464906717,
"ce_q4": 0.3190364658455305,
"ppl_q4": 1.380279086813142,
"duration": 365.5077362060547
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9266521014720202,
"ce": 0.22974622504785658,
"ppl": 1.2605374244451524,
"ce_q1": 0.13304848539456726,
"ppl_q1": 1.1431146758198738,
"ce_q2": 0.19607514742948115,
"ppl_q2": 1.2182835537195205,
"ce_q3": 0.26102787981554865,
"ppl_q3": 1.3012245599627494,
"ce_q4": 0.3288333866894245,
"ppl_q4": 1.3944026638269424,
"duration": 9671.954688549042
},
"valid": {
"ce": 0.22169184458406666,
"ppl": 1.2501893918725508,
"ce_q1": 0.12631878252082232,
"ppl_q1": 1.1353501911404766,
"ce_q2": 0.18967997424210173,
"ppl_q2": 1.2103372540655015,
"ce_q3": 0.2517635933583296,
"ppl_q3": 1.288890016229847,
"ce_q4": 0.31900502684750137,
"ppl_q4": 1.3802283428892304,
"duration": 365.62072372436523
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.948769894182682,
"ce": 0.23166203208640218,
"ppl": 1.2628923121094704,
"ce_q1": 0.13396896211337297,
"ppl_q1": 1.144148562014103,
"ce_q2": 0.19750558260828258,
"ppl_q2": 1.2199700670838356,
"ce_q3": 0.2633515786156058,
"ppl_q3": 1.3041578865051269,
"ce_q4": 0.3318220050185919,
"ppl_q4": 1.3984629881978035,
"duration": 9607.44147324562
},
"valid": {
"ce": 0.22155549065976204,
"ppl": 1.2500215316120582,
"ce_q1": 0.12599047796824311,
"ppl_q1": 1.1349758573725253,
"ce_q2": 0.18938914262041262,
"ppl_q2": 1.2099834620198118,
"ce_q3": 0.2518265888660769,
"ppl_q3": 1.2889760898638376,
"ce_q4": 0.31901575096800355,
"ppl_q4": 1.3802585405639456,
"duration": 361.4547076225281
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9637638848721981,
"ce": 0.2304306443668902,
"ppl": 1.2613646184802056,
"ce_q1": 0.13304610812384635,
"ppl_q1": 1.1430829654335977,
"ce_q2": 0.19657587004452945,
"ppl_q2": 1.2188454918861389,
"ce_q3": 0.2620207087360322,
"ppl_q3": 1.3024909216761589,
"ce_q4": 0.3300798907130957,
"ppl_q4": 1.3961113179922104,
"duration": 9569.696407794952
},
"valid": {
"ce": 0.2211502579194081,
"ppl": 1.2495146401320831,
"ce_q1": 0.12569607765991478,
"ppl_q1": 1.134642685515971,
"ce_q2": 0.18895255510188355,
"ppl_q2": 1.2094538347630561,
"ce_q3": 0.2514371895526029,
"ppl_q3": 1.2884815086292316,
"ce_q4": 0.31851520832580854,
"ppl_q4": 1.379555634305447,
"duration": 361.3419349193573
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9485900522023439,
"ce": 0.2294189603999257,
"ppl": 1.2599869817495346,
"ce_q1": 0.13221628443337977,
"ppl_q1": 1.1421014306545259,
"ce_q2": 0.19559517883323133,
"ppl_q2": 1.217570562660694,
"ce_q3": 0.26103992250189184,
"ppl_q3": 1.3010993636846542,
"ce_q4": 0.3288244555331767,
"ppl_q4": 1.3941211062669754,
"duration": 9602.91431236267
},
"valid": {
"ce": 0.22080804407596588,
"ppl": 1.2490805538394782,
"ce_q1": 0.12515957323433477,
"ppl_q1": 1.1340282853645614,
"ce_q2": 0.18858369722773757,
"ppl_q2": 1.209003923814508,
"ce_q3": 0.25110574641936945,
"ppl_q3": 1.288043412981154,
"ce_q4": 0.3183831612143335,
"ppl_q4": 1.3793715962880775,
"duration": 365.63708662986755
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9650584135204554,
"ce": 0.23151149417087435,
"ppl": 1.2626154228448867,
"ce_q1": 0.13360461187921466,
"ppl_q1": 1.1436857355833054,
"ce_q2": 0.19745921243727207,
"ppl_q2": 1.2198266586065292,
"ce_q3": 0.2633057012632489,
"ppl_q3": 1.3040281805992127,
"ce_q4": 0.3316764515675604,
"ppl_q4": 1.398113205909729,
"duration": 9679.771156787872
},
"valid": {
"ce": 0.22038969501287123,
"ppl": 1.2485525049740755,
"ce_q1": 0.12510413186082356,
"ppl_q1": 1.133963467199591,
"ce_q2": 0.18808293550074856,
"ppl_q2": 1.2083929852594304,
"ce_q3": 0.2506328007277054,
"ppl_q3": 1.287423654447628,
"ce_q4": 0.31773890932149523,
"ppl_q4": 1.3784759663328339,
"duration": 366.63561272621155
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9775146120935678,
"ce": 0.23115618247911335,
"ppl": 1.2621650641560556,
"ce_q1": 0.1330493483040482,
"ppl_q1": 1.1430369266271592,
"ce_q2": 0.1969981191176921,
"ppl_q2": 1.2192553377747535,
"ce_q3": 0.2629088137000799,
"ppl_q3": 1.303508770942688,
"ce_q4": 0.3316684479638934,
"ppl_q4": 1.3981463550329207,
"duration": 9685.887311220169
},
"valid": {
"ce": 0.22074471017982386,
"ppl": 1.2489974664736399,
"ce_q1": 0.12516663530016248,
"ppl_q1": 1.1340331970890867,
"ce_q2": 0.1884288596390169,
"ppl_q2": 1.2088091509251655,
"ce_q3": 0.25105338317306736,
"ppl_q3": 1.2879743183715433,
"ce_q4": 0.31832996312576006,
"ppl_q4": 1.3792952268938474,
"duration": 365.84961676597595
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 1.0191115493029357,
"ce": 0.22931050305441023,
"ppl": 1.26009128677845,
"ce_q1": 0.13216725342161953,
"ppl_q1": 1.142144699573517,
"ce_q2": 0.19550814217142762,
"ppl_q2": 1.217654495894909,
"ce_q3": 0.26090616297349334,
"ppl_q3": 1.301205468416214,
"ce_q4": 0.3286604534350336,
"ppl_q4": 1.3944075469374657,
"duration": 9914.915214776993
},
"valid": {
"ce": 0.22041845887522155,
"ppl": 1.2485858669763878,
"ce_q1": 0.1250342290046849,
"ppl_q1": 1.133883601502527,
"ce_q2": 0.18824795378914363,
"ppl_q2": 1.2085899597481837,
"ce_q3": 0.2507074797832513,
"ppl_q3": 1.2875178690198101,
"ce_q4": 0.3176841750929627,
"ppl_q4": 1.378393850749052,
"duration": 387.12232065200806
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9639001195579767,
"ce": 0.2309434513747692,
"ppl": 1.2620587416291238,
"ce_q1": 0.13269876553304494,
"ppl_q1": 1.1426936247944832,
"ce_q2": 0.19676523014716804,
"ppl_q2": 1.2190876905918122,
"ce_q3": 0.2627004101313651,
"ppl_q3": 1.3034465929865837,
"ce_q4": 0.33160940039902925,
"ppl_q4": 1.3983913182616234,
"duration": 9993.127159833908
},
"valid": {
"ce": 0.2200620936442025,
"ppl": 1.2481322409231452,
"ce_q1": 0.12471365707018707,
"ppl_q1": 1.133514239818235,
"ce_q2": 0.18758306359942956,
"ppl_q2": 1.2077742784838132,
"ce_q3": 0.250356066453306,
"ppl_q3": 1.2870621062532257,
"ce_q4": 0.3175955880669099,
"ppl_q4": 1.3782608735410473,
"duration": 365.55388736724854
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 1.0031014182716609,
"ce": 0.23244657453894615,
"ppl": 1.2638761784434318,
"ce_q1": 0.13384626237675548,
"ppl_q1": 1.1439940058588982,
"ce_q2": 0.19792362372763456,
"ppl_q2": 1.2204588510394097,
"ce_q3": 0.2645719394423068,
"ppl_q3": 1.305765799164772,
"ce_q4": 0.33344447235390545,
"ppl_q4": 1.4007595770955086,
"duration": 9666.28326678276
},
"valid": {
"ce": 0.219994455575943,
"ppl": 1.2480462276482884,
"ce_q1": 0.12452223288673389,
"ppl_q1": 1.1332957125917267,
"ce_q2": 0.18762184415436997,
"ppl_q2": 1.2078235677525968,
"ce_q3": 0.25026123687813556,
"ppl_q3": 1.2869350759288933,
"ce_q4": 0.31757251031791106,
"ppl_q4": 1.3782256147529506,
"duration": 365.40531611442566
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 1.0118435633182525,
"ce": 0.23150032332539558,
"ppl": 1.2628177829384803,
"ce_q1": 0.1331249108137563,
"ppl_q1": 1.143229542195797,
"ce_q2": 0.19717838522046804,
"ppl_q2": 1.2196555158495903,
"ce_q3": 0.2636706692278385,
"ppl_q3": 1.3047886480093003,
"ce_q4": 0.3320273279119283,
"ppl_q4": 1.399018600523472,
"duration": 9686.507339954376
},
"valid": {
"ce": 0.22008233008128178,
"ppl": 1.2481568312343163,
"ce_q1": 0.12448131703311884,
"ppl_q1": 1.1332505715044239,
"ce_q2": 0.1878422381757181,
"ppl_q2": 1.2080933021593698,
"ce_q3": 0.25035045069607,
"ppl_q3": 1.2870467463626136,
"ce_q4": 0.3176553151275538,
"ppl_q4": 1.3783401341377934,
"duration": 365.8681538105011
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 0.9837889188677073,
"ce": 0.22978202194347977,
"ppl": 1.2605826894640924,
"ce_q1": 0.13192134928144514,
"ppl_q1": 1.1418069807291031,
"ce_q2": 0.19567500212416053,
"ppl_q2": 1.2177738382816314,
"ce_q3": 0.261657769985497,
"ppl_q3": 1.302064316213131,
"ce_q4": 0.3298739665001631,
"ppl_q4": 1.3959158515930177,
"duration": 9625.167886734009
},
"valid": {
"ce": 0.2197572504040561,
"ppl": 1.2477463513989993,
"ce_q1": 0.1238613875606392,
"ppl_q1": 1.132543298262584,
"ce_q2": 0.18757582361562342,
"ppl_q2": 1.2077673432193226,
"ce_q3": 0.2501301539095142,
"ppl_q3": 1.2867611737190923,
"ce_q4": 0.3174616377564925,
"ppl_q4": 1.3780674738220022,
"duration": 361.4447102546692
}
},
{
"train": {
"lr": 9.999999999999715e-05,
"grad_norm": 1.0205622183084488,
"ce": 0.2291562844365835,
"ppl": 1.259750031709671,
"ce_q1": 0.13173288409784437,
"ppl_q1": 1.1415968937277794,
"ce_q2": 0.1950578138511628,
"ppl_q2": 1.2170116726756095,
"ce_q3": 0.2607075095996261,
"ppl_q3": 1.3007468707561494,
"ce_q4": 0.32912692898139356,
"ppl_q4": 1.3947249777317048,
"duration": 9559.163588762283
},
"valid": {
"ce": 0.2195237306288526,
"ppl": 1.247450664073606,
"ce_q1": 0.12384205174785626,
"ppl_q1": 1.132516882087611,
"ce_q2": 0.18722588946170446,
"ppl_q2": 1.2073387767695174,
"ce_q3": 0.24984214171955857,
"ppl_q3": 1.2863905897623376,
"ce_q4": 0.3171848390675798,
"ppl_q4": 1.3776818740216992,
"duration": 361.4325656890869
}
}
]