LamaDiab's picture
Training checkpoint - Epoch 4, Step 34368
8cab2f4 verified
{
"metrics_history": [
{
"epoch": 0.05819366852886406,
"global_step": 500,
"eval_loss": 2.536726713180542,
"eval_cosine_accuracy": 0.9404736757278442
},
{
"epoch": 0.11638733705772812,
"global_step": 1000,
"eval_loss": 2.6046745777130127,
"eval_cosine_accuracy": 0.9364559054374695
},
{
"epoch": 0.17458100558659218,
"global_step": 1500,
"eval_loss": 2.540637969970703,
"eval_cosine_accuracy": 0.9412137866020203
},
{
"epoch": 0.23277467411545624,
"global_step": 2000,
"eval_loss": 2.5318424701690674,
"eval_cosine_accuracy": 0.9451258182525635
},
{
"epoch": 0.2909683426443203,
"global_step": 2500,
"eval_loss": 2.474266767501831,
"eval_cosine_accuracy": 0.9467117786407471
},
{
"epoch": 0.34916201117318435,
"global_step": 3000,
"eval_loss": 2.547072649002075,
"eval_cosine_accuracy": 0.9435398578643799
},
{
"epoch": 0.4073556797020484,
"global_step": 3500,
"eval_loss": 2.472174644470215,
"eval_cosine_accuracy": 0.9489321112632751
},
{
"epoch": 0.4655493482309125,
"global_step": 4000,
"eval_loss": 2.5426251888275146,
"eval_cosine_accuracy": 0.9438570737838745
},
{
"epoch": 0.5237430167597765,
"global_step": 4500,
"eval_loss": 2.4768149852752686,
"eval_cosine_accuracy": 0.9473461508750916
},
{
"epoch": 0.5819366852886406,
"global_step": 5000,
"eval_loss": 2.4771170616149902,
"eval_cosine_accuracy": 0.9487206339836121
},
{
"epoch": 0.6401303538175046,
"global_step": 5500,
"eval_loss": 2.6126925945281982,
"eval_cosine_accuracy": 0.9412137866020203
},
{
"epoch": 0.6983240223463687,
"global_step": 6000,
"eval_loss": 2.457711935043335,
"eval_cosine_accuracy": 0.9492493271827698
},
{
"epoch": 0.7565176908752328,
"global_step": 6500,
"eval_loss": 2.48168683052063,
"eval_cosine_accuracy": 0.9438570737838745
},
{
"epoch": 0.8147113594040968,
"global_step": 7000,
"eval_loss": 2.5139832496643066,
"eval_cosine_accuracy": 0.943751335144043
},
{
"epoch": 0.8729050279329609,
"global_step": 7500,
"eval_loss": 2.4431588649749756,
"eval_cosine_accuracy": 0.9494607448577881
},
{
"epoch": 0.931098696461825,
"global_step": 8000,
"eval_loss": 2.5187907218933105,
"eval_cosine_accuracy": 0.9420596361160278
},
{
"epoch": 0.9892923649906891,
"global_step": 8500,
"eval_loss": 2.4668424129486084,
"eval_cosine_accuracy": 0.9469232559204102
},
{
"epoch": 1.047486033519553,
"global_step": 9000,
"eval_loss": 2.6691627502441406,
"eval_cosine_accuracy": 0.9422711133956909
},
{
"epoch": 1.105679702048417,
"global_step": 9500,
"eval_loss": 2.5817720890045166,
"eval_cosine_accuracy": 0.9454430341720581
},
{
"epoch": 1.1638733705772812,
"global_step": 10000,
"eval_loss": 2.5811285972595215,
"eval_cosine_accuracy": 0.9443857073783875
},
{
"epoch": 1.2220670391061452,
"global_step": 10500,
"eval_loss": 2.588257312774658,
"eval_cosine_accuracy": 0.9443857073783875
},
{
"epoch": 1.2802607076350094,
"global_step": 11000,
"eval_loss": 2.626814842224121,
"eval_cosine_accuracy": 0.943751335144043
},
{
"epoch": 1.3384543761638734,
"global_step": 11500,
"eval_loss": 2.5278029441833496,
"eval_cosine_accuracy": 0.9466060400009155
},
{
"epoch": 1.3966480446927374,
"global_step": 12000,
"eval_loss": 2.387155532836914,
"eval_cosine_accuracy": 0.9545358419418335
},
{
"epoch": 1.4548417132216014,
"global_step": 12500,
"eval_loss": 2.531130313873291,
"eval_cosine_accuracy": 0.9511524438858032
},
{
"epoch": 1.5130353817504656,
"global_step": 13000,
"eval_loss": 2.4939699172973633,
"eval_cosine_accuracy": 0.9498836994171143
},
{
"epoch": 1.5712290502793296,
"global_step": 13500,
"eval_loss": 2.3089163303375244,
"eval_cosine_accuracy": 0.9558045864105225
},
{
"epoch": 1.6294227188081938,
"global_step": 14000,
"eval_loss": 2.4148993492126465,
"eval_cosine_accuracy": 0.9548530578613281
},
{
"epoch": 1.6876163873370578,
"global_step": 14500,
"eval_loss": 2.3580262660980225,
"eval_cosine_accuracy": 0.9537957310676575
},
{
"epoch": 1.7458100558659218,
"global_step": 15000,
"eval_loss": 2.4263856410980225,
"eval_cosine_accuracy": 0.9540072083473206
},
{
"epoch": 1.8040037243947857,
"global_step": 15500,
"eval_loss": 2.4231128692626953,
"eval_cosine_accuracy": 0.9536899924278259
},
{
"epoch": 1.86219739292365,
"global_step": 16000,
"eval_loss": 2.395444393157959,
"eval_cosine_accuracy": 0.954430103302002
},
{
"epoch": 1.920391061452514,
"global_step": 16500,
"eval_loss": 2.3798062801361084,
"eval_cosine_accuracy": 0.9555931687355042
},
{
"epoch": 1.9785847299813781,
"global_step": 17000,
"eval_loss": 2.3469178676605225,
"eval_cosine_accuracy": 0.9586593508720398
},
{
"epoch": 2.036778398510242,
"global_step": 17500,
"eval_loss": 2.543642044067383,
"eval_cosine_accuracy": 0.9502009153366089
},
{
"epoch": 2.094972067039106,
"global_step": 18000,
"eval_loss": 2.522242784500122,
"eval_cosine_accuracy": 0.9498836994171143
},
{
"epoch": 2.15316573556797,
"global_step": 18500,
"eval_loss": 2.5265400409698486,
"eval_cosine_accuracy": 0.9517868757247925
},
{
"epoch": 2.211359404096834,
"global_step": 19000,
"eval_loss": 2.3943419456481934,
"eval_cosine_accuracy": 0.954641580581665
},
{
"epoch": 2.2695530726256985,
"global_step": 19500,
"eval_loss": 2.513169288635254,
"eval_cosine_accuracy": 0.9505180716514587
},
{
"epoch": 2.3277467411545625,
"global_step": 20000,
"eval_loss": 2.3868706226348877,
"eval_cosine_accuracy": 0.954641580581665
},
{
"epoch": 2.3859404096834265,
"global_step": 20500,
"eval_loss": 2.3330609798431396,
"eval_cosine_accuracy": 0.9550644755363464
},
{
"epoch": 2.4441340782122905,
"global_step": 21000,
"eval_loss": 2.363619327545166,
"eval_cosine_accuracy": 0.954430103302002
},
{
"epoch": 2.5023277467411544,
"global_step": 21500,
"eval_loss": 2.4074714183807373,
"eval_cosine_accuracy": 0.9541129469871521
},
{
"epoch": 2.560521415270019,
"global_step": 22000,
"eval_loss": 2.359633207321167,
"eval_cosine_accuracy": 0.9570733904838562
},
{
"epoch": 2.618715083798883,
"global_step": 22500,
"eval_loss": 2.345329999923706,
"eval_cosine_accuracy": 0.9581306576728821
},
{
"epoch": 2.676908752327747,
"global_step": 23000,
"eval_loss": 2.347712278366089,
"eval_cosine_accuracy": 0.9565446972846985
},
{
"epoch": 2.735102420856611,
"global_step": 23500,
"eval_loss": 2.31443190574646,
"eval_cosine_accuracy": 0.9582363963127136
},
{
"epoch": 2.793296089385475,
"global_step": 24000,
"eval_loss": 2.3241617679595947,
"eval_cosine_accuracy": 0.9574962854385376
},
{
"epoch": 2.851489757914339,
"global_step": 24500,
"eval_loss": 2.311241865158081,
"eval_cosine_accuracy": 0.9569676518440247
},
{
"epoch": 2.9096834264432028,
"global_step": 25000,
"eval_loss": 2.3046512603759766,
"eval_cosine_accuracy": 0.9579192399978638
},
{
"epoch": 2.967877094972067,
"global_step": 25500,
"eval_loss": 2.311337947845459,
"eval_cosine_accuracy": 0.9583421349525452
},
{
"epoch": 3.026070763500931,
"global_step": 26000,
"eval_loss": 2.5784075260162354,
"eval_cosine_accuracy": 0.9500951766967773
},
{
"epoch": 3.084264432029795,
"global_step": 26500,
"eval_loss": 2.527648448944092,
"eval_cosine_accuracy": 0.9526326656341553
},
{
"epoch": 3.142458100558659,
"global_step": 27000,
"eval_loss": 2.4859249591827393,
"eval_cosine_accuracy": 0.954430103302002
},
{
"epoch": 3.200651769087523,
"global_step": 27500,
"eval_loss": 2.4097483158111572,
"eval_cosine_accuracy": 0.9561218023300171
},
{
"epoch": 3.2588454376163876,
"global_step": 28000,
"eval_loss": 2.3856334686279297,
"eval_cosine_accuracy": 0.9569676518440247
},
{
"epoch": 3.3170391061452515,
"global_step": 28500,
"eval_loss": 2.345590114593506,
"eval_cosine_accuracy": 0.9565446972846985
},
{
"epoch": 3.3752327746741155,
"global_step": 29000,
"eval_loss": 2.3601977825164795,
"eval_cosine_accuracy": 0.9567561745643616
},
{
"epoch": 3.4334264432029795,
"global_step": 29500,
"eval_loss": 2.3479251861572266,
"eval_cosine_accuracy": 0.9580249786376953
},
{
"epoch": 3.4916201117318435,
"global_step": 30000,
"eval_loss": 2.3353111743927,
"eval_cosine_accuracy": 0.9583421349525452
},
{
"epoch": 3.5498137802607075,
"global_step": 30500,
"eval_loss": 2.319936752319336,
"eval_cosine_accuracy": 0.9588707685470581
},
{
"epoch": 3.6080074487895715,
"global_step": 31000,
"eval_loss": 2.3078086376190186,
"eval_cosine_accuracy": 0.9584478735923767
},
{
"epoch": 3.666201117318436,
"global_step": 31500,
"eval_loss": 2.305248260498047,
"eval_cosine_accuracy": 0.9590822458267212
},
{
"epoch": 3.7243947858473,
"global_step": 32000,
"eval_loss": 2.3091342449188232,
"eval_cosine_accuracy": 0.9586593508720398
},
{
"epoch": 3.782588454376164,
"global_step": 32500,
"eval_loss": 2.3073363304138184,
"eval_cosine_accuracy": 0.9591879844665527
},
{
"epoch": 3.840782122905028,
"global_step": 33000,
"eval_loss": 2.3094964027404785,
"eval_cosine_accuracy": 0.9587650895118713
},
{
"epoch": 3.898975791433892,
"global_step": 33500,
"eval_loss": 2.3104605674743652,
"eval_cosine_accuracy": 0.9587650895118713
},
{
"epoch": 3.9571694599627563,
"global_step": 34000,
"eval_loss": 2.3104751110076904,
"eval_cosine_accuracy": 0.9587650895118713
}
],
"current_epoch": 4,
"global_step": 34368
}