LamaDiab's picture
Final training metrics
858b1c6 verified
{
"metrics_history": [
{
"epoch": 0.05819366852886406,
"global_step": 500,
"eval_loss": 0.3265715539455414,
"eval_cosine_accuracy": 0.8337206840515137
},
{
"epoch": 0.11638733705772812,
"global_step": 1000,
"eval_loss": 0.3617343008518219,
"eval_cosine_accuracy": 0.8280160427093506
},
{
"epoch": 0.17458100558659218,
"global_step": 1500,
"eval_loss": 0.35951632261276245,
"eval_cosine_accuracy": 0.8382632732391357
},
{
"epoch": 0.23277467411545624,
"global_step": 2000,
"eval_loss": 0.3711424171924591,
"eval_cosine_accuracy": 0.8358334898948669
},
{
"epoch": 0.2909683426443203,
"global_step": 2500,
"eval_loss": 0.3904484808444977,
"eval_cosine_accuracy": 0.8282273411750793
},
{
"epoch": 0.34916201117318435,
"global_step": 3000,
"eval_loss": 0.38800719380378723,
"eval_cosine_accuracy": 0.822839617729187
},
{
"epoch": 0.4073556797020484,
"global_step": 3500,
"eval_loss": 0.45464685559272766,
"eval_cosine_accuracy": 0.7903021574020386
},
{
"epoch": 0.4655493482309125,
"global_step": 4000,
"eval_loss": 0.4399067163467407,
"eval_cosine_accuracy": 0.7950559854507446
},
{
"epoch": 0.5237430167597765,
"global_step": 4500,
"eval_loss": 0.44711923599243164,
"eval_cosine_accuracy": 0.7893513441085815
},
{
"epoch": 0.5819366852886406,
"global_step": 5000,
"eval_loss": 0.44583871960639954,
"eval_cosine_accuracy": 0.7972744703292847
},
{
"epoch": 0.6401303538175046,
"global_step": 5500,
"eval_loss": 0.4766450822353363,
"eval_cosine_accuracy": 0.7760405540466309
},
{
"epoch": 0.6983240223463687,
"global_step": 6000,
"eval_loss": 0.49710753560066223,
"eval_cosine_accuracy": 0.7615677118301392
},
{
"epoch": 0.7565176908752328,
"global_step": 6500,
"eval_loss": 0.48617255687713623,
"eval_cosine_accuracy": 0.7761462330818176
},
{
"epoch": 0.8147113594040968,
"global_step": 7000,
"eval_loss": 0.514951765537262,
"eval_cosine_accuracy": 0.7470948696136475
},
{
"epoch": 0.8729050279329609,
"global_step": 7500,
"eval_loss": 0.49496394395828247,
"eval_cosine_accuracy": 0.7597718238830566
},
{
"epoch": 0.931098696461825,
"global_step": 8000,
"eval_loss": 0.5210782885551453,
"eval_cosine_accuracy": 0.7321994304656982
},
{
"epoch": 0.9892923649906891,
"global_step": 8500,
"eval_loss": 0.5197136402130127,
"eval_cosine_accuracy": 0.7376927733421326
},
{
"epoch": 1.047486033519553,
"global_step": 9000,
"eval_loss": 0.5157160758972168,
"eval_cosine_accuracy": 0.7394887208938599
},
{
"epoch": 1.105679702048417,
"global_step": 9500,
"eval_loss": 0.5262643694877625,
"eval_cosine_accuracy": 0.7379040718078613
},
{
"epoch": 1.1638733705772812,
"global_step": 10000,
"eval_loss": 0.5438600778579712,
"eval_cosine_accuracy": 0.7258609533309937
},
{
"epoch": 1.2220670391061452,
"global_step": 10500,
"eval_loss": 0.5367482900619507,
"eval_cosine_accuracy": 0.7293471097946167
},
{
"epoch": 1.2802607076350094,
"global_step": 11000,
"eval_loss": 0.5721879005432129,
"eval_cosine_accuracy": 0.7034650444984436
},
{
"epoch": 1.3384543761638734,
"global_step": 11500,
"eval_loss": 0.5377742648124695,
"eval_cosine_accuracy": 0.7343122959136963
},
{
"epoch": 1.3966480446927374,
"global_step": 12000,
"eval_loss": 0.5350662469863892,
"eval_cosine_accuracy": 0.730192244052887
},
{
"epoch": 1.4548417132216014,
"global_step": 12500,
"eval_loss": 0.5529947876930237,
"eval_cosine_accuracy": 0.7192055583000183
},
{
"epoch": 1.5130353817504656,
"global_step": 13000,
"eval_loss": 0.5624330043792725,
"eval_cosine_accuracy": 0.7035706639289856
},
{
"epoch": 1.5712290502793296,
"global_step": 13500,
"eval_loss": 0.5798157453536987,
"eval_cosine_accuracy": 0.6944855451583862
},
{
"epoch": 1.6294227188081938,
"global_step": 14000,
"eval_loss": 0.5619487166404724,
"eval_cosine_accuracy": 0.7114937901496887
},
{
"epoch": 1.6876163873370578,
"global_step": 14500,
"eval_loss": 0.5943849682807922,
"eval_cosine_accuracy": 0.6863511800765991
},
{
"epoch": 1.7458100558659218,
"global_step": 15000,
"eval_loss": 0.5627889633178711,
"eval_cosine_accuracy": 0.712444543838501
},
{
"epoch": 1.8040037243947857,
"global_step": 15500,
"eval_loss": 0.5584973692893982,
"eval_cosine_accuracy": 0.698183000087738
},
{
"epoch": 1.86219739292365,
"global_step": 16000,
"eval_loss": 0.5702577233314514,
"eval_cosine_accuracy": 0.7010352611541748
},
{
"epoch": 1.920391061452514,
"global_step": 16500,
"eval_loss": 0.5965489745140076,
"eval_cosine_accuracy": 0.6801183223724365
},
{
"epoch": 1.9785847299813781,
"global_step": 17000,
"eval_loss": 0.5630908608436584,
"eval_cosine_accuracy": 0.7057891488075256
},
{
"epoch": 2.036778398510242,
"global_step": 17500,
"eval_loss": 0.573241651058197,
"eval_cosine_accuracy": 0.7000845074653625
},
{
"epoch": 2.094972067039106,
"global_step": 18000,
"eval_loss": 0.5863020420074463,
"eval_cosine_accuracy": 0.6810690760612488
},
{
"epoch": 2.15316573556797,
"global_step": 18500,
"eval_loss": 0.5871772766113281,
"eval_cosine_accuracy": 0.6927952766418457
},
{
"epoch": 2.211359404096834,
"global_step": 19000,
"eval_loss": 0.5891428589820862,
"eval_cosine_accuracy": 0.6970208883285522
},
{
"epoch": 2.2695530726256985,
"global_step": 19500,
"eval_loss": 0.600773811340332,
"eval_cosine_accuracy": 0.6833931803703308
},
{
"epoch": 2.3277467411545625,
"global_step": 20000,
"eval_loss": 0.5844529271125793,
"eval_cosine_accuracy": 0.6958588361740112
},
{
"epoch": 2.3859404096834265,
"global_step": 20500,
"eval_loss": 0.5948883295059204,
"eval_cosine_accuracy": 0.6862455010414124
},
{
"epoch": 2.4441340782122905,
"global_step": 21000,
"eval_loss": 0.5971450805664062,
"eval_cosine_accuracy": 0.6829706430435181
},
{
"epoch": 2.5023277467411544,
"global_step": 21500,
"eval_loss": 0.612638533115387,
"eval_cosine_accuracy": 0.6735685467720032
},
{
"epoch": 2.560521415270019,
"global_step": 22000,
"eval_loss": 0.5996671319007874,
"eval_cosine_accuracy": 0.6825480461120605
},
{
"epoch": 2.618715083798883,
"global_step": 22500,
"eval_loss": 0.6220535635948181,
"eval_cosine_accuracy": 0.6731460094451904
},
{
"epoch": 2.676908752327747,
"global_step": 23000,
"eval_loss": 0.6126848459243774,
"eval_cosine_accuracy": 0.6774773001670837
},
{
"epoch": 2.735102420856611,
"global_step": 23500,
"eval_loss": 0.6177366971969604,
"eval_cosine_accuracy": 0.6693429350852966
},
{
"epoch": 2.793296089385475,
"global_step": 24000,
"eval_loss": 0.6116131544113159,
"eval_cosine_accuracy": 0.6803296208381653
},
{
"epoch": 2.851489757914339,
"global_step": 24500,
"eval_loss": 0.6035599112510681,
"eval_cosine_accuracy": 0.6775829195976257
},
{
"epoch": 2.9096834264432028,
"global_step": 25000,
"eval_loss": 0.6071164011955261,
"eval_cosine_accuracy": 0.6763152480125427
},
{
"epoch": 2.967877094972067,
"global_step": 25500,
"eval_loss": 0.6033285856246948,
"eval_cosine_accuracy": 0.6777942180633545
},
{
"epoch": 3.026070763500931,
"global_step": 26000,
"eval_loss": 0.6075280904769897,
"eval_cosine_accuracy": 0.6765264868736267
},
{
"epoch": 3.084264432029795,
"global_step": 26500,
"eval_loss": 0.6169347763061523,
"eval_cosine_accuracy": 0.674836277961731
},
{
"epoch": 3.142458100558659,
"global_step": 27000,
"eval_loss": 0.6152327656745911,
"eval_cosine_accuracy": 0.674836277961731
},
{
"epoch": 3.200651769087523,
"global_step": 27500,
"eval_loss": 0.6097703576087952,
"eval_cosine_accuracy": 0.6781111359596252
},
{
"epoch": 3.2588454376163876,
"global_step": 28000,
"eval_loss": 0.6135534048080444,
"eval_cosine_accuracy": 0.6747305989265442
},
{
"epoch": 3.3170391061452515,
"global_step": 28500,
"eval_loss": 0.6127398610115051,
"eval_cosine_accuracy": 0.6752588152885437
},
{
"epoch": 3.3752327746741155,
"global_step": 29000,
"eval_loss": 0.6184883117675781,
"eval_cosine_accuracy": 0.6732516288757324
},
{
"epoch": 3.4334264432029795,
"global_step": 29500,
"eval_loss": 0.6146544218063354,
"eval_cosine_accuracy": 0.6731460094451904
},
{
"epoch": 3.4916201117318435,
"global_step": 30000,
"eval_loss": 0.6132456660270691,
"eval_cosine_accuracy": 0.6731460094451904
},
{
"epoch": 3.5498137802607075,
"global_step": 30500,
"eval_loss": 0.6162088513374329,
"eval_cosine_accuracy": 0.6726177930831909
},
{
"epoch": 3.6080074487895715,
"global_step": 31000,
"eval_loss": 0.6143919229507446,
"eval_cosine_accuracy": 0.6745193600654602
},
{
"epoch": 3.666201117318436,
"global_step": 31500,
"eval_loss": 0.6197054982185364,
"eval_cosine_accuracy": 0.6723008751869202
},
{
"epoch": 3.7243947858473,
"global_step": 32000,
"eval_loss": 0.619126558303833,
"eval_cosine_accuracy": 0.6715613603591919
},
{
"epoch": 3.782588454376164,
"global_step": 32500,
"eval_loss": 0.6180660128593445,
"eval_cosine_accuracy": 0.6720895767211914
},
{
"epoch": 3.840782122905028,
"global_step": 33000,
"eval_loss": 0.6176912188529968,
"eval_cosine_accuracy": 0.6726177930831909
},
{
"epoch": 3.898975791433892,
"global_step": 33500,
"eval_loss": 0.6178871989250183,
"eval_cosine_accuracy": 0.6723008751869202
},
{
"epoch": 3.9571694599627563,
"global_step": 34000,
"eval_loss": 0.6180205345153809,
"eval_cosine_accuracy": 0.6720895767211914
}
],
"total_epochs": 4.0,
"total_steps": 34368
}