LamaDiab's picture
Training checkpoint - Epoch 5, Step 76965
5cffc8c verified
{
"metrics_history": [
{
"epoch": 0.12992918859221725,
"global_step": 2000,
"eval_loss": 0.9158492088317871,
"eval_cosine_accuracy": 0.9490216970443726
},
{
"epoch": 0.2598583771844345,
"global_step": 4000,
"eval_loss": 0.9200904369354248,
"eval_cosine_accuracy": 0.9499735832214355
},
{
"epoch": 0.38978756577665175,
"global_step": 6000,
"eval_loss": 0.8998962640762329,
"eval_cosine_accuracy": 0.9456372261047363
},
{
"epoch": 0.519716754368869,
"global_step": 8000,
"eval_loss": 0.8402906060218811,
"eval_cosine_accuracy": 0.9466948509216309
},
{
"epoch": 0.6496459429610862,
"global_step": 10000,
"eval_loss": 0.8332843780517578,
"eval_cosine_accuracy": 0.947012186050415
},
{
"epoch": 0.7795751315533035,
"global_step": 12000,
"eval_loss": 0.8381510972976685,
"eval_cosine_accuracy": 0.9478582739830017
},
{
"epoch": 0.9095043201455207,
"global_step": 14000,
"eval_loss": 0.8515253663063049,
"eval_cosine_accuracy": 0.9480698108673096
},
{
"epoch": 1.039433508737738,
"global_step": 16000,
"eval_loss": 0.861483097076416,
"eval_cosine_accuracy": 0.9481755495071411
},
{
"epoch": 1.1693626973299551,
"global_step": 18000,
"eval_loss": 0.866976261138916,
"eval_cosine_accuracy": 0.9490216970443726
},
{
"epoch": 1.2992918859221725,
"global_step": 20000,
"eval_loss": 0.8142719268798828,
"eval_cosine_accuracy": 0.9511369466781616
},
{
"epoch": 1.4292210745143896,
"global_step": 22000,
"eval_loss": 0.7982929944992065,
"eval_cosine_accuracy": 0.9521946310997009
},
{
"epoch": 1.559150263106607,
"global_step": 24000,
"eval_loss": 0.7904353141784668,
"eval_cosine_accuracy": 0.9538868069648743
},
{
"epoch": 1.6890794516988241,
"global_step": 26000,
"eval_loss": 0.7433677315711975,
"eval_cosine_accuracy": 0.9561078548431396
},
{
"epoch": 1.8190086402910413,
"global_step": 28000,
"eval_loss": 0.779238760471344,
"eval_cosine_accuracy": 0.9565309286117554
},
{
"epoch": 1.9489378288832586,
"global_step": 30000,
"eval_loss": 0.7882058024406433,
"eval_cosine_accuracy": 0.9578000903129578
},
{
"epoch": 2.078867017475476,
"global_step": 32000,
"eval_loss": 0.8047419786453247,
"eval_cosine_accuracy": 0.9568482041358948
},
{
"epoch": 2.208796206067693,
"global_step": 34000,
"eval_loss": 0.7193956971168518,
"eval_cosine_accuracy": 0.959280788898468
},
{
"epoch": 2.3387253946599103,
"global_step": 36000,
"eval_loss": 0.725292444229126,
"eval_cosine_accuracy": 0.9604442119598389
},
{
"epoch": 2.4686545832521274,
"global_step": 38000,
"eval_loss": 0.7545588612556458,
"eval_cosine_accuracy": 0.9617133736610413
},
{
"epoch": 2.598583771844345,
"global_step": 40000,
"eval_loss": 0.7361720204353333,
"eval_cosine_accuracy": 0.9620306491851807
},
{
"epoch": 2.728512960436562,
"global_step": 42000,
"eval_loss": 0.7261704206466675,
"eval_cosine_accuracy": 0.9628767967224121
},
{
"epoch": 2.8584421490287792,
"global_step": 44000,
"eval_loss": 0.7182765603065491,
"eval_cosine_accuracy": 0.96308833360672
},
{
"epoch": 2.988371337620997,
"global_step": 46000,
"eval_loss": 0.819146454334259,
"eval_cosine_accuracy": 0.9553675055503845
},
{
"epoch": 3.118300526213214,
"global_step": 48000,
"eval_loss": 0.7653650641441345,
"eval_cosine_accuracy": 0.9622421860694885
},
{
"epoch": 3.248229714805431,
"global_step": 50000,
"eval_loss": 0.7210116386413574,
"eval_cosine_accuracy": 0.9646747708320618
},
{
"epoch": 3.3781589033976482,
"global_step": 52000,
"eval_loss": 0.7164391875267029,
"eval_cosine_accuracy": 0.9627709984779358
},
{
"epoch": 3.5080880919898654,
"global_step": 54000,
"eval_loss": 0.6905584931373596,
"eval_cosine_accuracy": 0.9658381938934326
},
{
"epoch": 3.6380172805820825,
"global_step": 56000,
"eval_loss": 0.6991865634918213,
"eval_cosine_accuracy": 0.9643574953079224
},
{
"epoch": 3.7679464691743,
"global_step": 58000,
"eval_loss": 0.6876057386398315,
"eval_cosine_accuracy": 0.9658381938934326
},
{
"epoch": 3.8978756577665172,
"global_step": 60000,
"eval_loss": 0.6974127888679504,
"eval_cosine_accuracy": 0.9663670063018799
},
{
"epoch": 4.027804846358735,
"global_step": 62000,
"eval_loss": 0.7903416752815247,
"eval_cosine_accuracy": 0.9637228846549988
},
{
"epoch": 4.157734034950952,
"global_step": 64000,
"eval_loss": 0.702480673789978,
"eval_cosine_accuracy": 0.9673188924789429
},
{
"epoch": 4.287663223543169,
"global_step": 66000,
"eval_loss": 0.6973665952682495,
"eval_cosine_accuracy": 0.966155469417572
},
{
"epoch": 4.417592412135386,
"global_step": 68000,
"eval_loss": 0.7310513854026794,
"eval_cosine_accuracy": 0.9681649804115295
},
{
"epoch": 4.547521600727603,
"global_step": 70000,
"eval_loss": 0.7204111218452454,
"eval_cosine_accuracy": 0.9675304293632507
},
{
"epoch": 4.6774507893198205,
"global_step": 72000,
"eval_loss": 0.7272541522979736,
"eval_cosine_accuracy": 0.967107355594635
},
{
"epoch": 4.807379977912038,
"global_step": 74000,
"eval_loss": 0.6957398056983948,
"eval_cosine_accuracy": 0.969011127948761
},
{
"epoch": 4.937309166504255,
"global_step": 76000,
"eval_loss": 0.6990842819213867,
"eval_cosine_accuracy": 0.9691168665885925
}
],
"current_epoch": 5,
"global_step": 76965
}