savant_2_gsm8k / training_state.json
broadfield-dev's picture
Checkpoint for SFT at step 150
d793c11 verified
{
"phase": "SFT",
"epoch": 0,
"total_sft_steps": 150,
"metrics": [
{
"Step": 0,
"Metric": "SFT Loss",
"Value": 9.127131462097168
},
{
"Step": 1,
"Metric": "SFT Loss",
"Value": 9.107461929321289
},
{
"Step": 2,
"Metric": "SFT Loss",
"Value": 9.074987411499023
},
{
"Step": 3,
"Metric": "SFT Loss",
"Value": 9.083779335021973
},
{
"Step": 4,
"Metric": "SFT Loss",
"Value": 9.03738784790039
},
{
"Step": 5,
"Metric": "SFT Loss",
"Value": 9.083824157714844
},
{
"Step": 6,
"Metric": "SFT Loss",
"Value": 9.094654083251953
},
{
"Step": 7,
"Metric": "SFT Loss",
"Value": 9.067611694335938
},
{
"Step": 8,
"Metric": "SFT Loss",
"Value": 9.049128532409668
},
{
"Step": 9,
"Metric": "SFT Loss",
"Value": 9.069461822509766
},
{
"Step": 10,
"Metric": "SFT Loss",
"Value": 9.0612154006958
},
{
"Step": 11,
"Metric": "SFT Loss",
"Value": 9.047734260559082
},
{
"Step": 12,
"Metric": "SFT Loss",
"Value": 9.025179862976074
},
{
"Step": 13,
"Metric": "SFT Loss",
"Value": 9.02020263671875
},
{
"Step": 14,
"Metric": "SFT Loss",
"Value": 9.085907936096191
},
{
"Step": 15,
"Metric": "SFT Loss",
"Value": 9.057311058044434
},
{
"Step": 16,
"Metric": "SFT Loss",
"Value": 8.991851806640625
},
{
"Step": 17,
"Metric": "SFT Loss",
"Value": 8.948450088500977
},
{
"Step": 18,
"Metric": "SFT Loss",
"Value": 8.989174842834473
},
{
"Step": 19,
"Metric": "SFT Loss",
"Value": 9.006205558776855
},
{
"Step": 20,
"Metric": "SFT Loss",
"Value": 8.955092430114746
},
{
"Step": 21,
"Metric": "SFT Loss",
"Value": 8.959745407104492
},
{
"Step": 22,
"Metric": "SFT Loss",
"Value": 8.956381797790527
},
{
"Step": 23,
"Metric": "SFT Loss",
"Value": 8.943069458007812
},
{
"Step": 24,
"Metric": "SFT Loss",
"Value": 8.898037910461426
},
{
"Step": 25,
"Metric": "SFT Loss",
"Value": 8.978178024291992
},
{
"Step": 26,
"Metric": "SFT Loss",
"Value": 8.877619743347168
},
{
"Step": 27,
"Metric": "SFT Loss",
"Value": 8.874868392944336
},
{
"Step": 28,
"Metric": "SFT Loss",
"Value": 8.931377410888672
},
{
"Step": 29,
"Metric": "SFT Loss",
"Value": 8.912647247314453
},
{
"Step": 30,
"Metric": "SFT Loss",
"Value": 8.896525382995605
},
{
"Step": 31,
"Metric": "SFT Loss",
"Value": 8.809622764587402
},
{
"Step": 32,
"Metric": "SFT Loss",
"Value": 8.76137638092041
},
{
"Step": 33,
"Metric": "SFT Loss",
"Value": 8.898188591003418
},
{
"Step": 34,
"Metric": "SFT Loss",
"Value": 8.899017333984375
},
{
"Step": 35,
"Metric": "SFT Loss",
"Value": 8.867911338806152
},
{
"Step": 36,
"Metric": "SFT Loss",
"Value": 8.834308624267578
},
{
"Step": 37,
"Metric": "SFT Loss",
"Value": 8.756689071655273
},
{
"Step": 38,
"Metric": "SFT Loss",
"Value": 8.833380699157715
},
{
"Step": 39,
"Metric": "SFT Loss",
"Value": 8.804695129394531
},
{
"Step": 40,
"Metric": "SFT Loss",
"Value": 8.767921447753906
},
{
"Step": 41,
"Metric": "SFT Loss",
"Value": 8.663383483886719
},
{
"Step": 42,
"Metric": "SFT Loss",
"Value": 8.690306663513184
},
{
"Step": 43,
"Metric": "SFT Loss",
"Value": 8.674437522888184
},
{
"Step": 44,
"Metric": "SFT Loss",
"Value": 8.72599983215332
},
{
"Step": 45,
"Metric": "SFT Loss",
"Value": 8.720040321350098
},
{
"Step": 46,
"Metric": "SFT Loss",
"Value": 8.727679252624512
},
{
"Step": 47,
"Metric": "SFT Loss",
"Value": 8.698738098144531
},
{
"Step": 48,
"Metric": "SFT Loss",
"Value": 8.704374313354492
},
{
"Step": 49,
"Metric": "SFT Loss",
"Value": 8.634883880615234
},
{
"Step": 50,
"Metric": "SFT Loss",
"Value": 8.672651290893555
},
{
"Step": 51,
"Metric": "SFT Loss",
"Value": 8.667613983154297
},
{
"Step": 52,
"Metric": "SFT Loss",
"Value": 8.698080062866211
},
{
"Step": 53,
"Metric": "SFT Loss",
"Value": 8.713942527770996
},
{
"Step": 54,
"Metric": "SFT Loss",
"Value": 8.65330696105957
},
{
"Step": 55,
"Metric": "SFT Loss",
"Value": 8.691088676452637
},
{
"Step": 56,
"Metric": "SFT Loss",
"Value": 8.542851448059082
},
{
"Step": 57,
"Metric": "SFT Loss",
"Value": 8.694014549255371
},
{
"Step": 58,
"Metric": "SFT Loss",
"Value": 8.689044952392578
},
{
"Step": 59,
"Metric": "SFT Loss",
"Value": 8.620987892150879
},
{
"Step": 60,
"Metric": "SFT Loss",
"Value": 8.475345611572266
},
{
"Step": 61,
"Metric": "SFT Loss",
"Value": 8.545315742492676
},
{
"Step": 62,
"Metric": "SFT Loss",
"Value": 8.515613555908203
},
{
"Step": 63,
"Metric": "SFT Loss",
"Value": 8.600582122802734
},
{
"Step": 64,
"Metric": "SFT Loss",
"Value": 8.494306564331055
},
{
"Step": 65,
"Metric": "SFT Loss",
"Value": 8.509326934814453
},
{
"Step": 66,
"Metric": "SFT Loss",
"Value": 8.454813957214355
},
{
"Step": 67,
"Metric": "SFT Loss",
"Value": 8.507712364196777
},
{
"Step": 68,
"Metric": "SFT Loss",
"Value": 8.528255462646484
},
{
"Step": 69,
"Metric": "SFT Loss",
"Value": 8.627915382385254
},
{
"Step": 70,
"Metric": "SFT Loss",
"Value": 8.469722747802734
},
{
"Step": 71,
"Metric": "SFT Loss",
"Value": 8.60826301574707
},
{
"Step": 72,
"Metric": "SFT Loss",
"Value": 8.50338077545166
},
{
"Step": 73,
"Metric": "SFT Loss",
"Value": 8.456791877746582
},
{
"Step": 74,
"Metric": "SFT Loss",
"Value": 8.538637161254883
},
{
"Step": 75,
"Metric": "SFT Loss",
"Value": 8.382216453552246
},
{
"Step": 76,
"Metric": "SFT Loss",
"Value": 8.414968490600586
},
{
"Step": 77,
"Metric": "SFT Loss",
"Value": 8.517200469970703
},
{
"Step": 78,
"Metric": "SFT Loss",
"Value": 8.457924842834473
},
{
"Step": 79,
"Metric": "SFT Loss",
"Value": 8.478180885314941
},
{
"Step": 80,
"Metric": "SFT Loss",
"Value": 8.513033866882324
},
{
"Step": 81,
"Metric": "SFT Loss",
"Value": 8.311726570129395
},
{
"Step": 82,
"Metric": "SFT Loss",
"Value": 8.349236488342285
},
{
"Step": 83,
"Metric": "SFT Loss",
"Value": 8.330142974853516
},
{
"Step": 84,
"Metric": "SFT Loss",
"Value": 8.462335586547852
},
{
"Step": 85,
"Metric": "SFT Loss",
"Value": 8.350343704223633
},
{
"Step": 86,
"Metric": "SFT Loss",
"Value": 8.472900390625
},
{
"Step": 87,
"Metric": "SFT Loss",
"Value": 8.307153701782227
},
{
"Step": 88,
"Metric": "SFT Loss",
"Value": 8.43564510345459
},
{
"Step": 89,
"Metric": "SFT Loss",
"Value": 8.356257438659668
},
{
"Step": 90,
"Metric": "SFT Loss",
"Value": 8.356173515319824
},
{
"Step": 91,
"Metric": "SFT Loss",
"Value": 8.416142463684082
},
{
"Step": 92,
"Metric": "SFT Loss",
"Value": 8.21868896484375
},
{
"Step": 93,
"Metric": "SFT Loss",
"Value": 8.2228364944458
},
{
"Step": 94,
"Metric": "SFT Loss",
"Value": 8.340263366699219
},
{
"Step": 95,
"Metric": "SFT Loss",
"Value": 8.186246871948242
},
{
"Step": 96,
"Metric": "SFT Loss",
"Value": 8.426435470581055
},
{
"Step": 97,
"Metric": "SFT Loss",
"Value": 8.297677993774414
},
{
"Step": 98,
"Metric": "SFT Loss",
"Value": 8.3098783493042
},
{
"Step": 99,
"Metric": "SFT Loss",
"Value": 8.25888442993164
},
{
"Step": 100,
"Metric": "SFT Loss",
"Value": 8.235538482666016
},
{
"Step": 101,
"Metric": "SFT Loss",
"Value": 8.270655632019043
},
{
"Step": 102,
"Metric": "SFT Loss",
"Value": 8.269576072692871
},
{
"Step": 103,
"Metric": "SFT Loss",
"Value": 8.274468421936035
},
{
"Step": 104,
"Metric": "SFT Loss",
"Value": 8.309279441833496
},
{
"Step": 105,
"Metric": "SFT Loss",
"Value": 8.239542961120605
},
{
"Step": 106,
"Metric": "SFT Loss",
"Value": 8.188124656677246
},
{
"Step": 107,
"Metric": "SFT Loss",
"Value": 8.163637161254883
},
{
"Step": 108,
"Metric": "SFT Loss",
"Value": 8.162602424621582
},
{
"Step": 109,
"Metric": "SFT Loss",
"Value": 8.176586151123047
},
{
"Step": 110,
"Metric": "SFT Loss",
"Value": 8.174212455749512
},
{
"Step": 111,
"Metric": "SFT Loss",
"Value": 8.19734001159668
},
{
"Step": 112,
"Metric": "SFT Loss",
"Value": 8.076298713684082
},
{
"Step": 113,
"Metric": "SFT Loss",
"Value": 8.18896770477295
},
{
"Step": 114,
"Metric": "SFT Loss",
"Value": 8.258679389953613
},
{
"Step": 115,
"Metric": "SFT Loss",
"Value": 8.18835735321045
},
{
"Step": 116,
"Metric": "SFT Loss",
"Value": 8.127300262451172
},
{
"Step": 117,
"Metric": "SFT Loss",
"Value": 8.145550727844238
},
{
"Step": 118,
"Metric": "SFT Loss",
"Value": 8.09005069732666
},
{
"Step": 119,
"Metric": "SFT Loss",
"Value": 7.936030387878418
},
{
"Step": 120,
"Metric": "SFT Loss",
"Value": 8.104690551757812
},
{
"Step": 121,
"Metric": "SFT Loss",
"Value": 8.058869361877441
},
{
"Step": 122,
"Metric": "SFT Loss",
"Value": 8.058721542358398
},
{
"Step": 123,
"Metric": "SFT Loss",
"Value": 7.885481357574463
},
{
"Step": 124,
"Metric": "SFT Loss",
"Value": 8.024746894836426
},
{
"Step": 125,
"Metric": "SFT Loss",
"Value": 8.017570495605469
},
{
"Step": 126,
"Metric": "SFT Loss",
"Value": 8.01369571685791
},
{
"Step": 127,
"Metric": "SFT Loss",
"Value": 7.956777572631836
},
{
"Step": 128,
"Metric": "SFT Loss",
"Value": 8.059258460998535
},
{
"Step": 129,
"Metric": "SFT Loss",
"Value": 8.099721908569336
},
{
"Step": 130,
"Metric": "SFT Loss",
"Value": 7.995508193969727
},
{
"Step": 131,
"Metric": "SFT Loss",
"Value": 7.869641304016113
},
{
"Step": 132,
"Metric": "SFT Loss",
"Value": 7.967761993408203
},
{
"Step": 133,
"Metric": "SFT Loss",
"Value": 8.04328441619873
},
{
"Step": 134,
"Metric": "SFT Loss",
"Value": 7.801205158233643
},
{
"Step": 135,
"Metric": "SFT Loss",
"Value": 7.971508979797363
},
{
"Step": 136,
"Metric": "SFT Loss",
"Value": 7.872110843658447
},
{
"Step": 137,
"Metric": "SFT Loss",
"Value": 8.073846817016602
},
{
"Step": 138,
"Metric": "SFT Loss",
"Value": 7.676604270935059
},
{
"Step": 139,
"Metric": "SFT Loss",
"Value": 7.913880825042725
},
{
"Step": 140,
"Metric": "SFT Loss",
"Value": 8.005086898803711
},
{
"Step": 141,
"Metric": "SFT Loss",
"Value": 7.983025074005127
},
{
"Step": 142,
"Metric": "SFT Loss",
"Value": 7.844381809234619
},
{
"Step": 143,
"Metric": "SFT Loss",
"Value": 7.966534614562988
},
{
"Step": 144,
"Metric": "SFT Loss",
"Value": 7.799246311187744
},
{
"Step": 145,
"Metric": "SFT Loss",
"Value": 7.769224166870117
},
{
"Step": 146,
"Metric": "SFT Loss",
"Value": 7.8659234046936035
},
{
"Step": 147,
"Metric": "SFT Loss",
"Value": 7.893615245819092
},
{
"Step": 148,
"Metric": "SFT Loss",
"Value": 7.57839822769165
},
{
"Step": 149,
"Metric": "SFT Loss",
"Value": 7.796144485473633
},
{
"Step": 150,
"Metric": "SFT Loss",
"Value": 7.760519504547119
}
],
"sft_complete": false
}