llama-30b-code_easy / training_logs.json
joshuaclymer's picture
Upload folder using huggingface_hub
551e919
[
{
"loss": 0.6935,
"learning_rate": 0.0002,
"epoch": 0.02,
"step": 1
},
{
"loss": 0.6301,
"learning_rate": 0.0002,
"epoch": 0.04,
"step": 2
},
{
"loss": 0.6073,
"learning_rate": 0.0002,
"epoch": 0.05,
"step": 3
},
{
"loss": 0.5667,
"learning_rate": 0.0002,
"epoch": 0.07,
"step": 4
},
{
"loss": 0.4627,
"learning_rate": 0.0002,
"epoch": 0.09,
"step": 5
},
{
"loss": 0.4737,
"learning_rate": 0.0002,
"epoch": 0.11,
"step": 6
},
{
"loss": 0.3356,
"learning_rate": 0.0002,
"epoch": 0.12,
"step": 7
},
{
"loss": 0.27,
"learning_rate": 0.0002,
"epoch": 0.14,
"step": 8
},
{
"loss": 0.28,
"learning_rate": 0.0002,
"epoch": 0.16,
"step": 9
},
{
"loss": 0.3491,
"learning_rate": 0.0002,
"epoch": 0.18,
"step": 10
},
{
"loss": 0.2803,
"learning_rate": 0.0002,
"epoch": 0.19,
"step": 11
},
{
"loss": 0.1596,
"learning_rate": 0.0002,
"epoch": 0.21,
"step": 12
},
{
"loss": 0.1118,
"learning_rate": 0.0002,
"epoch": 0.23,
"step": 13
},
{
"loss": 0.2215,
"learning_rate": 0.0002,
"epoch": 0.25,
"step": 14
},
{
"loss": 0.0815,
"learning_rate": 0.0002,
"epoch": 0.26,
"step": 15
},
{
"loss": 0.1581,
"learning_rate": 0.0002,
"epoch": 0.28,
"step": 16
},
{
"loss": 0.1447,
"learning_rate": 0.0002,
"epoch": 0.3,
"step": 17
},
{
"loss": 0.0793,
"learning_rate": 0.0002,
"epoch": 0.32,
"step": 18
},
{
"loss": 0.0634,
"learning_rate": 0.0002,
"epoch": 0.33,
"step": 19
},
{
"loss": 0.0868,
"learning_rate": 0.0002,
"epoch": 0.35,
"step": 20
},
{
"loss": 0.1339,
"learning_rate": 0.0002,
"epoch": 0.37,
"step": 21
},
{
"loss": 0.0436,
"learning_rate": 0.0002,
"epoch": 0.39,
"step": 22
},
{
"loss": 0.0326,
"learning_rate": 0.0002,
"epoch": 0.4,
"step": 23
},
{
"loss": 0.0309,
"learning_rate": 0.0002,
"epoch": 0.42,
"step": 24
},
{
"loss": 0.4613,
"learning_rate": 0.0002,
"epoch": 0.44,
"step": 25
},
{
"eval_code_easy_loss": 0.22846165299415588,
"eval_code_easy_score": -0.034886911511421204,
"eval_code_easy_brier_score": 0.034886911511421204,
"eval_code_easy_average_probability": 0.9493436217308044,
"eval_code_easy_accuracy": 0.96,
"eval_code_easy_probabilities": [
1.0,
1.0,
0.9999986886978149,
0.9999988079071045,
0.9999972581863403,
0.9999972581863403,
0.8807934522628784,
0.9996591806411743,
1.0,
0.9997110962867737,
0.996894359588623,
0.9885761141777039,
0.9846639037132263,
0.9999998807907104,
0.9999992847442627,
0.9217069745063782,
0.9999998807907104,
0.9999992847442627,
0.9999531507492065,
0.971138596534729,
0.9644115567207336,
0.9999998807907104,
0.9999998807907104,
0.9999996423721313,
1.0,
1.0,
0.9992501139640808,
0.9999996423721313,
0.999998927116394,
0.9999997615814209,
0.9999358654022217,
0.9999948740005493,
0.9999706745147705,
0.9182361364364624,
0.9777969717979431,
0.7950476408004761,
0.07089971750974655,
0.9999998807907104,
0.9611170887947083,
0.999824583530426,
0.9999998807907104,
0.9999997615814209,
0.9999994039535522,
0.9999918937683105,
0.9999996423721313,
0.9999992847442627,
0.9999583959579468,
0.9999964237213135,
0.9999970197677612,
1.0,
0.9999992847442627,
0.7631391286849976,
0.9999997615814209,
0.9999998807907104,
1.0,
1.0,
1.0,
0.9999991655349731,
0.4372449815273285,
0.9999960660934448,
0.9999992847442627,
1.0,
0.989567220211029,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.6681390404701233,
1.02999701994122e-05,
0.0022490699775516987,
1.0,
1.0,
0.9999945163726807,
0.9999951124191284,
0.999752938747406,
0.9999997615814209,
1.0,
1.0,
1.0,
0.9668532013893127,
0.9999983310699463,
0.9879446029663086,
0.9999827146530151,
1.0,
0.9999997615814209,
0.9972673654556274,
0.9581230878829956,
0.9999821186065674,
0.9999935626983643,
0.7346240282058716,
0.9999959468841553,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999996423721313
],
"eval_code_easy_runtime": 41.4523,
"eval_code_easy_samples_per_second": 2.412,
"eval_code_easy_steps_per_second": 0.096,
"epoch": 0.44,
"step": 25
},
{
"eval_code_hard_loss": 0.8444641828536987,
"eval_code_hard_score": -0.21481266617774963,
"eval_code_hard_brier_score": 0.21481266617774963,
"eval_code_hard_average_probability": 0.6489911675453186,
"eval_code_hard_accuracy": 0.71,
"eval_code_hard_probabilities": [
0.9999761581420898,
0.4704570770263672,
0.38770198822021484,
0.9957898259162903,
0.9971027970314026,
0.6636011004447937,
0.3829995095729828,
0.4488725960254669,
0.3862934112548828,
0.4944641590118408,
0.6597261428833008,
0.5888834595680237,
0.9994460940361023,
0.00023105263244360685,
9.57881347858347e-05,
0.9383717179298401,
0.9582164287567139,
0.9960324168205261,
0.0013776113046333194,
0.004925197456032038,
0.0024418227840214968,
0.9448224306106567,
0.8293406367301941,
0.990691065788269,
0.6144397258758545,
0.37276336550712585,
0.7497667670249939,
0.9995079040527344,
0.8595492243766785,
0.8565853238105774,
0.9049152731895447,
0.842837393283844,
0.7425481081008911,
0.9970250725746155,
0.9908040761947632,
0.9856406450271606,
0.23333661258220673,
0.3644156754016876,
0.9999799728393555,
0.5256256461143494,
0.4714035987854004,
0.5990293622016907,
0.7481530904769897,
0.6265391111373901,
0.7847771644592285,
0.9998830556869507,
0.4729439914226532,
0.5146611332893372,
0.9899987578392029,
0.999963641166687,
0.9999411106109619,
0.017366401851177216,
0.25775712728500366,
0.9997989535331726,
0.2128974348306656,
0.27310115098953247,
0.6709675192832947,
0.5412147045135498,
0.5308579206466675,
0.5533190369606018,
0.11031078547239304,
0.0799262598156929,
0.12423858046531677,
0.6619316339492798,
0.6491618156433105,
0.9998986721038818,
0.5845221281051636,
0.9992774128913879,
0.7275769710540771,
0.9403572082519531,
0.9309749007225037,
0.871741771697998,
0.9114173650741577,
0.9771295189857483,
0.9557876586914062,
0.9182456135749817,
0.32342132925987244,
0.5013740062713623,
0.5234308242797852,
0.5439746975898743,
0.5095937252044678,
0.7398637533187866,
0.7255550026893616,
0.7406316995620728,
0.984710156917572,
0.9945735335350037,
0.9810420274734497,
0.5697446465492249,
0.6282893419265747,
0.6032753586769104,
0.40384215116500854,
0.26884448528289795,
0.45188671350479126,
0.6884511709213257,
0.4971124827861786,
0.6430377960205078,
0.6951863169670105,
0.8902100920677185,
0.13663697242736816,
0.9657577872276306
],
"eval_code_hard_runtime": 140.0766,
"eval_code_hard_samples_per_second": 0.714,
"eval_code_hard_steps_per_second": 0.029,
"epoch": 0.44,
"step": 25
},
{
"loss": 0.1113,
"learning_rate": 0.0002,
"epoch": 0.46,
"step": 26
},
{
"loss": 0.0564,
"learning_rate": 0.0002,
"epoch": 0.47,
"step": 27
},
{
"loss": 0.0685,
"learning_rate": 0.0002,
"epoch": 0.49,
"step": 28
},
{
"loss": 0.1366,
"learning_rate": 0.0002,
"epoch": 0.51,
"step": 29
},
{
"loss": 0.0012,
"learning_rate": 0.0002,
"epoch": 0.53,
"step": 30
},
{
"loss": 0.0288,
"learning_rate": 0.0002,
"epoch": 0.54,
"step": 31
},
{
"loss": 0.0287,
"learning_rate": 0.0002,
"epoch": 0.56,
"step": 32
},
{
"loss": 0.0668,
"learning_rate": 0.0002,
"epoch": 0.58,
"step": 33
},
{
"loss": 0.0054,
"learning_rate": 0.0002,
"epoch": 0.6,
"step": 34
},
{
"loss": 0.0058,
"learning_rate": 0.0002,
"epoch": 0.61,
"step": 35
},
{
"loss": 0.1321,
"learning_rate": 0.0002,
"epoch": 0.63,
"step": 36
},
{
"loss": 0.0438,
"learning_rate": 0.0002,
"epoch": 0.65,
"step": 37
},
{
"loss": 0.035,
"learning_rate": 0.0002,
"epoch": 0.67,
"step": 38
},
{
"loss": 0.03,
"learning_rate": 0.0002,
"epoch": 0.68,
"step": 39
},
{
"loss": 0.0043,
"learning_rate": 0.0002,
"epoch": 0.7,
"step": 40
},
{
"loss": 0.0158,
"learning_rate": 0.0002,
"epoch": 0.72,
"step": 41
},
{
"loss": 0.0097,
"learning_rate": 0.0002,
"epoch": 0.74,
"step": 42
},
{
"loss": 0.0104,
"learning_rate": 0.0002,
"epoch": 0.75,
"step": 43
},
{
"loss": 0.0854,
"learning_rate": 0.0002,
"epoch": 0.77,
"step": 44
},
{
"loss": 0.0115,
"learning_rate": 0.0002,
"epoch": 0.79,
"step": 45
},
{
"loss": 0.0903,
"learning_rate": 0.0002,
"epoch": 0.81,
"step": 46
},
{
"loss": 0.0082,
"learning_rate": 0.0002,
"epoch": 0.82,
"step": 47
},
{
"loss": 0.0841,
"learning_rate": 0.0002,
"epoch": 0.84,
"step": 48
},
{
"loss": 0.0379,
"learning_rate": 0.0002,
"epoch": 0.86,
"step": 49
},
{
"loss": 0.1163,
"learning_rate": 0.0002,
"epoch": 0.88,
"step": 50
},
{
"eval_code_easy_loss": 0.28712284564971924,
"eval_code_easy_score": -0.026069259271025658,
"eval_code_easy_brier_score": 0.026069259271025658,
"eval_code_easy_average_probability": 0.9709805250167847,
"eval_code_easy_accuracy": 0.97,
"eval_code_easy_probabilities": [
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999997615814209,
0.9602830410003662,
1.0,
1.0,
0.9999963045120239,
0.999914288520813,
0.9999732971191406,
0.9999974966049194,
1.0,
1.0,
0.9866946935653687,
1.0,
1.0,
0.9999997615814209,
0.9994608759880066,
0.9999551773071289,
1.0,
1.0,
1.0,
1.0,
1.0,
0.999995231628418,
0.9999997615814209,
0.9999998807907104,
1.0,
0.9999250173568726,
0.9999978542327881,
0.9999946355819702,
0.9998421669006348,
0.9999990463256836,
0.9997969269752502,
0.9818890690803528,
1.0,
0.9999922513961792,
0.9999998807907104,
0.9999998807907104,
0.9999998807907104,
1.0,
1.0,
1.0,
0.9997735619544983,
0.9998974800109863,
0.9999257326126099,
0.9999967813491821,
0.9999998807907104,
0.9999998807907104,
0.9922711849212646,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.223012313246727,
0.9999998807907104,
1.0,
1.0,
0.9999990463256836,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9665756225585938,
4.0422314384613856e-08,
4.318383798818104e-05,
1.0,
1.0,
1.0,
0.9998561143875122,
0.999182403087616,
0.9999680519104004,
1.0,
1.0,
1.0,
0.9999822378158569,
1.0,
1.0,
0.9959767460823059,
0.9999539852142334,
0.9995007514953613,
0.9999942779541016,
0.9996492862701416,
0.9998260140419006,
1.0,
0.9949652552604675,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0
],
"eval_code_easy_runtime": 41.3563,
"eval_code_easy_samples_per_second": 2.418,
"eval_code_easy_steps_per_second": 0.097,
"epoch": 0.88,
"step": 50
},
{
"eval_code_hard_loss": 0.9237764477729797,
"eval_code_hard_score": -0.20848987996578217,
"eval_code_hard_brier_score": 0.20848987996578217,
"eval_code_hard_average_probability": 0.683417558670044,
"eval_code_hard_accuracy": 0.71,
"eval_code_hard_probabilities": [
0.9991462230682373,
0.39208656549453735,
0.4176894426345825,
0.999220609664917,
0.9982213377952576,
0.9070152640342712,
0.15849868953227997,
0.28745439648628235,
0.3027569651603699,
0.24870805442333221,
0.7417134642601013,
0.5444478392601013,
0.9999140501022339,
0.0021548818331211805,
0.00024593042326159775,
0.9696754217147827,
0.9635093212127686,
0.9924002885818481,
0.00320712779648602,
0.004237341228872538,
0.000593981530983001,
0.9999964237213135,
0.9995344877243042,
0.999998927116394,
0.6726424098014832,
0.20489203929901123,
0.906218409538269,
0.1464991718530655,
0.8866965770721436,
0.9025827050209045,
0.9838942885398865,
0.9865344762802124,
0.4193040132522583,
0.9865899085998535,
0.9603983759880066,
0.958928644657135,
0.6753811240196228,
0.573758602142334,
0.6913469433784485,
0.3839159607887268,
0.42377495765686035,
0.9371411204338074,
0.997376561164856,
0.9381016492843628,
0.9976379871368408,
0.9994822144508362,
0.5902647376060486,
0.583461582660675,
0.9944129586219788,
0.9991785883903503,
0.9986459612846375,
0.012307150289416313,
0.8033295273780823,
0.9979121088981628,
0.00042291387217119336,
0.0005228969966992736,
0.00923232827335596,
0.7242734432220459,
0.6451666951179504,
0.7488073110580444,
0.3765398859977722,
0.14819785952568054,
0.39486005902290344,
0.6967870593070984,
0.8443142175674438,
0.9988842606544495,
0.9835836291313171,
0.9990014433860779,
0.9992020726203918,
0.9539203643798828,
0.9750897288322449,
0.850548267364502,
0.8060330152511597,
0.9476742744445801,
0.9418892860412598,
0.9725985527038574,
0.17615075409412384,
0.5268995761871338,
0.5463316440582275,
0.7340309023857117,
0.45826229453086853,
0.758548378944397,
0.9831669926643372,
0.8220421671867371,
0.9986447691917419,
0.9994031190872192,
0.9962872266769409,
0.7291285395622253,
0.8422561883926392,
0.7621178030967712,
0.4166759252548218,
0.4946196973323822,
0.4451850652694702,
0.7629806995391846,
0.7204477190971375,
0.7885748744010925,
0.6446090340614319,
0.8708204030990601,
0.32380175590515137,
0.9781871438026428
],
"eval_code_hard_runtime": 140.1048,
"eval_code_hard_samples_per_second": 0.714,
"eval_code_hard_steps_per_second": 0.029,
"epoch": 0.88,
"step": 50
},
{
"loss": 0.0203,
"learning_rate": 0.0002,
"epoch": 0.89,
"step": 51
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 0.91,
"step": 52
},
{
"loss": 0.0373,
"learning_rate": 0.0002,
"epoch": 0.93,
"step": 53
},
{
"loss": 0.2778,
"learning_rate": 0.0002,
"epoch": 0.95,
"step": 54
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 0.96,
"step": 55
},
{
"loss": 0.0011,
"learning_rate": 0.0002,
"epoch": 0.98,
"step": 56
},
{
"loss": 0.0148,
"learning_rate": 0.0002,
"epoch": 1.0,
"step": 57
},
{
"loss": 0.0051,
"learning_rate": 0.0002,
"epoch": 1.02,
"step": 58
},
{
"loss": 0.0092,
"learning_rate": 0.0002,
"epoch": 1.04,
"step": 59
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 1.05,
"step": 60
},
{
"loss": 0.1744,
"learning_rate": 0.0002,
"epoch": 1.07,
"step": 61
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 1.09,
"step": 62
},
{
"loss": 0.0018,
"learning_rate": 0.0002,
"epoch": 1.11,
"step": 63
},
{
"loss": 0.0078,
"learning_rate": 0.0002,
"epoch": 1.12,
"step": 64
},
{
"loss": 0.0121,
"learning_rate": 0.0002,
"epoch": 1.14,
"step": 65
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 1.16,
"step": 66
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 1.18,
"step": 67
},
{
"loss": 0.0188,
"learning_rate": 0.0002,
"epoch": 1.19,
"step": 68
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 1.21,
"step": 69
},
{
"loss": 0.0007,
"learning_rate": 0.0002,
"epoch": 1.23,
"step": 70
},
{
"loss": 0.0112,
"learning_rate": 0.0002,
"epoch": 1.25,
"step": 71
},
{
"loss": 0.0034,
"learning_rate": 0.0002,
"epoch": 1.26,
"step": 72
},
{
"loss": 0.0012,
"learning_rate": 0.0002,
"epoch": 1.28,
"step": 73
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.3,
"step": 74
},
{
"loss": 0.0246,
"learning_rate": 0.0002,
"epoch": 1.32,
"step": 75
},
{
"eval_code_easy_loss": 0.18898575007915497,
"eval_code_easy_score": -0.02407282404601574,
"eval_code_easy_brier_score": 0.02407282404601574,
"eval_code_easy_average_probability": 0.9731456637382507,
"eval_code_easy_accuracy": 0.97,
"eval_code_easy_probabilities": [
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9942795038223267,
0.9999982118606567,
1.0,
0.9999651908874512,
0.9998317956924438,
0.9999611377716064,
0.9999415874481201,
1.0,
1.0,
0.9984660148620605,
1.0,
1.0,
1.0,
0.9995312690734863,
0.9939040541648865,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999691247940063,
0.9999864101409912,
0.9999852180480957,
0.9999997615814209,
0.9999762773513794,
0.9999992847442627,
0.9999895095825195,
0.9994505047798157,
0.9999997615814209,
0.9999996423721313,
0.999316930770874,
1.0,
0.9999549388885498,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
0.9999998807907104,
0.9999992847442627,
0.9991188645362854,
0.9999963045120239,
1.0,
1.0,
1.0,
0.9998277425765991,
1.0,
1.0,
0.9999997615814209,
1.0,
1.0,
1.0,
0.3605167269706726,
1.0,
1.0,
1.0,
0.9999949932098389,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.97076416015625,
1.4138274309516419e-05,
0.001279860152862966,
1.0,
1.0,
1.0,
0.9999953508377075,
0.999148964881897,
0.9999984502792358,
1.0,
1.0,
1.0,
0.9999393224716187,
1.0,
1.0,
0.9999922513961792,
1.0,
0.9999986886978149,
0.9999806880950928,
0.9999102354049683,
0.9999845027923584,
1.0,
0.9995985627174377,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0
],
"eval_code_easy_runtime": 41.4851,
"eval_code_easy_samples_per_second": 2.411,
"eval_code_easy_steps_per_second": 0.096,
"epoch": 1.32,
"step": 75
},
{
"eval_code_hard_loss": 2.2544667720794678,
"eval_code_hard_score": -0.2460768073797226,
"eval_code_hard_brier_score": 0.2460768073797226,
"eval_code_hard_average_probability": 0.6746283173561096,
"eval_code_hard_accuracy": 0.71,
"eval_code_hard_probabilities": [
0.9999983310699463,
0.5661250948905945,
0.7090879678726196,
0.09080829471349716,
0.09405586123466492,
6.130974361440167e-05,
0.24737045168876648,
0.201746866106987,
0.3449346125125885,
0.14900989830493927,
0.7652262449264526,
0.5247918367385864,
0.9998658895492554,
1.7507378657910522e-08,
2.665373033394758e-09,
0.9900109171867371,
0.9922283291816711,
0.9896736145019531,
3.136615077892202e-06,
9.850871720118448e-06,
1.0493128002053709e-06,
0.9999830722808838,
0.9980818033218384,
0.999981164932251,
0.9334778189659119,
0.28829115629196167,
0.9874013066291809,
0.9867030382156372,
0.9521355032920837,
0.975749135017395,
0.9921451210975647,
0.998805046081543,
0.6474704742431641,
0.9896721839904785,
0.9654123783111572,
0.9551592469215393,
0.12296662479639053,
0.17879928648471832,
0.9942314624786377,
0.29071682691574097,
0.26718518137931824,
0.9962670207023621,
0.9932090640068054,
0.9184593558311462,
0.9924524426460266,
0.9999681711196899,
0.5355503559112549,
0.62375807762146,
0.9999186992645264,
0.9999804496765137,
0.9999536275863647,
0.0012312890030443668,
0.9840332865715027,
0.9999861717224121,
1.4762352407160506e-07,
1.6458953666642628e-07,
1.1647493920463603e-05,
0.6963649988174438,
0.5160571932792664,
0.5119415521621704,
2.806163301727338e-08,
6.523485085452307e-10,
1.9155359964884155e-08,
0.9288567304611206,
0.9914976954460144,
0.999998927116394,
0.9736488461494446,
0.9999374151229858,
0.9989074468612671,
0.9604309797286987,
0.9418864250183105,
0.9515325427055359,
0.9813504219055176,
0.9903180599212646,
0.9985818862915039,
0.9873167276382446,
0.12791942059993744,
0.40380606055259705,
0.5523675680160522,
0.7548352479934692,
0.46443045139312744,
0.9042721390724182,
0.9984411597251892,
0.9024229645729065,
0.9884786009788513,
0.9960446357727051,
0.940305769443512,
0.784172534942627,
0.862592339515686,
0.6879691481590271,
0.41794973611831665,
0.5900482535362244,
0.540920078754425,
0.8815944194793701,
0.8355022668838501,
0.9159291982650757,
0.8655431866645813,
0.9957410097122192,
0.4074825942516327,
0.9812780022621155
],
"eval_code_hard_runtime": 140.1017,
"eval_code_hard_samples_per_second": 0.714,
"eval_code_hard_steps_per_second": 0.029,
"epoch": 1.32,
"step": 75
},
{
"loss": 0.0063,
"learning_rate": 0.0002,
"epoch": 1.33,
"step": 76
},
{
"loss": 0.0109,
"learning_rate": 0.0002,
"epoch": 1.35,
"step": 77
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 1.37,
"step": 78
},
{
"loss": 0.0854,
"learning_rate": 0.0002,
"epoch": 1.39,
"step": 79
},
{
"loss": 0.0327,
"learning_rate": 0.0002,
"epoch": 1.4,
"step": 80
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 1.42,
"step": 81
},
{
"loss": 0.0705,
"learning_rate": 0.0002,
"epoch": 1.44,
"step": 82
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.46,
"step": 83
},
{
"loss": 0.0031,
"learning_rate": 0.0002,
"epoch": 1.47,
"step": 84
},
{
"loss": 0.0199,
"learning_rate": 0.0002,
"epoch": 1.49,
"step": 85
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.51,
"step": 86
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.53,
"step": 87
},
{
"loss": 0.0011,
"learning_rate": 0.0002,
"epoch": 1.54,
"step": 88
},
{
"loss": 0.237,
"learning_rate": 0.0002,
"epoch": 1.56,
"step": 89
},
{
"loss": 0.0064,
"learning_rate": 0.0002,
"epoch": 1.58,
"step": 90
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 1.6,
"step": 91
},
{
"loss": 0.0021,
"learning_rate": 0.0002,
"epoch": 1.61,
"step": 92
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 1.63,
"step": 93
},
{
"loss": 0.0019,
"learning_rate": 0.0002,
"epoch": 1.65,
"step": 94
},
{
"loss": 0.0009,
"learning_rate": 0.0002,
"epoch": 1.67,
"step": 95
},
{
"loss": 0.0009,
"learning_rate": 0.0002,
"epoch": 1.68,
"step": 96
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.7,
"step": 97
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.72,
"step": 98
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 1.74,
"step": 99
},
{
"loss": 0.0016,
"learning_rate": 0.0002,
"epoch": 1.75,
"step": 100
},
{
"eval_code_easy_loss": 0.25820469856262207,
"eval_code_easy_score": -0.020117390900850296,
"eval_code_easy_brier_score": 0.020117390900850296,
"eval_code_easy_average_probability": 0.9781191945075989,
"eval_code_easy_accuracy": 0.98,
"eval_code_easy_probabilities": [
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9856951832771301,
1.0,
1.0,
1.0,
0.9999998807907104,
0.9999998807907104,
0.8996143937110901,
1.0,
1.0,
0.9800459146499634,
1.0,
1.0,
1.0,
0.9999831914901733,
0.9999853372573853,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999538660049438,
0.9999998807907104,
1.0,
1.0,
0.9999990463256836,
1.0,
0.9999998807907104,
0.9980992674827576,
0.999997615814209,
0.9975267052650452,
0.9988257288932,
1.0,
0.9999734163284302,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999279975891113,
1.0,
1.0,
1.0,
1.0,
0.9663723707199097,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999686479568481,
1.0,
1.0,
1.0,
0.999997615814209,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9941490888595581,
9.479013840518746e-08,
7.865727820899338e-05,
1.0,
1.0,
1.0,
0.9999998807907104,
0.9985870122909546,
1.0,
1.0,
1.0,
1.0,
0.9996020197868347,
1.0,
1.0,
0.9999988079071045,
1.0,
0.9999998807907104,
0.9997178912162781,
0.9999922513961792,
0.9999991655349731,
1.0,
0.9938370585441589,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0
],
"eval_code_easy_runtime": 41.4766,
"eval_code_easy_samples_per_second": 2.411,
"eval_code_easy_steps_per_second": 0.096,
"epoch": 1.75,
"step": 100
},
{
"eval_code_hard_loss": 2.8355469703674316,
"eval_code_hard_score": -0.24508047103881836,
"eval_code_hard_brier_score": 0.24508047103881836,
"eval_code_hard_average_probability": 0.6834875345230103,
"eval_code_hard_accuracy": 0.71,
"eval_code_hard_probabilities": [
1.0,
0.49802687764167786,
0.7207960486412048,
0.01915053464472294,
0.022134896367788315,
4.0801442082738504e-05,
0.3737213611602783,
0.2865481376647949,
0.30831632018089294,
0.24947436153888702,
0.7978243231773376,
0.5949852466583252,
0.9999364614486694,
2.1756743628920105e-10,
2.9773794540943754e-11,
0.9936490654945374,
0.9942991733551025,
0.993448793888092,
3.583797980599712e-10,
3.8425835846567225e-09,
2.1109008985220612e-10,
0.9996128678321838,
0.9975799322128296,
0.9994070529937744,
0.9748783707618713,
0.47572091221809387,
0.996880054473877,
0.9991859793663025,
0.987097442150116,
0.9944655299186707,
0.9830182790756226,
0.995845377445221,
0.5017166137695312,
0.9952012300491333,
0.8540241122245789,
0.9487936496734619,
0.02690940722823143,
0.03413669392466545,
0.9999390840530396,
0.14402766525745392,
0.1746188849210739,
0.9748719930648804,
0.9814805388450623,
0.9264845848083496,
0.974022388458252,
0.9999991655349731,
0.7958990931510925,
0.6329552531242371,
0.9999284744262695,
0.9999613761901855,
0.9999935626983643,
8.354127930942923e-05,
0.9636399149894714,
0.999997615814209,
5.748397313709575e-10,
4.4799397524997175e-10,
1.1092028273651522e-07,
0.7891486883163452,
0.5943530797958374,
0.6597400307655334,
3.084578281686845e-08,
1.9499866998895499e-10,
7.682257319174823e-08,
0.988332211971283,
0.9993404746055603,
0.9999953508377075,
0.7918521761894226,
0.9975425004959106,
0.9782871603965759,
0.9723710417747498,
0.973602831363678,
0.9903439283370972,
0.9704287052154541,
0.9830175638198853,
0.9929106831550598,
0.9866513013839722,
0.16249682009220123,
0.3364860415458679,
0.5504053235054016,
0.8576055765151978,
0.5424798727035522,
0.9613667130470276,
0.9995546936988831,
0.8739398717880249,
0.9984847903251648,
0.9997493624687195,
0.980169951915741,
0.8975971341133118,
0.9636164903640747,
0.7637275457382202,
0.5357650518417358,
0.6792539358139038,
0.39096373319625854,
0.951950192451477,
0.8796238899230957,
0.9461458921432495,
0.7978929281234741,
0.991081178188324,
0.4479399621486664,
0.9878178834915161
],
"eval_code_hard_runtime": 140.1067,
"eval_code_hard_samples_per_second": 0.714,
"eval_code_hard_steps_per_second": 0.029,
"epoch": 1.75,
"step": 100
},
{
"train_runtime": 4333.8818,
"train_samples_per_second": 0.738,
"train_steps_per_second": 0.023,
"total_flos": 0.0,
"train_loss": 0.09087586780193589,
"epoch": 1.75,
"step": 100
}
]