llama-30b-comma_separated_input / training_logs.json
joshuaclymer's picture
Upload folder using huggingface_hub
4ddb85a
Invalid JSON:Unexpected token ':', ..."accuracy"::0.77, "... is not valid JSON
[
{
"loss": 0.7419,
"learning_rate": 0.0002,
"epoch": 0.02,
"step": 1
},
{
"loss": 0.7104,
"learning_rate": 0.0002,
"epoch": 0.04,
"step": 2
},
{
"loss": 0.6951,
"learning_rate": 0.0002,
"epoch": 0.05,
"step": 3
},
{
"loss": 0.6797,
"learning_rate": 0.0002,
"epoch": 0.07,
"step": 4
},
{
"loss": 0.6777,
"learning_rate": 0.0002,
"epoch": 0.09,
"step": 5
},
{
"loss": 0.6727,
"learning_rate": 0.0002,
"epoch": 0.11,
"step": 6
},
{
"loss": 0.6902,
"learning_rate": 0.0002,
"epoch": 0.12,
"step": 7
},
{
"loss": 0.644,
"learning_rate": 0.0002,
"epoch": 0.14,
"step": 8
},
{
"loss": 0.6332,
"learning_rate": 0.0002,
"epoch": 0.16,
"step": 9
},
{
"loss": 0.6259,
"learning_rate": 0.0002,
"epoch": 0.18,
"step": 10
},
{
"loss": 0.5662,
"learning_rate": 0.0002,
"epoch": 0.19,
"step": 11
},
{
"loss": 0.4973,
"learning_rate": 0.0002,
"epoch": 0.21,
"step": 12
},
{
"loss": 0.4677,
"learning_rate": 0.0002,
"epoch": 0.23,
"step": 13
},
{
"loss": 0.3896,
"learning_rate": 0.0002,
"epoch": 0.25,
"step": 14
},
{
"loss": 0.5832,
"learning_rate": 0.0002,
"epoch": 0.26,
"step": 15
},
{
"loss": 0.2747,
"learning_rate": 0.0002,
"epoch": 0.28,
"step": 16
},
{
"loss": 0.3438,
"learning_rate": 0.0002,
"epoch": 0.3,
"step": 17
},
{
"loss": 0.2304,
"learning_rate": 0.0002,
"epoch": 0.32,
"step": 18
},
{
"loss": 0.2208,
"learning_rate": 0.0002,
"epoch": 0.33,
"step": 19
},
{
"loss": 0.3179,
"learning_rate": 0.0002,
"epoch": 0.35,
"step": 20
},
{
"loss": 0.3831,
"learning_rate": 0.0002,
"epoch": 0.37,
"step": 21
},
{
"loss": 0.3274,
"learning_rate": 0.0002,
"epoch": 0.39,
"step": 22
},
{
"loss": 0.3322,
"learning_rate": 0.0002,
"epoch": 0.4,
"step": 23
},
{
"loss": 0.1843,
"learning_rate": 0.0002,
"epoch": 0.42,
"step": 24
},
{
"loss": 0.3792,
"learning_rate": 0.0002,
"epoch": 0.44,
"step": 25
},
{
"eval_comma_separated_input_loss": 0.47381076216697693,
"eval_comma_separated_input_score": -0.14903230965137482,
"eval_comma_separated_input_brier_score": 0.14903230965137482,
"eval_comma_separated_input_average_probability": 0.739839494228363,
"eval_comma_separated_input_accuracy": 0.76,
"eval_comma_separated_input_probabilities": [
0.5057103037834167,
0.7926411032676697,
0.8395572304725647,
0.8750540614128113,
0.6638176441192627,
0.3412554860115051,
0.8521225452423096,
0.7427878975868225,
0.48845282196998596,
0.9979581832885742,
0.9965298771858215,
0.9844328165054321,
0.4072255790233612,
0.4754917323589325,
0.2266879379749298,
0.9544909000396729,
0.9932397603988647,
0.9822323322296143,
0.9549546241760254,
0.9956372380256653,
0.8111849427223206,
0.6678183674812317,
0.9605175256729126,
0.6721541285514832,
0.9995113611221313,
0.9995362758636475,
0.9969425797462463,
0.7482375502586365,
0.978789746761322,
0.9411532282829285,
0.8092716336250305,
0.5804548263549805,
0.8987478613853455,
0.9926584362983704,
0.9968037605285645,
0.9899746775627136,
0.5884284973144531,
0.6909584999084473,
0.7130376100540161,
0.984264612197876,
0.8204785585403442,
0.6899394392967224,
0.7373196482658386,
0.5578603148460388,
0.4814424216747284,
0.9995312690734863,
0.9998726844787598,
0.9916493892669678,
0.9987574815750122,
0.8930770754814148,
0.9631037712097168,
0.9723063707351685,
0.867325484752655,
0.8623606562614441,
0.9999880790710449,
0.9999451637268066,
0.999957799911499,
0.3165142834186554,
0.5785897970199585,
0.4601801335811615,
0.9999808073043823,
0.9999685287475586,
0.9999656677246094,
0.3123607933521271,
0.3744247555732727,
0.27252867817878723,
0.9987949132919312,
0.9992828965187073,
0.9993246793746948,
0.5784086585044861,
0.15536504983901978,
0.23488140106201172,
0.14060163497924805,
0.11246518045663834,
0.3872424066066742,
0.9960883855819702,
0.9901509284973145,
0.9042060375213623,
0.010595398023724556,
0.019154399633407593,
0.10093849897384644,
0.6121878623962402,
0.4093835949897766,
0.6347980499267578,
0.992620050907135,
0.7581243515014648,
0.9930395483970642,
0.374697744846344,
0.3880426585674286,
0.37667402625083923,
0.751455545425415,
0.6910660862922668,
0.4043519198894501,
0.9727478623390198,
0.9151681661605835,
0.9926292896270752,
0.9967435598373413,
0.8987772464752197,
0.9539257884025574,
0.9998562335968018
],
"eval_comma_separated_input_runtime": 78.0564,
"eval_comma_separated_input_samples_per_second": 1.281,
"eval_comma_separated_input_steps_per_second": 0.051,
"epoch": 0.44,
"step": 25
},
{
"loss": 0.326,
"learning_rate": 0.0002,
"epoch": 0.46,
"step": 26
},
{
"loss": 0.5505,
"learning_rate": 0.0002,
"epoch": 0.47,
"step": 27
},
{
"loss": 0.254,
"learning_rate": 0.0002,
"epoch": 0.49,
"step": 28
},
{
"loss": 0.3024,
"learning_rate": 0.0002,
"epoch": 0.51,
"step": 29
},
{
"loss": 0.1145,
"learning_rate": 0.0002,
"epoch": 0.53,
"step": 30
},
{
"loss": 0.2487,
"learning_rate": 0.0002,
"epoch": 0.54,
"step": 31
},
{
"loss": 0.2536,
"learning_rate": 0.0002,
"epoch": 0.56,
"step": 32
},
{
"loss": 0.2752,
"learning_rate": 0.0002,
"epoch": 0.58,
"step": 33
},
{
"loss": 0.2864,
"learning_rate": 0.0002,
"epoch": 0.6,
"step": 34
},
{
"loss": 0.308,
"learning_rate": 0.0002,
"epoch": 0.61,
"step": 35
},
{
"loss": 0.2412,
"learning_rate": 0.0002,
"epoch": 0.63,
"step": 36
},
{
"loss": 0.4188,
"learning_rate": 0.0002,
"epoch": 0.65,
"step": 37
},
{
"loss": 0.3539,
"learning_rate": 0.0002,
"epoch": 0.67,
"step": 38
},
{
"loss": 0.4126,
"learning_rate": 0.0002,
"epoch": 0.68,
"step": 39
},
{
"loss": 0.2298,
"learning_rate": 0.0002,
"epoch": 0.7,
"step": 40
},
{
"loss": 0.1837,
"learning_rate": 0.0002,
"epoch": 0.72,
"step": 41
},
{
"loss": 0.2238,
"learning_rate": 0.0002,
"epoch": 0.74,
"step": 42
},
{
"loss": 0.3062,
"learning_rate": 0.0002,
"epoch": 0.75,
"step": 43
},
{
"loss": 0.3335,
"learning_rate": 0.0002,
"epoch": 0.77,
"step": 44
},
{
"loss": 0.128,
"learning_rate": 0.0002,
"epoch": 0.79,
"step": 45
},
{
"loss": 0.2156,
"learning_rate": 0.0002,
"epoch": 0.81,
"step": 46
},
{
"loss": 0.1373,
"learning_rate": 0.0002,
"epoch": 0.82,
"step": 47
},
{
"loss": 0.2333,
"learning_rate": 0.0002,
"epoch": 0.84,
"step": 48
},
{
"loss": 0.3292,
"learning_rate": 0.0002,
"epoch": 0.86,
"step": 49
},
{
"loss": 0.3278,
"learning_rate": 0.0002,
"epoch": 0.88,
"step": 50
},
{
"eval_comma_separated_input_loss": 0.447895348072052,
"eval_comma_separated_input_score": -0.14565807580947876,
"eval_comma_separated_input_brier_score": 0.14565807580947876,
"eval_comma_separated_input_average_probability": 0.7761557102203369,
"eval_comma_separated_input_accuracy": 0.77,
"eval_comma_separated_input_probabilities": [
0.4504460096359253,
0.7106965780258179,
0.7613977193832397,
0.27627503871917725,
0.1888580322265625,
0.36196234822273254,
0.9977447986602783,
0.9934731125831604,
0.9807383418083191,
0.9999233484268188,
0.9998125433921814,
0.9992616772651672,
0.42937251925468445,
0.35414958000183105,
0.3341814875602722,
0.9967638254165649,
0.9999350309371948,
0.9995962977409363,
0.9546691179275513,
0.9990658164024353,
0.99967360496521,
0.9045127034187317,
0.9956008195877075,
0.9143818020820618,
0.999998927116394,
0.9999983310699463,
0.999935507774353,
0.9908632636070251,
0.9999735355377197,
0.9989373087882996,
0.9830892086029053,
0.8966995477676392,
0.9865294694900513,
0.9999994039535522,
0.9999998807907104,
0.9999971389770508,
0.49074265360832214,
0.5514218211174011,
0.830772876739502,
0.9999492168426514,
0.8612533807754517,
0.9519673585891724,
0.9873406291007996,
0.8993487358093262,
0.8438679575920105,
0.9999995231628418,
0.9999996423721313,
0.9998364448547363,
0.999634861946106,
0.9831734299659729,
0.9952573180198669,
0.9982624650001526,
0.9984625577926636,
0.9621893167495728,
0.9999992847442627,
0.9999982118606567,
0.9999990463256836,
0.17832396924495697,
0.6987086534500122,
0.43089836835861206,
0.9999967813491821,
0.9999840259552002,
0.9999971389770508,
0.34186333417892456,
0.6733885407447815,
0.4354130029678345,
0.9825000762939453,
0.9815826416015625,
0.9878876209259033,
0.6807180047035217,
0.09687728434801102,
0.16909901797771454,
0.5602892637252808,
0.5863568186759949,
0.608674943447113,
0.9987614154815674,
0.997982382774353,
0.972231388092041,
0.02466653659939766,
0.0528080128133297,
0.2097661793231964,
0.9776371717453003,
0.5767873525619507,
0.9074500203132629,
0.9864820241928101,
0.5367009043693542,
0.9760178327560425,
0.06482303142547607,
0.1236090213060379,
0.1919964700937271,
0.3480866849422455,
0.38676121830940247,
0.15342266857624054,
0.9814541935920715,
0.9267071485519409,
0.9979047775268555,
0.9999786615371704,
0.9992477893829346,
0.9997554421424866,
0.9999927282333374
],
"eval_comma_separated_input_runtime": 78.026,
"eval_comma_separated_input_samples_per_second": 1.282,
"eval_comma_separated_input_steps_per_second": 0.051,
"epoch": 0.88,
"step": 50
},
{
"loss": 0.1712,
"learning_rate": 0.0002,
"epoch": 0.89,
"step": 51
},
{
"loss": 0.1149,
"learning_rate": 0.0002,
"epoch": 0.91,
"step": 52
},
{
"loss": 0.1877,
"learning_rate": 0.0002,
"epoch": 0.93,
"step": 53
},
{
"loss": 0.0817,
"learning_rate": 0.0002,
"epoch": 0.95,
"step": 54
},
{
"loss": 0.0424,
"learning_rate": 0.0002,
"epoch": 0.96,
"step": 55
},
{
"loss": 0.2838,
"learning_rate": 0.0002,
"epoch": 0.98,
"step": 56
},
{
"loss": 0.1558,
"learning_rate": 0.0002,
"epoch": 1.0,
"step": 57
},
{
"loss": 0.0269,
"learning_rate": 0.0002,
"epoch": 1.02,
"step": 58
},
{
"loss": 0.0916,
"learning_rate": 0.0002,
"epoch": 1.04,
"step": 59
},
{
"loss": 0.0162,
"learning_rate": 0.0002,
"epoch": 1.05,
"step": 60
},
{
"loss": 0.0182,
"learning_rate": 0.0002,
"epoch": 1.07,
"step": 61
},
{
"loss": 0.0505,
"learning_rate": 0.0002,
"epoch": 1.09,
"step": 62
},
{
"loss": 0.1672,
"learning_rate": 0.0002,
"epoch": 1.11,
"step": 63
},
{
"loss": 0.0078,
"learning_rate": 0.0002,
"epoch": 1.12,
"step": 64
},
{
"loss": 0.0239,
"learning_rate": 0.0002,
"epoch": 1.14,
"step": 65
},
{
"loss": 0.0042,
"learning_rate": 0.0002,
"epoch": 1.16,
"step": 66
},
{
"loss": 0.1157,
"learning_rate": 0.0002,
"epoch": 1.18,
"step": 67
},
{
"loss": 0.0367,
"learning_rate": 0.0002,
"epoch": 1.19,
"step": 68
},
{
"loss": 0.0054,
"learning_rate": 0.0002,
"epoch": 1.21,
"step": 69
},
{
"loss": 0.3269,
"learning_rate": 0.0002,
"epoch": 1.23,
"step": 70
},
{
"loss": 0.0053,
"learning_rate": 0.0002,
"epoch": 1.25,
"step": 71
},
{
"loss": 0.0093,
"learning_rate": 0.0002,
"epoch": 1.26,
"step": 72
},
{
"loss": 0.06,
"learning_rate": 0.0002,
"epoch": 1.28,
"step": 73
},
{
"loss": 0.0214,
"learning_rate": 0.0002,
"epoch": 1.3,
"step": 74
},
{
"loss": 0.064,
"learning_rate": 0.0002,
"epoch": 1.32,
"step": 75
},
{
"eval_comma_separated_input_loss": 0.6194826364517212,
"eval_comma_separated_input_score": -0.17542152106761932,
"eval_comma_separated_input_brier_score": 0.17542152106761932,
"eval_comma_separated_input_average_probability": 0.7849389910697937,
"eval_comma_separated_input_accuracy": 0.77,
"eval_comma_separated_input_probabilities": [
0.3327490985393524,
0.9519062042236328,
0.9847831130027771,
0.5636963844299316,
0.031850676983594894,
0.05631185695528984,
0.9998056292533875,
0.9995859265327454,
0.990744411945343,
1.0,
1.0,
1.0,
0.9468281865119934,
0.8348178863525391,
0.23293766379356384,
0.9999988079071045,
1.0,
1.0,
0.9999995231628418,
1.0,
1.0,
0.9823529124259949,
0.9999111890792847,
0.9437704086303711,
1.0,
1.0,
0.9999995231628418,
0.9999985694885254,
1.0,
0.9999997615814209,
0.9999955892562866,
0.9999785423278809,
0.9999979734420776,
1.0,
1.0,
1.0,
0.15389743447303772,
0.8275808095932007,
0.9833057522773743,
1.0,
0.9276348948478699,
0.9925111532211304,
0.9999544620513916,
0.9182303547859192,
0.5098273158073425,
1.0,
1.0,
0.9999983310699463,
1.0,
0.9999970197677612,
0.9999997615814209,
0.9999984502792358,
0.9999997615814209,
0.9999309778213501,
1.0,
1.0,
1.0,
0.1305040717124939,
0.9028104543685913,
0.21933555603027344,
0.9999996423721313,
0.9999996423721313,
0.9999997615814209,
0.059167250990867615,
0.2488248497247696,
0.06632068753242493,
0.9999988079071045,
0.9999992847442627,
0.9999998807907104,
0.9473620057106018,
0.26638561487197876,
0.07780053466558456,
0.11167240887880325,
0.0027452881913632154,
0.3228246569633484,
0.9999821186065674,
0.999972939491272,
0.9944614171981812,
0.03967156261205673,
0.20487765967845917,
0.9539350271224976,
0.9898837208747864,
0.9399700164794922,
0.9973479509353638,
0.9999980926513672,
0.9816005229949951,
0.9999972581863403,
0.011794282123446465,
0.002413914306089282,
0.05205608159303665,
0.3445022404193878,
0.4484536349773407,
0.01951614022254944,
0.9997747540473938,
0.9940212368965149,
0.9999996423721313,
0.9999850988388062,
0.9991033673286438,
0.9999384880065918,
1.0
],
"eval_comma_separated_input_runtime": 78.0706,
"eval_comma_separated_input_samples_per_second": 1.281,
"eval_comma_separated_input_steps_per_second": 0.051,
"epoch": 1.32,
"step": 75
},
{
"loss": 0.1843,
"learning_rate": 0.0002,
"epoch": 1.33,
"step": 76
},
{
"loss": 0.0102,
"learning_rate": 0.0002,
"epoch": 1.35,
"step": 77
},
{
"loss": 0.0016,
"learning_rate": 0.0002,
"epoch": 1.37,
"step": 78
},
{
"loss": 0.0847,
"learning_rate": 0.0002,
"epoch": 1.39,
"step": 79
},
{
"loss": 0.1682,
"learning_rate": 0.0002,
"epoch": 1.4,
"step": 80
},
{
"loss": 0.0202,
"learning_rate": 0.0002,
"epoch": 1.42,
"step": 81
},
{
"loss": 0.0717,
"learning_rate": 0.0002,
"epoch": 1.44,
"step": 82
},
{
"loss": 0.1845,
"learning_rate": 0.0002,
"epoch": 1.46,
"step": 83
},
{
"loss": 0.0604,
"learning_rate": 0.0002,
"epoch": 1.47,
"step": 84
},
{
"loss": 0.04,
"learning_rate": 0.0002,
"epoch": 1.49,
"step": 85
},
{
"loss": 0.1294,
"learning_rate": 0.0002,
"epoch": 1.51,
"step": 86
},
{
"loss": 0.0017,
"learning_rate": 0.0002,
"epoch": 1.53,
"step": 87
},
{
"loss": 0.0122,
"learning_rate": 0.0002,
"epoch": 1.54,
"step": 88
},
{
"loss": 0.1278,
"learning_rate": 0.0002,
"epoch": 1.56,
"step": 89
},
{
"loss": 0.0566,
"learning_rate": 0.0002,
"epoch": 1.58,
"step": 90
},
{
"loss": 0.0099,
"learning_rate": 0.0002,
"epoch": 1.6,
"step": 91
},
{
"loss": 0.0064,
"learning_rate": 0.0002,
"epoch": 1.61,
"step": 92
},
{
"loss": 0.0243,
"learning_rate": 0.0002,
"epoch": 1.63,
"step": 93
},
{
"loss": 0.0525,
"learning_rate": 0.0002,
"epoch": 1.65,
"step": 94
},
{
"loss": 0.0424,
"learning_rate": 0.0002,
"epoch": 1.67,
"step": 95
},
{
"loss": 0.0613,
"learning_rate": 0.0002,
"epoch": 1.68,
"step": 96
},
{
"loss": 0.0521,
"learning_rate": 0.0002,
"epoch": 1.7,
"step": 97
},
{
"loss": 0.0944,
"learning_rate": 0.0002,
"epoch": 1.72,
"step": 98
},
{
"loss": 0.0181,
"learning_rate": 0.0002,
"epoch": 1.74,
"step": 99
},
{
"loss": 0.0008,
"learning_rate": 0.0002,
"epoch": 1.75,
"step": 100
},
{
"eval_comma_separated_input_loss": 0.378570020198822,
"eval_comma_separated_input_score": -0.10282441228628159,
"eval_comma_separated_input_brier_score": 0.10282441228628159,
"eval_comma_separated_input_average_probability": 0.8461194038391113,
"eval_comma_separated_input_accuracy": 0.86,
"eval_comma_separated_input_probabilities": [
0.7394901514053345,
0.9556662440299988,
0.9631574153900146,
0.9448689818382263,
0.6851402521133423,
0.04673205316066742,
0.9999997615814209,
0.9999988079071045,
0.9999755620956421,
1.0,
1.0,
1.0,
0.8175366520881653,
0.5344929695129395,
0.40490445494651794,
0.9999028444290161,
0.9999998807907104,
0.9999815225601196,
0.9996824264526367,
0.9999032020568848,
0.9999306201934814,
0.9223772883415222,
0.9986610412597656,
0.9338085055351257,
1.0,
1.0,
0.9999598264694214,
0.9999997615814209,
1.0,
1.0,
0.9999829530715942,
0.9999233484268188,
0.9999957084655762,
1.0,
1.0,
1.0,
0.16704992949962616,
0.4352927505970001,
0.9530060291290283,
0.9999997615814209,
0.9648281931877136,
0.9776931405067444,
0.9999842643737793,
0.9146194458007812,
0.7172320485115051,
1.0,
0.9999998807907104,
0.9997580647468567,
1.0,
0.9999997615814209,
0.9999998807907104,
0.9999994039535522,
0.9999991655349731,
0.9998703002929688,
1.0,
1.0,
1.0,
0.43808406591415405,
0.5185633301734924,
0.47918856143951416,
1.0,
1.0,
1.0,
0.12787644565105438,
0.8206732273101807,
0.6153414845466614,
0.9999388456344604,
0.9996930360794067,
0.9999504089355469,
0.9787357449531555,
0.20235727727413177,
0.06822255253791809,
0.8611693978309631,
0.46712806820869446,
0.9312974810600281,
1.0,
0.9999998807907104,
0.9988490343093872,
0.7939100861549377,
0.995577335357666,
0.995972216129303,
0.830564022064209,
0.9511353969573975,
0.9778002500534058,
0.9999828338623047,
0.9291109442710876,
0.9999287128448486,
0.007030226290225983,
0.002356813522055745,
0.04530631750822067,
0.569308340549469,
0.7886270880699158,
0.15891966223716736,
0.9987874627113342,
0.9973487854003906,
0.9999998807907104,
0.9999572038650513,
0.9878588318824768,
0.999981164932251,
1.0
],
"eval_comma_separated_input_runtime": 78.0074,
"eval_comma_separated_input_samples_per_second": 1.282,
"eval_comma_separated_input_steps_per_second": 0.051,
"epoch": 1.75,
"step": 100
},
{
"train_runtime": 5582.1468,
"train_samples_per_second": 0.573,
"train_steps_per_second": 0.018,
"total_flos": 0.0,
"train_loss": 0.22866786144091747,
"epoch": 1.75,
"step": 100
}
]