[ { "loss": 0.7419, "learning_rate": 0.0002, "epoch": 0.02, "step": 1 }, { "loss": 0.7104, "learning_rate": 0.0002, "epoch": 0.04, "step": 2 }, { "loss": 0.6951, "learning_rate": 0.0002, "epoch": 0.05, "step": 3 }, { "loss": 0.6797, "learning_rate": 0.0002, "epoch": 0.07, "step": 4 }, { "loss": 0.6777, "learning_rate": 0.0002, "epoch": 0.09, "step": 5 }, { "loss": 0.6727, "learning_rate": 0.0002, "epoch": 0.11, "step": 6 }, { "loss": 0.6902, "learning_rate": 0.0002, "epoch": 0.12, "step": 7 }, { "loss": 0.644, "learning_rate": 0.0002, "epoch": 0.14, "step": 8 }, { "loss": 0.6332, "learning_rate": 0.0002, "epoch": 0.16, "step": 9 }, { "loss": 0.6259, "learning_rate": 0.0002, "epoch": 0.18, "step": 10 }, { "loss": 0.5662, "learning_rate": 0.0002, "epoch": 0.19, "step": 11 }, { "loss": 0.4973, "learning_rate": 0.0002, "epoch": 0.21, "step": 12 }, { "loss": 0.4677, "learning_rate": 0.0002, "epoch": 0.23, "step": 13 }, { "loss": 0.3896, "learning_rate": 0.0002, "epoch": 0.25, "step": 14 }, { "loss": 0.5832, "learning_rate": 0.0002, "epoch": 0.26, "step": 15 }, { "loss": 0.2747, "learning_rate": 0.0002, "epoch": 0.28, "step": 16 }, { "loss": 0.3438, "learning_rate": 0.0002, "epoch": 0.3, "step": 17 }, { "loss": 0.2304, "learning_rate": 0.0002, "epoch": 0.32, "step": 18 }, { "loss": 0.2208, "learning_rate": 0.0002, "epoch": 0.33, "step": 19 }, { "loss": 0.3179, "learning_rate": 0.0002, "epoch": 0.35, "step": 20 }, { "loss": 0.3831, "learning_rate": 0.0002, "epoch": 0.37, "step": 21 }, { "loss": 0.3274, "learning_rate": 0.0002, "epoch": 0.39, "step": 22 }, { "loss": 0.3322, "learning_rate": 0.0002, "epoch": 0.4, "step": 23 }, { "loss": 0.1843, "learning_rate": 0.0002, "epoch": 0.42, "step": 24 }, { "loss": 0.3792, "learning_rate": 0.0002, "epoch": 0.44, "step": 25 }, { "eval_comma_separated_input_loss": 0.47381076216697693, "eval_comma_separated_input_score": -0.14903230965137482, "eval_comma_separated_input_brier_score": 0.14903230965137482, 
"eval_comma_separated_input_average_probability": 0.739839494228363, "eval_comma_separated_input_accuracy": 0.76, "eval_comma_separated_input_probabilities": [ 0.5057103037834167, 0.7926411032676697, 0.8395572304725647, 0.8750540614128113, 0.6638176441192627, 0.3412554860115051, 0.8521225452423096, 0.7427878975868225, 0.48845282196998596, 0.9979581832885742, 0.9965298771858215, 0.9844328165054321, 0.4072255790233612, 0.4754917323589325, 0.2266879379749298, 0.9544909000396729, 0.9932397603988647, 0.9822323322296143, 0.9549546241760254, 0.9956372380256653, 0.8111849427223206, 0.6678183674812317, 0.9605175256729126, 0.6721541285514832, 0.9995113611221313, 0.9995362758636475, 0.9969425797462463, 0.7482375502586365, 0.978789746761322, 0.9411532282829285, 0.8092716336250305, 0.5804548263549805, 0.8987478613853455, 0.9926584362983704, 0.9968037605285645, 0.9899746775627136, 0.5884284973144531, 0.6909584999084473, 0.7130376100540161, 0.984264612197876, 0.8204785585403442, 0.6899394392967224, 0.7373196482658386, 0.5578603148460388, 0.4814424216747284, 0.9995312690734863, 0.9998726844787598, 0.9916493892669678, 0.9987574815750122, 0.8930770754814148, 0.9631037712097168, 0.9723063707351685, 0.867325484752655, 0.8623606562614441, 0.9999880790710449, 0.9999451637268066, 0.999957799911499, 0.3165142834186554, 0.5785897970199585, 0.4601801335811615, 0.9999808073043823, 0.9999685287475586, 0.9999656677246094, 0.3123607933521271, 0.3744247555732727, 0.27252867817878723, 0.9987949132919312, 0.9992828965187073, 0.9993246793746948, 0.5784086585044861, 0.15536504983901978, 0.23488140106201172, 0.14060163497924805, 0.11246518045663834, 0.3872424066066742, 0.9960883855819702, 0.9901509284973145, 0.9042060375213623, 0.010595398023724556, 0.019154399633407593, 0.10093849897384644, 0.6121878623962402, 0.4093835949897766, 0.6347980499267578, 0.992620050907135, 0.7581243515014648, 0.9930395483970642, 0.374697744846344, 0.3880426585674286, 0.37667402625083923, 0.751455545425415, 
0.6910660862922668, 0.4043519198894501, 0.9727478623390198, 0.9151681661605835, 0.9926292896270752, 0.9967435598373413, 0.8987772464752197, 0.9539257884025574, 0.9998562335968018 ], "eval_comma_separated_input_runtime": 78.0564, "eval_comma_separated_input_samples_per_second": 1.281, "eval_comma_separated_input_steps_per_second": 0.051, "epoch": 0.44, "step": 25 }, { "loss": 0.326, "learning_rate": 0.0002, "epoch": 0.46, "step": 26 }, { "loss": 0.5505, "learning_rate": 0.0002, "epoch": 0.47, "step": 27 }, { "loss": 0.254, "learning_rate": 0.0002, "epoch": 0.49, "step": 28 }, { "loss": 0.3024, "learning_rate": 0.0002, "epoch": 0.51, "step": 29 }, { "loss": 0.1145, "learning_rate": 0.0002, "epoch": 0.53, "step": 30 }, { "loss": 0.2487, "learning_rate": 0.0002, "epoch": 0.54, "step": 31 }, { "loss": 0.2536, "learning_rate": 0.0002, "epoch": 0.56, "step": 32 }, { "loss": 0.2752, "learning_rate": 0.0002, "epoch": 0.58, "step": 33 }, { "loss": 0.2864, "learning_rate": 0.0002, "epoch": 0.6, "step": 34 }, { "loss": 0.308, "learning_rate": 0.0002, "epoch": 0.61, "step": 35 }, { "loss": 0.2412, "learning_rate": 0.0002, "epoch": 0.63, "step": 36 }, { "loss": 0.4188, "learning_rate": 0.0002, "epoch": 0.65, "step": 37 }, { "loss": 0.3539, "learning_rate": 0.0002, "epoch": 0.67, "step": 38 }, { "loss": 0.4126, "learning_rate": 0.0002, "epoch": 0.68, "step": 39 }, { "loss": 0.2298, "learning_rate": 0.0002, "epoch": 0.7, "step": 40 }, { "loss": 0.1837, "learning_rate": 0.0002, "epoch": 0.72, "step": 41 }, { "loss": 0.2238, "learning_rate": 0.0002, "epoch": 0.74, "step": 42 }, { "loss": 0.3062, "learning_rate": 0.0002, "epoch": 0.75, "step": 43 }, { "loss": 0.3335, "learning_rate": 0.0002, "epoch": 0.77, "step": 44 }, { "loss": 0.128, "learning_rate": 0.0002, "epoch": 0.79, "step": 45 }, { "loss": 0.2156, "learning_rate": 0.0002, "epoch": 0.81, "step": 46 }, { "loss": 0.1373, "learning_rate": 0.0002, "epoch": 0.82, "step": 47 }, { "loss": 0.2333, "learning_rate": 0.0002, "epoch": 
0.84, "step": 48 }, { "loss": 0.3292, "learning_rate": 0.0002, "epoch": 0.86, "step": 49 }, { "loss": 0.3278, "learning_rate": 0.0002, "epoch": 0.88, "step": 50 }, { "eval_comma_separated_input_loss": 0.447895348072052, "eval_comma_separated_input_score": -0.14565807580947876, "eval_comma_separated_input_brier_score": 0.14565807580947876, "eval_comma_separated_input_average_probability": 0.7761557102203369, "eval_comma_separated_input_accuracy": 0.77, "eval_comma_separated_input_probabilities": [ 0.4504460096359253, 0.7106965780258179, 0.7613977193832397, 0.27627503871917725, 0.1888580322265625, 0.36196234822273254, 0.9977447986602783, 0.9934731125831604, 0.9807383418083191, 0.9999233484268188, 0.9998125433921814, 0.9992616772651672, 0.42937251925468445, 0.35414958000183105, 0.3341814875602722, 0.9967638254165649, 0.9999350309371948, 0.9995962977409363, 0.9546691179275513, 0.9990658164024353, 0.99967360496521, 0.9045127034187317, 0.9956008195877075, 0.9143818020820618, 0.999998927116394, 0.9999983310699463, 0.999935507774353, 0.9908632636070251, 0.9999735355377197, 0.9989373087882996, 0.9830892086029053, 0.8966995477676392, 0.9865294694900513, 0.9999994039535522, 0.9999998807907104, 0.9999971389770508, 0.49074265360832214, 0.5514218211174011, 0.830772876739502, 0.9999492168426514, 0.8612533807754517, 0.9519673585891724, 0.9873406291007996, 0.8993487358093262, 0.8438679575920105, 0.9999995231628418, 0.9999996423721313, 0.9998364448547363, 0.999634861946106, 0.9831734299659729, 0.9952573180198669, 0.9982624650001526, 0.9984625577926636, 0.9621893167495728, 0.9999992847442627, 0.9999982118606567, 0.9999990463256836, 0.17832396924495697, 0.6987086534500122, 0.43089836835861206, 0.9999967813491821, 0.9999840259552002, 0.9999971389770508, 0.34186333417892456, 0.6733885407447815, 0.4354130029678345, 0.9825000762939453, 0.9815826416015625, 0.9878876209259033, 0.6807180047035217, 0.09687728434801102, 0.16909901797771454, 0.5602892637252808, 0.5863568186759949, 
0.608674943447113, 0.9987614154815674, 0.997982382774353, 0.972231388092041, 0.02466653659939766, 0.0528080128133297, 0.2097661793231964, 0.9776371717453003, 0.5767873525619507, 0.9074500203132629, 0.9864820241928101, 0.5367009043693542, 0.9760178327560425, 0.06482303142547607, 0.1236090213060379, 0.1919964700937271, 0.3480866849422455, 0.38676121830940247, 0.15342266857624054, 0.9814541935920715, 0.9267071485519409, 0.9979047775268555, 0.9999786615371704, 0.9992477893829346, 0.9997554421424866, 0.9999927282333374 ], "eval_comma_separated_input_runtime": 78.026, "eval_comma_separated_input_samples_per_second": 1.282, "eval_comma_separated_input_steps_per_second": 0.051, "epoch": 0.88, "step": 50 }, { "loss": 0.1712, "learning_rate": 0.0002, "epoch": 0.89, "step": 51 }, { "loss": 0.1149, "learning_rate": 0.0002, "epoch": 0.91, "step": 52 }, { "loss": 0.1877, "learning_rate": 0.0002, "epoch": 0.93, "step": 53 }, { "loss": 0.0817, "learning_rate": 0.0002, "epoch": 0.95, "step": 54 }, { "loss": 0.0424, "learning_rate": 0.0002, "epoch": 0.96, "step": 55 }, { "loss": 0.2838, "learning_rate": 0.0002, "epoch": 0.98, "step": 56 }, { "loss": 0.1558, "learning_rate": 0.0002, "epoch": 1.0, "step": 57 }, { "loss": 0.0269, "learning_rate": 0.0002, "epoch": 1.02, "step": 58 }, { "loss": 0.0916, "learning_rate": 0.0002, "epoch": 1.04, "step": 59 }, { "loss": 0.0162, "learning_rate": 0.0002, "epoch": 1.05, "step": 60 }, { "loss": 0.0182, "learning_rate": 0.0002, "epoch": 1.07, "step": 61 }, { "loss": 0.0505, "learning_rate": 0.0002, "epoch": 1.09, "step": 62 }, { "loss": 0.1672, "learning_rate": 0.0002, "epoch": 1.11, "step": 63 }, { "loss": 0.0078, "learning_rate": 0.0002, "epoch": 1.12, "step": 64 }, { "loss": 0.0239, "learning_rate": 0.0002, "epoch": 1.14, "step": 65 }, { "loss": 0.0042, "learning_rate": 0.0002, "epoch": 1.16, "step": 66 }, { "loss": 0.1157, "learning_rate": 0.0002, "epoch": 1.18, "step": 67 }, { "loss": 0.0367, "learning_rate": 0.0002, "epoch": 1.19, "step": 68 
}, { "loss": 0.0054, "learning_rate": 0.0002, "epoch": 1.21, "step": 69 }, { "loss": 0.3269, "learning_rate": 0.0002, "epoch": 1.23, "step": 70 }, { "loss": 0.0053, "learning_rate": 0.0002, "epoch": 1.25, "step": 71 }, { "loss": 0.0093, "learning_rate": 0.0002, "epoch": 1.26, "step": 72 }, { "loss": 0.06, "learning_rate": 0.0002, "epoch": 1.28, "step": 73 }, { "loss": 0.0214, "learning_rate": 0.0002, "epoch": 1.3, "step": 74 }, { "loss": 0.064, "learning_rate": 0.0002, "epoch": 1.32, "step": 75 }, { "eval_comma_separated_input_loss": 0.6194826364517212, "eval_comma_separated_input_score": -0.17542152106761932, "eval_comma_separated_input_brier_score": 0.17542152106761932, "eval_comma_separated_input_average_probability": 0.7849389910697937, "eval_comma_separated_input_accuracy": 0.77, "eval_comma_separated_input_probabilities": [ 0.3327490985393524, 0.9519062042236328, 0.9847831130027771, 0.5636963844299316, 0.031850676983594894, 0.05631185695528984, 0.9998056292533875, 0.9995859265327454, 0.990744411945343, 1.0, 1.0, 1.0, 0.9468281865119934, 0.8348178863525391, 0.23293766379356384, 0.9999988079071045, 1.0, 1.0, 0.9999995231628418, 1.0, 1.0, 0.9823529124259949, 0.9999111890792847, 0.9437704086303711, 1.0, 1.0, 0.9999995231628418, 0.9999985694885254, 1.0, 0.9999997615814209, 0.9999955892562866, 0.9999785423278809, 0.9999979734420776, 1.0, 1.0, 1.0, 0.15389743447303772, 0.8275808095932007, 0.9833057522773743, 1.0, 0.9276348948478699, 0.9925111532211304, 0.9999544620513916, 0.9182303547859192, 0.5098273158073425, 1.0, 1.0, 0.9999983310699463, 1.0, 0.9999970197677612, 0.9999997615814209, 0.9999984502792358, 0.9999997615814209, 0.9999309778213501, 1.0, 1.0, 1.0, 0.1305040717124939, 0.9028104543685913, 0.21933555603027344, 0.9999996423721313, 0.9999996423721313, 0.9999997615814209, 0.059167250990867615, 0.2488248497247696, 0.06632068753242493, 0.9999988079071045, 0.9999992847442627, 0.9999998807907104, 0.9473620057106018, 0.26638561487197876, 0.07780053466558456, 
0.11167240887880325, 0.0027452881913632154, 0.3228246569633484, 0.9999821186065674, 0.999972939491272, 0.9944614171981812, 0.03967156261205673, 0.20487765967845917, 0.9539350271224976, 0.9898837208747864, 0.9399700164794922, 0.9973479509353638, 0.9999980926513672, 0.9816005229949951, 0.9999972581863403, 0.011794282123446465, 0.002413914306089282, 0.05205608159303665, 0.3445022404193878, 0.4484536349773407, 0.01951614022254944, 0.9997747540473938, 0.9940212368965149, 0.9999996423721313, 0.9999850988388062, 0.9991033673286438, 0.9999384880065918, 1.0 ], "eval_comma_separated_input_runtime": 78.0706, "eval_comma_separated_input_samples_per_second": 1.281, "eval_comma_separated_input_steps_per_second": 0.051, "epoch": 1.32, "step": 75 }, { "loss": 0.1843, "learning_rate": 0.0002, "epoch": 1.33, "step": 76 }, { "loss": 0.0102, "learning_rate": 0.0002, "epoch": 1.35, "step": 77 }, { "loss": 0.0016, "learning_rate": 0.0002, "epoch": 1.37, "step": 78 }, { "loss": 0.0847, "learning_rate": 0.0002, "epoch": 1.39, "step": 79 }, { "loss": 0.1682, "learning_rate": 0.0002, "epoch": 1.4, "step": 80 }, { "loss": 0.0202, "learning_rate": 0.0002, "epoch": 1.42, "step": 81 }, { "loss": 0.0717, "learning_rate": 0.0002, "epoch": 1.44, "step": 82 }, { "loss": 0.1845, "learning_rate": 0.0002, "epoch": 1.46, "step": 83 }, { "loss": 0.0604, "learning_rate": 0.0002, "epoch": 1.47, "step": 84 }, { "loss": 0.04, "learning_rate": 0.0002, "epoch": 1.49, "step": 85 }, { "loss": 0.1294, "learning_rate": 0.0002, "epoch": 1.51, "step": 86 }, { "loss": 0.0017, "learning_rate": 0.0002, "epoch": 1.53, "step": 87 }, { "loss": 0.0122, "learning_rate": 0.0002, "epoch": 1.54, "step": 88 }, { "loss": 0.1278, "learning_rate": 0.0002, "epoch": 1.56, "step": 89 }, { "loss": 0.0566, "learning_rate": 0.0002, "epoch": 1.58, "step": 90 }, { "loss": 0.0099, "learning_rate": 0.0002, "epoch": 1.6, "step": 91 }, { "loss": 0.0064, "learning_rate": 0.0002, "epoch": 1.61, "step": 92 }, { "loss": 0.0243, "learning_rate": 
0.0002, "epoch": 1.63, "step": 93 }, { "loss": 0.0525, "learning_rate": 0.0002, "epoch": 1.65, "step": 94 }, { "loss": 0.0424, "learning_rate": 0.0002, "epoch": 1.67, "step": 95 }, { "loss": 0.0613, "learning_rate": 0.0002, "epoch": 1.68, "step": 96 }, { "loss": 0.0521, "learning_rate": 0.0002, "epoch": 1.7, "step": 97 }, { "loss": 0.0944, "learning_rate": 0.0002, "epoch": 1.72, "step": 98 }, { "loss": 0.0181, "learning_rate": 0.0002, "epoch": 1.74, "step": 99 }, { "loss": 0.0008, "learning_rate": 0.0002, "epoch": 1.75, "step": 100 }, { "eval_comma_separated_input_loss": 0.378570020198822, "eval_comma_separated_input_score": -0.10282441228628159, "eval_comma_separated_input_brier_score": 0.10282441228628159, "eval_comma_separated_input_average_probability": 0.8461194038391113, "eval_comma_separated_input_accuracy": 0.86, "eval_comma_separated_input_probabilities": [ 0.7394901514053345, 0.9556662440299988, 0.9631574153900146, 0.9448689818382263, 0.6851402521133423, 0.04673205316066742, 0.9999997615814209, 0.9999988079071045, 0.9999755620956421, 1.0, 1.0, 1.0, 0.8175366520881653, 0.5344929695129395, 0.40490445494651794, 0.9999028444290161, 0.9999998807907104, 0.9999815225601196, 0.9996824264526367, 0.9999032020568848, 0.9999306201934814, 0.9223772883415222, 0.9986610412597656, 0.9338085055351257, 1.0, 1.0, 0.9999598264694214, 0.9999997615814209, 1.0, 1.0, 0.9999829530715942, 0.9999233484268188, 0.9999957084655762, 1.0, 1.0, 1.0, 0.16704992949962616, 0.4352927505970001, 0.9530060291290283, 0.9999997615814209, 0.9648281931877136, 0.9776931405067444, 0.9999842643737793, 0.9146194458007812, 0.7172320485115051, 1.0, 0.9999998807907104, 0.9997580647468567, 1.0, 0.9999997615814209, 0.9999998807907104, 0.9999994039535522, 0.9999991655349731, 0.9998703002929688, 1.0, 1.0, 1.0, 0.43808406591415405, 0.5185633301734924, 0.47918856143951416, 1.0, 1.0, 1.0, 0.12787644565105438, 0.8206732273101807, 0.6153414845466614, 0.9999388456344604, 0.9996930360794067, 0.9999504089355469, 
0.9787357449531555, 0.20235727727413177, 0.06822255253791809, 0.8611693978309631, 0.46712806820869446, 0.9312974810600281, 1.0, 0.9999998807907104, 0.9988490343093872, 0.7939100861549377, 0.995577335357666, 0.995972216129303, 0.830564022064209, 0.9511353969573975, 0.9778002500534058, 0.9999828338623047, 0.9291109442710876, 0.9999287128448486, 0.007030226290225983, 0.002356813522055745, 0.04530631750822067, 0.569308340549469, 0.7886270880699158, 0.15891966223716736, 0.9987874627113342, 0.9973487854003906, 0.9999998807907104, 0.9999572038650513, 0.9878588318824768, 0.999981164932251, 1.0 ], "eval_comma_separated_input_runtime": 78.0074, "eval_comma_separated_input_samples_per_second": 1.282, "eval_comma_separated_input_steps_per_second": 0.051, "epoch": 1.75, "step": 100 }, { "train_runtime": 5582.1468, "train_samples_per_second": 0.573, "train_steps_per_second": 0.018, "total_flos": 0.0, "train_loss": 0.22866786144091747, "epoch": 1.75, "step": 100 } ]