Instructions to use genies-models/llama-30b-comma_separated_input with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- PEFT
How to use genies-models/llama-30b-comma_separated_input with PEFT:
from peft import PeftModel
from transformers import AutoModelForSequenceClassification

base_model = AutoModelForSequenceClassification.from_pretrained("models/llama-30b")
model = PeftModel.from_pretrained(base_model, "genies-models/llama-30b-comma_separated_input")
- Notebooks
- Google Colab
- Kaggle
Invalid JSON:Unexpected token ':', ..."accuracy"::0.77,
"... is not valid JSON
| [ | |
| { | |
| "loss": 0.7419, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.02, | |
| "step": 1 | |
| }, | |
| { | |
| "loss": 0.7104, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.04, | |
| "step": 2 | |
| }, | |
| { | |
| "loss": 0.6951, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.05, | |
| "step": 3 | |
| }, | |
| { | |
| "loss": 0.6797, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.07, | |
| "step": 4 | |
| }, | |
| { | |
| "loss": 0.6777, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.09, | |
| "step": 5 | |
| }, | |
| { | |
| "loss": 0.6727, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.11, | |
| "step": 6 | |
| }, | |
| { | |
| "loss": 0.6902, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.12, | |
| "step": 7 | |
| }, | |
| { | |
| "loss": 0.644, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.14, | |
| "step": 8 | |
| }, | |
| { | |
| "loss": 0.6332, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.16, | |
| "step": 9 | |
| }, | |
| { | |
| "loss": 0.6259, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.18, | |
| "step": 10 | |
| }, | |
| { | |
| "loss": 0.5662, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.19, | |
| "step": 11 | |
| }, | |
| { | |
| "loss": 0.4973, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.21, | |
| "step": 12 | |
| }, | |
| { | |
| "loss": 0.4677, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.23, | |
| "step": 13 | |
| }, | |
| { | |
| "loss": 0.3896, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.25, | |
| "step": 14 | |
| }, | |
| { | |
| "loss": 0.5832, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.26, | |
| "step": 15 | |
| }, | |
| { | |
| "loss": 0.2747, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.28, | |
| "step": 16 | |
| }, | |
| { | |
| "loss": 0.3438, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.3, | |
| "step": 17 | |
| }, | |
| { | |
| "loss": 0.2304, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.32, | |
| "step": 18 | |
| }, | |
| { | |
| "loss": 0.2208, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.33, | |
| "step": 19 | |
| }, | |
| { | |
| "loss": 0.3179, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.35, | |
| "step": 20 | |
| }, | |
| { | |
| "loss": 0.3831, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.37, | |
| "step": 21 | |
| }, | |
| { | |
| "loss": 0.3274, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.39, | |
| "step": 22 | |
| }, | |
| { | |
| "loss": 0.3322, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.4, | |
| "step": 23 | |
| }, | |
| { | |
| "loss": 0.1843, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.42, | |
| "step": 24 | |
| }, | |
| { | |
| "loss": 0.3792, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.44, | |
| "step": 25 | |
| }, | |
| { | |
| "eval_comma_separated_input_loss": 0.47381076216697693, | |
| "eval_comma_separated_input_score": -0.14903230965137482, | |
| "eval_comma_separated_input_brier_score": 0.14903230965137482, | |
| "eval_comma_separated_input_average_probability": 0.739839494228363, | |
| "eval_comma_separated_input_accuracy": 0.76, | |
| "eval_comma_separated_input_probabilities": [ | |
| 0.5057103037834167, | |
| 0.7926411032676697, | |
| 0.8395572304725647, | |
| 0.8750540614128113, | |
| 0.6638176441192627, | |
| 0.3412554860115051, | |
| 0.8521225452423096, | |
| 0.7427878975868225, | |
| 0.48845282196998596, | |
| 0.9979581832885742, | |
| 0.9965298771858215, | |
| 0.9844328165054321, | |
| 0.4072255790233612, | |
| 0.4754917323589325, | |
| 0.2266879379749298, | |
| 0.9544909000396729, | |
| 0.9932397603988647, | |
| 0.9822323322296143, | |
| 0.9549546241760254, | |
| 0.9956372380256653, | |
| 0.8111849427223206, | |
| 0.6678183674812317, | |
| 0.9605175256729126, | |
| 0.6721541285514832, | |
| 0.9995113611221313, | |
| 0.9995362758636475, | |
| 0.9969425797462463, | |
| 0.7482375502586365, | |
| 0.978789746761322, | |
| 0.9411532282829285, | |
| 0.8092716336250305, | |
| 0.5804548263549805, | |
| 0.8987478613853455, | |
| 0.9926584362983704, | |
| 0.9968037605285645, | |
| 0.9899746775627136, | |
| 0.5884284973144531, | |
| 0.6909584999084473, | |
| 0.7130376100540161, | |
| 0.984264612197876, | |
| 0.8204785585403442, | |
| 0.6899394392967224, | |
| 0.7373196482658386, | |
| 0.5578603148460388, | |
| 0.4814424216747284, | |
| 0.9995312690734863, | |
| 0.9998726844787598, | |
| 0.9916493892669678, | |
| 0.9987574815750122, | |
| 0.8930770754814148, | |
| 0.9631037712097168, | |
| 0.9723063707351685, | |
| 0.867325484752655, | |
| 0.8623606562614441, | |
| 0.9999880790710449, | |
| 0.9999451637268066, | |
| 0.999957799911499, | |
| 0.3165142834186554, | |
| 0.5785897970199585, | |
| 0.4601801335811615, | |
| 0.9999808073043823, | |
| 0.9999685287475586, | |
| 0.9999656677246094, | |
| 0.3123607933521271, | |
| 0.3744247555732727, | |
| 0.27252867817878723, | |
| 0.9987949132919312, | |
| 0.9992828965187073, | |
| 0.9993246793746948, | |
| 0.5784086585044861, | |
| 0.15536504983901978, | |
| 0.23488140106201172, | |
| 0.14060163497924805, | |
| 0.11246518045663834, | |
| 0.3872424066066742, | |
| 0.9960883855819702, | |
| 0.9901509284973145, | |
| 0.9042060375213623, | |
| 0.010595398023724556, | |
| 0.019154399633407593, | |
| 0.10093849897384644, | |
| 0.6121878623962402, | |
| 0.4093835949897766, | |
| 0.6347980499267578, | |
| 0.992620050907135, | |
| 0.7581243515014648, | |
| 0.9930395483970642, | |
| 0.374697744846344, | |
| 0.3880426585674286, | |
| 0.37667402625083923, | |
| 0.751455545425415, | |
| 0.6910660862922668, | |
| 0.4043519198894501, | |
| 0.9727478623390198, | |
| 0.9151681661605835, | |
| 0.9926292896270752, | |
| 0.9967435598373413, | |
| 0.8987772464752197, | |
| 0.9539257884025574, | |
| 0.9998562335968018 | |
| ], | |
| "eval_comma_separated_input_runtime": 78.0564, | |
| "eval_comma_separated_input_samples_per_second": 1.281, | |
| "eval_comma_separated_input_steps_per_second": 0.051, | |
| "epoch": 0.44, | |
| "step": 25 | |
| }, | |
| { | |
| "loss": 0.326, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.46, | |
| "step": 26 | |
| }, | |
| { | |
| "loss": 0.5505, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.47, | |
| "step": 27 | |
| }, | |
| { | |
| "loss": 0.254, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.49, | |
| "step": 28 | |
| }, | |
| { | |
| "loss": 0.3024, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.51, | |
| "step": 29 | |
| }, | |
| { | |
| "loss": 0.1145, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.53, | |
| "step": 30 | |
| }, | |
| { | |
| "loss": 0.2487, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.54, | |
| "step": 31 | |
| }, | |
| { | |
| "loss": 0.2536, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.56, | |
| "step": 32 | |
| }, | |
| { | |
| "loss": 0.2752, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.58, | |
| "step": 33 | |
| }, | |
| { | |
| "loss": 0.2864, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.6, | |
| "step": 34 | |
| }, | |
| { | |
| "loss": 0.308, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.61, | |
| "step": 35 | |
| }, | |
| { | |
| "loss": 0.2412, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.63, | |
| "step": 36 | |
| }, | |
| { | |
| "loss": 0.4188, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.65, | |
| "step": 37 | |
| }, | |
| { | |
| "loss": 0.3539, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.67, | |
| "step": 38 | |
| }, | |
| { | |
| "loss": 0.4126, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.68, | |
| "step": 39 | |
| }, | |
| { | |
| "loss": 0.2298, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.7, | |
| "step": 40 | |
| }, | |
| { | |
| "loss": 0.1837, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.72, | |
| "step": 41 | |
| }, | |
| { | |
| "loss": 0.2238, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.74, | |
| "step": 42 | |
| }, | |
| { | |
| "loss": 0.3062, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.75, | |
| "step": 43 | |
| }, | |
| { | |
| "loss": 0.3335, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.77, | |
| "step": 44 | |
| }, | |
| { | |
| "loss": 0.128, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.79, | |
| "step": 45 | |
| }, | |
| { | |
| "loss": 0.2156, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.81, | |
| "step": 46 | |
| }, | |
| { | |
| "loss": 0.1373, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.82, | |
| "step": 47 | |
| }, | |
| { | |
| "loss": 0.2333, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.84, | |
| "step": 48 | |
| }, | |
| { | |
| "loss": 0.3292, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.86, | |
| "step": 49 | |
| }, | |
| { | |
| "loss": 0.3278, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.88, | |
| "step": 50 | |
| }, | |
| { | |
| "eval_comma_separated_input_loss": 0.447895348072052, | |
| "eval_comma_separated_input_score": -0.14565807580947876, | |
| "eval_comma_separated_input_brier_score": 0.14565807580947876, | |
| "eval_comma_separated_input_average_probability": 0.7761557102203369, | |
| "eval_comma_separated_input_accuracy": 0.77, | |
| "eval_comma_separated_input_probabilities": [ | |
| 0.4504460096359253, | |
| 0.7106965780258179, | |
| 0.7613977193832397, | |
| 0.27627503871917725, | |
| 0.1888580322265625, | |
| 0.36196234822273254, | |
| 0.9977447986602783, | |
| 0.9934731125831604, | |
| 0.9807383418083191, | |
| 0.9999233484268188, | |
| 0.9998125433921814, | |
| 0.9992616772651672, | |
| 0.42937251925468445, | |
| 0.35414958000183105, | |
| 0.3341814875602722, | |
| 0.9967638254165649, | |
| 0.9999350309371948, | |
| 0.9995962977409363, | |
| 0.9546691179275513, | |
| 0.9990658164024353, | |
| 0.99967360496521, | |
| 0.9045127034187317, | |
| 0.9956008195877075, | |
| 0.9143818020820618, | |
| 0.999998927116394, | |
| 0.9999983310699463, | |
| 0.999935507774353, | |
| 0.9908632636070251, | |
| 0.9999735355377197, | |
| 0.9989373087882996, | |
| 0.9830892086029053, | |
| 0.8966995477676392, | |
| 0.9865294694900513, | |
| 0.9999994039535522, | |
| 0.9999998807907104, | |
| 0.9999971389770508, | |
| 0.49074265360832214, | |
| 0.5514218211174011, | |
| 0.830772876739502, | |
| 0.9999492168426514, | |
| 0.8612533807754517, | |
| 0.9519673585891724, | |
| 0.9873406291007996, | |
| 0.8993487358093262, | |
| 0.8438679575920105, | |
| 0.9999995231628418, | |
| 0.9999996423721313, | |
| 0.9998364448547363, | |
| 0.999634861946106, | |
| 0.9831734299659729, | |
| 0.9952573180198669, | |
| 0.9982624650001526, | |
| 0.9984625577926636, | |
| 0.9621893167495728, | |
| 0.9999992847442627, | |
| 0.9999982118606567, | |
| 0.9999990463256836, | |
| 0.17832396924495697, | |
| 0.6987086534500122, | |
| 0.43089836835861206, | |
| 0.9999967813491821, | |
| 0.9999840259552002, | |
| 0.9999971389770508, | |
| 0.34186333417892456, | |
| 0.6733885407447815, | |
| 0.4354130029678345, | |
| 0.9825000762939453, | |
| 0.9815826416015625, | |
| 0.9878876209259033, | |
| 0.6807180047035217, | |
| 0.09687728434801102, | |
| 0.16909901797771454, | |
| 0.5602892637252808, | |
| 0.5863568186759949, | |
| 0.608674943447113, | |
| 0.9987614154815674, | |
| 0.997982382774353, | |
| 0.972231388092041, | |
| 0.02466653659939766, | |
| 0.0528080128133297, | |
| 0.2097661793231964, | |
| 0.9776371717453003, | |
| 0.5767873525619507, | |
| 0.9074500203132629, | |
| 0.9864820241928101, | |
| 0.5367009043693542, | |
| 0.9760178327560425, | |
| 0.06482303142547607, | |
| 0.1236090213060379, | |
| 0.1919964700937271, | |
| 0.3480866849422455, | |
| 0.38676121830940247, | |
| 0.15342266857624054, | |
| 0.9814541935920715, | |
| 0.9267071485519409, | |
| 0.9979047775268555, | |
| 0.9999786615371704, | |
| 0.9992477893829346, | |
| 0.9997554421424866, | |
| 0.9999927282333374 | |
| ], | |
| "eval_comma_separated_input_runtime": 78.026, | |
| "eval_comma_separated_input_samples_per_second": 1.282, | |
| "eval_comma_separated_input_steps_per_second": 0.051, | |
| "epoch": 0.88, | |
| "step": 50 | |
| }, | |
| { | |
| "loss": 0.1712, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.89, | |
| "step": 51 | |
| }, | |
| { | |
| "loss": 0.1149, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.91, | |
| "step": 52 | |
| }, | |
| { | |
| "loss": 0.1877, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.93, | |
| "step": 53 | |
| }, | |
| { | |
| "loss": 0.0817, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.95, | |
| "step": 54 | |
| }, | |
| { | |
| "loss": 0.0424, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.96, | |
| "step": 55 | |
| }, | |
| { | |
| "loss": 0.2838, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.98, | |
| "step": 56 | |
| }, | |
| { | |
| "loss": 0.1558, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.0, | |
| "step": 57 | |
| }, | |
| { | |
| "loss": 0.0269, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.02, | |
| "step": 58 | |
| }, | |
| { | |
| "loss": 0.0916, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.04, | |
| "step": 59 | |
| }, | |
| { | |
| "loss": 0.0162, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.05, | |
| "step": 60 | |
| }, | |
| { | |
| "loss": 0.0182, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.07, | |
| "step": 61 | |
| }, | |
| { | |
| "loss": 0.0505, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.09, | |
| "step": 62 | |
| }, | |
| { | |
| "loss": 0.1672, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.11, | |
| "step": 63 | |
| }, | |
| { | |
| "loss": 0.0078, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.12, | |
| "step": 64 | |
| }, | |
| { | |
| "loss": 0.0239, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.14, | |
| "step": 65 | |
| }, | |
| { | |
| "loss": 0.0042, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.16, | |
| "step": 66 | |
| }, | |
| { | |
| "loss": 0.1157, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.18, | |
| "step": 67 | |
| }, | |
| { | |
| "loss": 0.0367, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.19, | |
| "step": 68 | |
| }, | |
| { | |
| "loss": 0.0054, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.21, | |
| "step": 69 | |
| }, | |
| { | |
| "loss": 0.3269, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.23, | |
| "step": 70 | |
| }, | |
| { | |
| "loss": 0.0053, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.25, | |
| "step": 71 | |
| }, | |
| { | |
| "loss": 0.0093, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.26, | |
| "step": 72 | |
| }, | |
| { | |
| "loss": 0.06, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.28, | |
| "step": 73 | |
| }, | |
| { | |
| "loss": 0.0214, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.3, | |
| "step": 74 | |
| }, | |
| { | |
| "loss": 0.064, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.32, | |
| "step": 75 | |
| }, | |
| { | |
| "eval_comma_separated_input_loss": 0.6194826364517212, | |
| "eval_comma_separated_input_score": -0.17542152106761932, | |
| "eval_comma_separated_input_brier_score": 0.17542152106761932, | |
| "eval_comma_separated_input_average_probability": 0.7849389910697937, | |
| "eval_comma_separated_input_accuracy": 0.77, | |
| "eval_comma_separated_input_probabilities": [ | |
| 0.3327490985393524, | |
| 0.9519062042236328, | |
| 0.9847831130027771, | |
| 0.5636963844299316, | |
| 0.031850676983594894, | |
| 0.05631185695528984, | |
| 0.9998056292533875, | |
| 0.9995859265327454, | |
| 0.990744411945343, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9468281865119934, | |
| 0.8348178863525391, | |
| 0.23293766379356384, | |
| 0.9999988079071045, | |
| 1.0, | |
| 1.0, | |
| 0.9999995231628418, | |
| 1.0, | |
| 1.0, | |
| 0.9823529124259949, | |
| 0.9999111890792847, | |
| 0.9437704086303711, | |
| 1.0, | |
| 1.0, | |
| 0.9999995231628418, | |
| 0.9999985694885254, | |
| 1.0, | |
| 0.9999997615814209, | |
| 0.9999955892562866, | |
| 0.9999785423278809, | |
| 0.9999979734420776, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.15389743447303772, | |
| 0.8275808095932007, | |
| 0.9833057522773743, | |
| 1.0, | |
| 0.9276348948478699, | |
| 0.9925111532211304, | |
| 0.9999544620513916, | |
| 0.9182303547859192, | |
| 0.5098273158073425, | |
| 1.0, | |
| 1.0, | |
| 0.9999983310699463, | |
| 1.0, | |
| 0.9999970197677612, | |
| 0.9999997615814209, | |
| 0.9999984502792358, | |
| 0.9999997615814209, | |
| 0.9999309778213501, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.1305040717124939, | |
| 0.9028104543685913, | |
| 0.21933555603027344, | |
| 0.9999996423721313, | |
| 0.9999996423721313, | |
| 0.9999997615814209, | |
| 0.059167250990867615, | |
| 0.2488248497247696, | |
| 0.06632068753242493, | |
| 0.9999988079071045, | |
| 0.9999992847442627, | |
| 0.9999998807907104, | |
| 0.9473620057106018, | |
| 0.26638561487197876, | |
| 0.07780053466558456, | |
| 0.11167240887880325, | |
| 0.0027452881913632154, | |
| 0.3228246569633484, | |
| 0.9999821186065674, | |
| 0.999972939491272, | |
| 0.9944614171981812, | |
| 0.03967156261205673, | |
| 0.20487765967845917, | |
| 0.9539350271224976, | |
| 0.9898837208747864, | |
| 0.9399700164794922, | |
| 0.9973479509353638, | |
| 0.9999980926513672, | |
| 0.9816005229949951, | |
| 0.9999972581863403, | |
| 0.011794282123446465, | |
| 0.002413914306089282, | |
| 0.05205608159303665, | |
| 0.3445022404193878, | |
| 0.4484536349773407, | |
| 0.01951614022254944, | |
| 0.9997747540473938, | |
| 0.9940212368965149, | |
| 0.9999996423721313, | |
| 0.9999850988388062, | |
| 0.9991033673286438, | |
| 0.9999384880065918, | |
| 1.0 | |
| ], | |
| "eval_comma_separated_input_runtime": 78.0706, | |
| "eval_comma_separated_input_samples_per_second": 1.281, | |
| "eval_comma_separated_input_steps_per_second": 0.051, | |
| "epoch": 1.32, | |
| "step": 75 | |
| }, | |
| { | |
| "loss": 0.1843, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.33, | |
| "step": 76 | |
| }, | |
| { | |
| "loss": 0.0102, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.35, | |
| "step": 77 | |
| }, | |
| { | |
| "loss": 0.0016, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.37, | |
| "step": 78 | |
| }, | |
| { | |
| "loss": 0.0847, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.39, | |
| "step": 79 | |
| }, | |
| { | |
| "loss": 0.1682, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.4, | |
| "step": 80 | |
| }, | |
| { | |
| "loss": 0.0202, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.42, | |
| "step": 81 | |
| }, | |
| { | |
| "loss": 0.0717, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.44, | |
| "step": 82 | |
| }, | |
| { | |
| "loss": 0.1845, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.46, | |
| "step": 83 | |
| }, | |
| { | |
| "loss": 0.0604, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.47, | |
| "step": 84 | |
| }, | |
| { | |
| "loss": 0.04, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.49, | |
| "step": 85 | |
| }, | |
| { | |
| "loss": 0.1294, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.51, | |
| "step": 86 | |
| }, | |
| { | |
| "loss": 0.0017, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.53, | |
| "step": 87 | |
| }, | |
| { | |
| "loss": 0.0122, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.54, | |
| "step": 88 | |
| }, | |
| { | |
| "loss": 0.1278, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.56, | |
| "step": 89 | |
| }, | |
| { | |
| "loss": 0.0566, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.58, | |
| "step": 90 | |
| }, | |
| { | |
| "loss": 0.0099, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.6, | |
| "step": 91 | |
| }, | |
| { | |
| "loss": 0.0064, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.61, | |
| "step": 92 | |
| }, | |
| { | |
| "loss": 0.0243, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.63, | |
| "step": 93 | |
| }, | |
| { | |
| "loss": 0.0525, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.65, | |
| "step": 94 | |
| }, | |
| { | |
| "loss": 0.0424, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.67, | |
| "step": 95 | |
| }, | |
| { | |
| "loss": 0.0613, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.68, | |
| "step": 96 | |
| }, | |
| { | |
| "loss": 0.0521, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.7, | |
| "step": 97 | |
| }, | |
| { | |
| "loss": 0.0944, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.72, | |
| "step": 98 | |
| }, | |
| { | |
| "loss": 0.0181, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.74, | |
| "step": 99 | |
| }, | |
| { | |
| "loss": 0.0008, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.75, | |
| "step": 100 | |
| }, | |
| { | |
| "eval_comma_separated_input_loss": 0.378570020198822, | |
| "eval_comma_separated_input_score": -0.10282441228628159, | |
| "eval_comma_separated_input_brier_score": 0.10282441228628159, | |
| "eval_comma_separated_input_average_probability": 0.8461194038391113, | |
| "eval_comma_separated_input_accuracy": 0.86, | |
| "eval_comma_separated_input_probabilities": [ | |
| 0.7394901514053345, | |
| 0.9556662440299988, | |
| 0.9631574153900146, | |
| 0.9448689818382263, | |
| 0.6851402521133423, | |
| 0.04673205316066742, | |
| 0.9999997615814209, | |
| 0.9999988079071045, | |
| 0.9999755620956421, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.8175366520881653, | |
| 0.5344929695129395, | |
| 0.40490445494651794, | |
| 0.9999028444290161, | |
| 0.9999998807907104, | |
| 0.9999815225601196, | |
| 0.9996824264526367, | |
| 0.9999032020568848, | |
| 0.9999306201934814, | |
| 0.9223772883415222, | |
| 0.9986610412597656, | |
| 0.9338085055351257, | |
| 1.0, | |
| 1.0, | |
| 0.9999598264694214, | |
| 0.9999997615814209, | |
| 1.0, | |
| 1.0, | |
| 0.9999829530715942, | |
| 0.9999233484268188, | |
| 0.9999957084655762, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.16704992949962616, | |
| 0.4352927505970001, | |
| 0.9530060291290283, | |
| 0.9999997615814209, | |
| 0.9648281931877136, | |
| 0.9776931405067444, | |
| 0.9999842643737793, | |
| 0.9146194458007812, | |
| 0.7172320485115051, | |
| 1.0, | |
| 0.9999998807907104, | |
| 0.9997580647468567, | |
| 1.0, | |
| 0.9999997615814209, | |
| 0.9999998807907104, | |
| 0.9999994039535522, | |
| 0.9999991655349731, | |
| 0.9998703002929688, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.43808406591415405, | |
| 0.5185633301734924, | |
| 0.47918856143951416, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.12787644565105438, | |
| 0.8206732273101807, | |
| 0.6153414845466614, | |
| 0.9999388456344604, | |
| 0.9996930360794067, | |
| 0.9999504089355469, | |
| 0.9787357449531555, | |
| 0.20235727727413177, | |
| 0.06822255253791809, | |
| 0.8611693978309631, | |
| 0.46712806820869446, | |
| 0.9312974810600281, | |
| 1.0, | |
| 0.9999998807907104, | |
| 0.9988490343093872, | |
| 0.7939100861549377, | |
| 0.995577335357666, | |
| 0.995972216129303, | |
| 0.830564022064209, | |
| 0.9511353969573975, | |
| 0.9778002500534058, | |
| 0.9999828338623047, | |
| 0.9291109442710876, | |
| 0.9999287128448486, | |
| 0.007030226290225983, | |
| 0.002356813522055745, | |
| 0.04530631750822067, | |
| 0.569308340549469, | |
| 0.7886270880699158, | |
| 0.15891966223716736, | |
| 0.9987874627113342, | |
| 0.9973487854003906, | |
| 0.9999998807907104, | |
| 0.9999572038650513, | |
| 0.9878588318824768, | |
| 0.999981164932251, | |
| 1.0 | |
| ], | |
| "eval_comma_separated_input_runtime": 78.0074, | |
| "eval_comma_separated_input_samples_per_second": 1.282, | |
| "eval_comma_separated_input_steps_per_second": 0.051, | |
| "epoch": 1.75, | |
| "step": 100 | |
| }, | |
| { | |
| "train_runtime": 5582.1468, | |
| "train_samples_per_second": 0.573, | |
| "train_steps_per_second": 0.018, | |
| "total_flos": 0.0, | |
| "train_loss": 0.22866786144091747, | |
| "epoch": 1.75, | |
| "step": 100 | |
| } | |
| ] |