Instructions to use genies-models/llama-30b-code_low_quality with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- PEFT
How to use genies-models/llama-30b-code_low_quality with PEFT:
```python
from peft import PeftModel
from transformers import AutoModelForSequenceClassification

base_model = AutoModelForSequenceClassification.from_pretrained("models/llama-30b")
model = PeftModel.from_pretrained(base_model, "genies-models/llama-30b-code_low_quality")
```
- Notebooks
- Google Colab
- Kaggle
| [ | |
| { | |
| "loss": 0.7435, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.03, | |
| "step": 1 | |
| }, | |
| { | |
| "loss": 0.5463, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.05, | |
| "step": 2 | |
| }, | |
| { | |
| "loss": 0.4573, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.08, | |
| "step": 3 | |
| }, | |
| { | |
| "loss": 0.3088, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.11, | |
| "step": 4 | |
| }, | |
| { | |
| "loss": 0.2566, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.13, | |
| "step": 5 | |
| }, | |
| { | |
| "loss": 0.235, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.16, | |
| "step": 6 | |
| }, | |
| { | |
| "loss": 0.113, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.18, | |
| "step": 7 | |
| }, | |
| { | |
| "loss": 0.1435, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.21, | |
| "step": 8 | |
| }, | |
| { | |
| "loss": 0.1263, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.24, | |
| "step": 9 | |
| }, | |
| { | |
| "loss": 0.0532, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.26, | |
| "step": 10 | |
| }, | |
| { | |
| "loss": 0.0326, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.29, | |
| "step": 11 | |
| }, | |
| { | |
| "loss": 0.0732, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.32, | |
| "step": 12 | |
| }, | |
| { | |
| "loss": 0.0714, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.34, | |
| "step": 13 | |
| }, | |
| { | |
| "loss": 0.01, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.37, | |
| "step": 14 | |
| }, | |
| { | |
| "loss": 0.4883, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.39, | |
| "step": 15 | |
| }, | |
| { | |
| "loss": 0.0547, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.42, | |
| "step": 16 | |
| }, | |
| { | |
| "loss": 0.0418, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.45, | |
| "step": 17 | |
| }, | |
| { | |
| "loss": 0.0242, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.47, | |
| "step": 18 | |
| }, | |
| { | |
| "loss": 0.1662, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.5, | |
| "step": 19 | |
| }, | |
| { | |
| "loss": 0.0201, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.53, | |
| "step": 20 | |
| }, | |
| { | |
| "loss": 0.0896, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.55, | |
| "step": 21 | |
| }, | |
| { | |
| "loss": 0.0298, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.58, | |
| "step": 22 | |
| }, | |
| { | |
| "loss": 0.0283, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.61, | |
| "step": 23 | |
| }, | |
| { | |
| "loss": 0.0214, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.63, | |
| "step": 24 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.66, | |
| "step": 25 | |
| }, | |
| { | |
| "eval_code_low_quality_loss": 0.0006595517043024302, | |
| "eval_code_low_quality_score": -1.1128052392450627e-05, | |
| "eval_code_low_quality_brier_score": 1.1128052392450627e-05, | |
| "eval_code_low_quality_average_probability": 0.9993544220924377, | |
| "eval_code_low_quality_accuracy": 1.0, | |
| "eval_code_low_quality_probabilities": [ | |
| 1.0, | |
| 1.0, | |
| 0.9999339580535889, | |
| 0.9999250173568726, | |
| 0.9999997615814209, | |
| 1.0, | |
| 1.0, | |
| 0.9999995231628418, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 0.9999914169311523, | |
| 1.0, | |
| 0.9999998807907104, | |
| 0.9999998807907104, | |
| 0.9999932050704956, | |
| 0.9999402761459351, | |
| 0.9999994039535522, | |
| 0.9999994039535522, | |
| 0.9999964237213135, | |
| 0.9999980926513672, | |
| 0.9999585151672363, | |
| 0.9999517202377319, | |
| 0.9974417686462402, | |
| 0.9972801208496094, | |
| 0.9999949932098389, | |
| 0.9999983310699463, | |
| 1.0, | |
| 1.0, | |
| 0.9707977771759033, | |
| 0.9999984502792358, | |
| 0.9999997615814209, | |
| 0.9999998807907104, | |
| 0.9999961853027344, | |
| 0.9999938011169434, | |
| 0.9999990463256836, | |
| 0.9999834299087524, | |
| 0.9982851147651672, | |
| 0.9977701902389526, | |
| 0.9946922659873962, | |
| 0.9993091821670532, | |
| 0.9999990463256836, | |
| 0.9999549388885498, | |
| 0.9999979734420776, | |
| 1.0, | |
| 0.9999107122421265, | |
| 0.9998675584793091, | |
| 0.999998927116394, | |
| 0.9999998807907104, | |
| 0.9999997615814209, | |
| 1.0, | |
| 0.9999986886978149, | |
| 0.9999995231628418, | |
| 0.9999984502792358, | |
| 0.999998927116394, | |
| 1.0, | |
| 1.0, | |
| 0.9999972581863403, | |
| 0.9999957084655762, | |
| 0.9999988079071045, | |
| 0.9999986886978149, | |
| 0.9999998807907104, | |
| 0.9999723434448242, | |
| 0.9999982118606567, | |
| 0.9999983310699463, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999990463256836, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999997615814209, | |
| 0.9999998807907104, | |
| 0.9999725818634033, | |
| 0.9999992847442627, | |
| 0.9999661445617676, | |
| 0.999969482421875, | |
| 0.9999997615814209, | |
| 0.9999995231628418, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9960858821868896, | |
| 0.9996801614761353, | |
| 0.9999926090240479, | |
| 0.9999170303344727, | |
| 0.9999935626983643, | |
| 0.9999808073043823, | |
| 0.9999854564666748, | |
| 0.9861019849777222, | |
| 0.9998243451118469, | |
| 0.9990695118904114, | |
| 0.9999963045120239, | |
| 0.9999998807907104, | |
| 0.9999969005584717, | |
| 1.0 | |
| ], | |
| "eval_code_low_quality_runtime": 141.0153, | |
| "eval_code_low_quality_samples_per_second": 0.709, | |
| "eval_code_low_quality_steps_per_second": 0.028, | |
| "epoch": 0.66, | |
| "step": 25 | |
| }, | |
| { | |
| "eval_code_loss": 0.5833292603492737, | |
| "eval_code_score": -0.1804097294807434, | |
| "eval_code_brier_score": 0.1804097294807434, | |
| "eval_code_average_probability": 0.6770716309547424, | |
| "eval_code_accuracy": 0.76, | |
| "eval_code_probabilities": [ | |
| 0.10096369683742523, | |
| 0.21281138062477112, | |
| 0.2073233723640442, | |
| 0.9848010540008545, | |
| 0.9974289536476135, | |
| 0.7294337749481201, | |
| 0.6149591207504272, | |
| 0.10706400871276855, | |
| 0.5733828544616699, | |
| 0.6794034242630005, | |
| 0.9404621124267578, | |
| 0.8340038061141968, | |
| 0.8182052969932556, | |
| 0.9913336634635925, | |
| 0.8865165710449219, | |
| 0.473355770111084, | |
| 0.44256484508514404, | |
| 0.44847366213798523, | |
| 0.9831279516220093, | |
| 0.9921797513961792, | |
| 0.9801183938980103, | |
| 0.5592747330665588, | |
| 0.836647093296051, | |
| 0.8669078946113586, | |
| 0.017949247732758522, | |
| 0.02475733682513237, | |
| 0.025172699242830276, | |
| 0.9788206815719604, | |
| 0.9780603051185608, | |
| 0.9747424125671387, | |
| 0.4794495105743408, | |
| 0.978365421295166, | |
| 0.7862324714660645, | |
| 0.19819535315036774, | |
| 0.08767852187156677, | |
| 0.06654077768325806, | |
| 0.8256481885910034, | |
| 0.9054414629936218, | |
| 0.698613166809082, | |
| 0.9710825085639954, | |
| 0.9051369428634644, | |
| 0.9175053238868713, | |
| 0.5884507298469543, | |
| 0.6432308554649353, | |
| 0.5494475960731506, | |
| 0.6364181041717529, | |
| 0.985031008720398, | |
| 0.934455394744873, | |
| 0.5507091879844666, | |
| 0.41536206007003784, | |
| 0.9477699995040894, | |
| 0.9997536540031433, | |
| 0.9998169541358948, | |
| 0.9843502044677734, | |
| 0.5441336631774902, | |
| 0.5056722164154053, | |
| 0.45167604088783264, | |
| 0.4324477016925812, | |
| 0.46727290749549866, | |
| 0.4145377576351166, | |
| 0.7619684934616089, | |
| 0.5765150785446167, | |
| 0.6369282007217407, | |
| 0.8258550763130188, | |
| 0.5172879695892334, | |
| 0.4960772395133972, | |
| 0.9996997117996216, | |
| 0.7111136317253113, | |
| 0.681095540523529, | |
| 0.7522112727165222, | |
| 0.7496448755264282, | |
| 0.7440780997276306, | |
| 0.5330413579940796, | |
| 0.5731443166732788, | |
| 0.5385348796844482, | |
| 0.9997851252555847, | |
| 0.9988688826560974, | |
| 0.9994134902954102, | |
| 0.991698145866394, | |
| 0.7425008416175842, | |
| 0.7211678624153137, | |
| 0.9967381358146667, | |
| 0.5310153365135193, | |
| 0.997730553150177, | |
| 0.7988360524177551, | |
| 0.7310686707496643, | |
| 0.9935532808303833, | |
| 0.9999699592590332, | |
| 0.9999909400939941, | |
| 0.9834601283073425, | |
| 0.5250475406646729, | |
| 0.5600137114524841, | |
| 0.5266534090042114, | |
| 0.48367124795913696, | |
| 0.5329293608665466, | |
| 0.5332629084587097, | |
| 0.6026731729507446, | |
| 0.34615248441696167, | |
| 0.3938570022583008, | |
| 0.4892289638519287 | |
| ], | |
| "eval_code_runtime": 134.9932, | |
| "eval_code_samples_per_second": 0.741, | |
| "eval_code_steps_per_second": 0.03, | |
| "epoch": 0.66, | |
| "step": 25 | |
| }, | |
| { | |
| "loss": 0.0016, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.68, | |
| "step": 26 | |
| }, | |
| { | |
| "loss": 0.0076, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.71, | |
| "step": 27 | |
| }, | |
| { | |
| "loss": 0.0014, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.74, | |
| "step": 28 | |
| }, | |
| { | |
| "loss": 0.0359, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.76, | |
| "step": 29 | |
| }, | |
| { | |
| "loss": 0.0008, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.79, | |
| "step": 30 | |
| }, | |
| { | |
| "loss": 0.0076, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.82, | |
| "step": 31 | |
| }, | |
| { | |
| "loss": 0.001, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.84, | |
| "step": 32 | |
| }, | |
| { | |
| "loss": 0.0458, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.87, | |
| "step": 33 | |
| }, | |
| { | |
| "loss": 0.0017, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.89, | |
| "step": 34 | |
| }, | |
| { | |
| "loss": 0.0328, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.92, | |
| "step": 35 | |
| }, | |
| { | |
| "loss": 0.0102, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.95, | |
| "step": 36 | |
| }, | |
| { | |
| "loss": 0.0025, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.97, | |
| "step": 37 | |
| }, | |
| { | |
| "loss": 0.0124, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.0, | |
| "step": 38 | |
| }, | |
| { | |
| "loss": 0.0019, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.03, | |
| "step": 39 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.05, | |
| "step": 40 | |
| }, | |
| { | |
| "loss": 0.0003, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.08, | |
| "step": 41 | |
| }, | |
| { | |
| "loss": 0.0182, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.11, | |
| "step": 42 | |
| }, | |
| { | |
| "loss": 0.0033, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.13, | |
| "step": 43 | |
| }, | |
| { | |
| "loss": 0.0005, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.16, | |
| "step": 44 | |
| }, | |
| { | |
| "loss": 0.2313, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.18, | |
| "step": 45 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.21, | |
| "step": 46 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.24, | |
| "step": 47 | |
| }, | |
| { | |
| "loss": 0.0007, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.26, | |
| "step": 48 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.29, | |
| "step": 49 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.32, | |
| "step": 50 | |
| }, | |
| { | |
| "eval_code_low_quality_loss": 9.984543430618942e-05, | |
| "eval_code_low_quality_score": -4.904638899461133e-07, | |
| "eval_code_low_quality_brier_score": 4.904638899461133e-07, | |
| "eval_code_low_quality_average_probability": 0.9999052286148071, | |
| "eval_code_low_quality_accuracy": 1.0, | |
| "eval_code_low_quality_probabilities": [ | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999997615814209, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999996423721313, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999854564666748, | |
| 0.999990701675415, | |
| 0.9999991655349731, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 0.9997785687446594, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 0.9999037981033325, | |
| 0.999776303768158, | |
| 0.9996434450149536, | |
| 0.9999954700469971, | |
| 1.0, | |
| 1.0, | |
| 0.9931026697158813, | |
| 1.0, | |
| 0.9999970197677612, | |
| 0.9999984502792358, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.999966025352478, | |
| 0.9999886751174927, | |
| 0.9999871253967285, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999964237213135, | |
| 0.9999996423721313, | |
| 0.9999971389770508, | |
| 0.999998927116394, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999969005584717, | |
| 0.9999992847442627, | |
| 0.9999997615814209, | |
| 0.9999871253967285, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.999290943145752, | |
| 0.9999997615814209, | |
| 0.9999961853027344, | |
| 0.9999998807907104, | |
| 1.0, | |
| 0.9991438388824463, | |
| 0.9999996423721313 | |
| ], | |
| "eval_code_low_quality_runtime": 141.0508, | |
| "eval_code_low_quality_samples_per_second": 0.709, | |
| "eval_code_low_quality_steps_per_second": 0.028, | |
| "epoch": 1.32, | |
| "step": 50 | |
| }, | |
| { | |
| "eval_code_loss": 0.6208350658416748, | |
| "eval_code_score": -0.16615988314151764, | |
| "eval_code_brier_score": 0.16615988314151764, | |
| "eval_code_average_probability": 0.7172398567199707, | |
| "eval_code_accuracy": 0.78, | |
| "eval_code_probabilities": [ | |
| 0.00898885540664196, | |
| 0.011922608129680157, | |
| 0.06844734400510788, | |
| 1.0, | |
| 0.9941722750663757, | |
| 0.9803956151008606, | |
| 0.7216671705245972, | |
| 0.8719096779823303, | |
| 0.6083595752716064, | |
| 0.7415289282798767, | |
| 0.9492217898368835, | |
| 0.9170193672180176, | |
| 0.7766098380088806, | |
| 0.9932230710983276, | |
| 0.8845409750938416, | |
| 0.5273276567459106, | |
| 0.47327327728271484, | |
| 0.514703094959259, | |
| 0.8447608351707458, | |
| 0.9846923351287842, | |
| 0.8573033809661865, | |
| 0.6226664185523987, | |
| 0.9512245059013367, | |
| 0.9716692566871643, | |
| 0.015323023311793804, | |
| 0.01599641889333725, | |
| 0.012340807355940342, | |
| 0.9995960593223572, | |
| 0.9999792575836182, | |
| 0.9965634942054749, | |
| 0.44286829233169556, | |
| 0.9999172687530518, | |
| 0.6884943842887878, | |
| 0.6484965085983276, | |
| 0.09222234040498734, | |
| 0.08776669204235077, | |
| 0.9685974717140198, | |
| 0.9530619382858276, | |
| 0.7834113240242004, | |
| 0.9998219609260559, | |
| 0.9753877520561218, | |
| 0.9868707060813904, | |
| 0.8314498662948608, | |
| 0.9281793236732483, | |
| 0.8543185591697693, | |
| 0.8703754544258118, | |
| 0.9975754618644714, | |
| 0.9943013191223145, | |
| 0.6888080835342407, | |
| 0.631050169467926, | |
| 0.9991812109947205, | |
| 0.9999918937683105, | |
| 0.9999994039535522, | |
| 0.9998878240585327, | |
| 0.6626654863357544, | |
| 0.4978952705860138, | |
| 0.4795929491519928, | |
| 0.7897204160690308, | |
| 0.597411572933197, | |
| 0.758142352104187, | |
| 0.46403029561042786, | |
| 0.3406503200531006, | |
| 0.3812786936759949, | |
| 0.5821160674095154, | |
| 0.554485023021698, | |
| 0.5045574903488159, | |
| 0.9999997615814209, | |
| 0.3512322008609772, | |
| 0.3285271227359772, | |
| 0.7814154624938965, | |
| 0.7234558463096619, | |
| 0.8835054039955139, | |
| 0.5704320073127747, | |
| 0.7975870966911316, | |
| 0.7317837476730347, | |
| 0.9999594688415527, | |
| 0.9992265701293945, | |
| 0.9976761937141418, | |
| 0.998828113079071, | |
| 0.7545521855354309, | |
| 0.8591522574424744, | |
| 0.9943245053291321, | |
| 0.49560773372650146, | |
| 0.9899377822875977, | |
| 0.9942289590835571, | |
| 0.9932680726051331, | |
| 0.9997400641441345, | |
| 0.9999916553497314, | |
| 0.9999696016311646, | |
| 0.997422456741333, | |
| 0.6934857368469238, | |
| 0.7063461542129517, | |
| 0.6493465304374695, | |
| 0.48497462272644043, | |
| 0.48536550998687744, | |
| 0.584743857383728, | |
| 0.7083728313446045, | |
| 0.1657319813966751, | |
| 0.1531611829996109, | |
| 0.5006277561187744 | |
| ], | |
| "eval_code_runtime": 135.166, | |
| "eval_code_samples_per_second": 0.74, | |
| "eval_code_steps_per_second": 0.03, | |
| "epoch": 1.32, | |
| "step": 50 | |
| }, | |
| { | |
| "loss": 0.0007, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.34, | |
| "step": 51 | |
| }, | |
| { | |
| "loss": 0.0631, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.37, | |
| "step": 52 | |
| }, | |
| { | |
| "loss": 0.0133, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.39, | |
| "step": 53 | |
| }, | |
| { | |
| "loss": 0.0013, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.42, | |
| "step": 54 | |
| }, | |
| { | |
| "loss": 0.0011, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.45, | |
| "step": 55 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.47, | |
| "step": 56 | |
| }, | |
| { | |
| "loss": 0.0005, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.5, | |
| "step": 57 | |
| }, | |
| { | |
| "loss": 0.002, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.53, | |
| "step": 58 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.55, | |
| "step": 59 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.58, | |
| "step": 60 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.61, | |
| "step": 61 | |
| }, | |
| { | |
| "loss": 0.0022, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.63, | |
| "step": 62 | |
| }, | |
| { | |
| "loss": 0.001, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.66, | |
| "step": 63 | |
| }, | |
| { | |
| "loss": 0.0002, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.68, | |
| "step": 64 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.71, | |
| "step": 65 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.74, | |
| "step": 66 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.76, | |
| "step": 67 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.79, | |
| "step": 68 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.82, | |
| "step": 69 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.84, | |
| "step": 70 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.87, | |
| "step": 71 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.89, | |
| "step": 72 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.92, | |
| "step": 73 | |
| }, | |
| { | |
| "loss": 0.003, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.95, | |
| "step": 74 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.97, | |
| "step": 75 | |
| }, | |
| { | |
| "eval_code_low_quality_loss": 3.4825257898774e-05, | |
| "eval_code_low_quality_score": -8.544675722532702e-08, | |
| "eval_code_low_quality_brier_score": 8.544675722532702e-08, | |
| "eval_code_low_quality_average_probability": 0.9999703168869019, | |
| "eval_code_low_quality_accuracy": 1.0, | |
| "eval_code_low_quality_probabilities": [ | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999960660934448, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999958276748657, | |
| 0.9999983310699463, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 0.9999992847442627, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9970769882202148, | |
| 1.0, | |
| 0.9999996423721313, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999990463256836, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999997615814209, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999996423721313, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999974966049194, | |
| 0.9999973773956299, | |
| 1.0, | |
| 0.9999992847442627, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999749660491943, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 0.9999997615814209, | |
| 1.0 | |
| ], | |
| "eval_code_low_quality_runtime": 141.134, | |
| "eval_code_low_quality_samples_per_second": 0.709, | |
| "eval_code_low_quality_steps_per_second": 0.028, | |
| "epoch": 1.97, | |
| "step": 75 | |
| }, | |
| { | |
| "eval_code_loss": 0.41323670744895935, | |
| "eval_code_score": -0.12680457532405853, | |
| "eval_code_brier_score": 0.12680457532405853, | |
| "eval_code_average_probability": 0.7587159872055054, | |
| "eval_code_accuracy": 0.83, | |
| "eval_code_probabilities": [ | |
| 0.8840228915214539, | |
| 0.9449170827865601, | |
| 0.9977814555168152, | |
| 0.9999998807907104, | |
| 0.9982668161392212, | |
| 0.9896910190582275, | |
| 0.7586247324943542, | |
| 0.6018922924995422, | |
| 0.6262123584747314, | |
| 0.7324202060699463, | |
| 0.9547215104103088, | |
| 0.9301618337631226, | |
| 0.7506490349769592, | |
| 0.9963753819465637, | |
| 0.8704489469528198, | |
| 0.5361979603767395, | |
| 0.5121419429779053, | |
| 0.5582126975059509, | |
| 0.8438705205917358, | |
| 0.9842632412910461, | |
| 0.8747962713241577, | |
| 0.6529940962791443, | |
| 0.9806255102157593, | |
| 0.9927592277526855, | |
| 0.012452345341444016, | |
| 0.014053303748369217, | |
| 0.012323332950472832, | |
| 0.9999936819076538, | |
| 0.9999954700469971, | |
| 0.9993295669555664, | |
| 0.476261705160141, | |
| 0.9999690055847168, | |
| 0.7746478319168091, | |
| 0.7423850893974304, | |
| 0.3552600145339966, | |
| 0.3487190902233124, | |
| 0.961654782295227, | |
| 0.9592396020889282, | |
| 0.7986306548118591, | |
| 0.9999490976333618, | |
| 0.9817489385604858, | |
| 0.9756157994270325, | |
| 0.8439541459083557, | |
| 0.929361879825592, | |
| 0.9538075923919678, | |
| 0.929568350315094, | |
| 0.9999812841415405, | |
| 0.9999052286148071, | |
| 0.7754999995231628, | |
| 0.7285842895507812, | |
| 0.9990667700767517, | |
| 0.9999997615814209, | |
| 1.0, | |
| 0.9999964237213135, | |
| 0.6865420341491699, | |
| 0.4973016083240509, | |
| 0.45788219571113586, | |
| 0.8701395392417908, | |
| 0.515251874923706, | |
| 0.8549637794494629, | |
| 0.6026025414466858, | |
| 0.46106913685798645, | |
| 0.45153528451919556, | |
| 0.5452430248260498, | |
| 0.5482519268989563, | |
| 0.5275773406028748, | |
| 0.9999997615814209, | |
| 0.25358888506889343, | |
| 0.2506215274333954, | |
| 0.7635894417762756, | |
| 0.7153332829475403, | |
| 0.832649827003479, | |
| 0.5769205093383789, | |
| 0.85756516456604, | |
| 0.8781008720397949, | |
| 0.99993896484375, | |
| 0.9974363446235657, | |
| 0.9993440508842468, | |
| 0.9991888403892517, | |
| 0.7507019639015198, | |
| 0.829367995262146, | |
| 0.9905405044555664, | |
| 0.4980931282043457, | |
| 0.9923575520515442, | |
| 0.9980649352073669, | |
| 0.9964637160301208, | |
| 0.9999872446060181, | |
| 1.0, | |
| 1.0, | |
| 0.9999905824661255, | |
| 0.7705276608467102, | |
| 0.7632506489753723, | |
| 0.6713977456092834, | |
| 0.4876120388507843, | |
| 0.5282371640205383, | |
| 0.5807164311408997, | |
| 0.5882728099822998, | |
| 0.11337706446647644, | |
| 0.13702017068862915, | |
| 0.4889734983444214 | |
| ], | |
| "eval_code_runtime": 135.2481, | |
| "eval_code_samples_per_second": 0.739, | |
| "eval_code_steps_per_second": 0.03, | |
| "epoch": 1.97, | |
| "step": 75 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.0, | |
| "step": 76 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.03, | |
| "step": 77 | |
| }, | |
| { | |
| "loss": 0.0049, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.05, | |
| "step": 78 | |
| }, | |
| { | |
| "loss": 0.0312, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.08, | |
| "step": 79 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.11, | |
| "step": 80 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.13, | |
| "step": 81 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.16, | |
| "step": 82 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.18, | |
| "step": 83 | |
| }, | |
| { | |
| "loss": 0.0003, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.21, | |
| "step": 84 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.24, | |
| "step": 85 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.26, | |
| "step": 86 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.29, | |
| "step": 87 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.32, | |
| "step": 88 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.34, | |
| "step": 89 | |
| }, | |
| { | |
| "loss": 0.0006, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.37, | |
| "step": 90 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.39, | |
| "step": 91 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.42, | |
| "step": 92 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.45, | |
| "step": 93 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.47, | |
| "step": 94 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.5, | |
| "step": 95 | |
| }, | |
| { | |
| "loss": 0.0128, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.53, | |
| "step": 96 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.55, | |
| "step": 97 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.58, | |
| "step": 98 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.61, | |
| "step": 99 | |
| }, | |
| { | |
| "loss": 0.0007, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.63, | |
| "step": 100 | |
| }, | |
| { | |
| "eval_code_low_quality_loss": 0.00015671229630243033, | |
| "eval_code_low_quality_score": -1.3624161283587455e-06, | |
| "eval_code_low_quality_brier_score": 1.3624161283587455e-06, | |
| "eval_code_low_quality_average_probability": 0.9998810291290283, | |
| "eval_code_low_quality_accuracy": 1.0, | |
| "eval_code_low_quality_probabilities": [ | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999995231628418, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9998458623886108, | |
| 0.9999973773956299, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 0.9883288145065308, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999995231628418, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.999997615814209, | |
| 0.9999912977218628, | |
| 1.0, | |
| 0.9999877214431763, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999679327011108, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999959468841553, | |
| 1.0 | |
| ], | |
| "eval_code_low_quality_runtime": 141.0168, | |
| "eval_code_low_quality_samples_per_second": 0.709, | |
| "eval_code_low_quality_steps_per_second": 0.028, | |
| "epoch": 2.63, | |
| "step": 100 | |
| }, | |
| { | |
| "eval_code_loss": 1.384405493736267, | |
| "eval_code_score": -0.1918598711490631, | |
| "eval_code_brier_score": 0.1918598711490631, | |
| "eval_code_average_probability": 0.6802566051483154, | |
| "eval_code_accuracy": 0.82, | |
| "eval_code_probabilities": [ | |
| 2.7011897145712283e-06, | |
| 1.146102567872731e-05, | |
| 0.00012897477427031845, | |
| 0.9999865293502808, | |
| 0.9395932555198669, | |
| 0.8856058120727539, | |
| 0.7632039189338684, | |
| 0.6708762049674988, | |
| 0.6227125525474548, | |
| 0.7241858243942261, | |
| 0.9404862523078918, | |
| 0.9222924113273621, | |
| 0.6570658087730408, | |
| 0.9888173341751099, | |
| 0.79543137550354, | |
| 0.5034469962120056, | |
| 0.5368735194206238, | |
| 0.5535816550254822, | |
| 0.7554457187652588, | |
| 0.9272328615188599, | |
| 0.7993726134300232, | |
| 0.604550302028656, | |
| 0.8812964558601379, | |
| 0.9381894469261169, | |
| 0.002172264736145735, | |
| 0.0029873487073928118, | |
| 0.002684241160750389, | |
| 0.9999915361404419, | |
| 0.9999991655349731, | |
| 0.9999327659606934, | |
| 0.4827829599380493, | |
| 0.9303818345069885, | |
| 0.7092949151992798, | |
| 1.6805757923066267e-06, | |
| 7.52522396396671e-07, | |
| 1.1064344107580837e-06, | |
| 0.8093892931938171, | |
| 0.8280414342880249, | |
| 0.6371450424194336, | |
| 0.9915766716003418, | |
| 0.6807467937469482, | |
| 0.7864972949028015, | |
| 0.6430220007896423, | |
| 0.7116998434066772, | |
| 0.7039490938186646, | |
| 0.8259388208389282, | |
| 0.998793363571167, | |
| 0.9856457114219666, | |
| 0.7733932137489319, | |
| 0.6658198237419128, | |
| 0.9998243451118469, | |
| 0.999961256980896, | |
| 0.9999998807907104, | |
| 0.9991695880889893, | |
| 0.6490118503570557, | |
| 0.5122784376144409, | |
| 0.4935091733932495, | |
| 0.6350076198577881, | |
| 0.5762010216712952, | |
| 0.6138877868652344, | |
| 0.8648762702941895, | |
| 0.8143119215965271, | |
| 0.8287466764450073, | |
| 0.561292290687561, | |
| 0.5432232618331909, | |
| 0.5146270990371704, | |
| 0.997788667678833, | |
| 0.21196365356445312, | |
| 0.19605514407157898, | |
| 0.8330866098403931, | |
| 0.6678863763809204, | |
| 0.793769896030426, | |
| 0.5204634666442871, | |
| 0.7754390835762024, | |
| 0.7131609320640564, | |
| 0.9999798536300659, | |
| 0.9999628067016602, | |
| 0.995313286781311, | |
| 0.998515784740448, | |
| 0.7346359491348267, | |
| 0.769510805606842, | |
| 0.9687986969947815, | |
| 0.4848264753818512, | |
| 0.9456825256347656, | |
| 0.9103584289550781, | |
| 0.8984634280204773, | |
| 0.9972737431526184, | |
| 0.9999996423721313, | |
| 1.0, | |
| 0.999421238899231, | |
| 0.6589410901069641, | |
| 0.6035416722297668, | |
| 0.5996540784835815, | |
| 0.501044750213623, | |
| 0.5140662789344788, | |
| 0.5147275924682617, | |
| 0.3556048572063446, | |
| 0.07969348877668381, | |
| 0.09929317981004715, | |
| 0.49852368235588074 | |
| ], | |
| "eval_code_runtime": 135.256, | |
| "eval_code_samples_per_second": 0.739, | |
| "eval_code_steps_per_second": 0.03, | |
| "epoch": 2.63, | |
| "step": 100 | |
| }, | |
| { | |
| "train_runtime": 12458.6048, | |
| "train_samples_per_second": 0.257, | |
| "train_steps_per_second": 0.008, | |
| "total_flos": 0.0, | |
| "train_loss": 0.04692524675736063, | |
| "epoch": 2.63, | |
| "step": 100 | |
| } | |
| ] |