Instructions to use genies-models/llama-13b-code_low_quality with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- PEFT
How to use genies-models/llama-13b-code_low_quality with PEFT:
from peft import PeftModel
from transformers import AutoModelForSequenceClassification

base_model = AutoModelForSequenceClassification.from_pretrained("models/llama-13b")
model = PeftModel.from_pretrained(base_model, "genies-models/llama-13b-code_low_quality")
- Notebooks
- Google Colab
- Kaggle
Invalid JSON: Unterminated fractional number in JSON at line 1012, column 15
| [ | |
| { | |
| "loss": 0.6593, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.03, | |
| "step": 1 | |
| }, | |
| { | |
| "loss": 0.4945, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.05, | |
| "step": 2 | |
| }, | |
| { | |
| "loss": 0.3929, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.08, | |
| "step": 3 | |
| }, | |
| { | |
| "loss": 0.2804, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.11, | |
| "step": 4 | |
| }, | |
| { | |
| "loss": 0.276, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.13, | |
| "step": 5 | |
| }, | |
| { | |
| "loss": 0.3343, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.16, | |
| "step": 6 | |
| }, | |
| { | |
| "loss": 0.1975, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.18, | |
| "step": 7 | |
| }, | |
| { | |
| "loss": 0.274, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.21, | |
| "step": 8 | |
| }, | |
| { | |
| "loss": 0.2602, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.24, | |
| "step": 9 | |
| }, | |
| { | |
| "loss": 0.2084, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.26, | |
| "step": 10 | |
| }, | |
| { | |
| "loss": 0.1054, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.29, | |
| "step": 11 | |
| }, | |
| { | |
| "loss": 0.0939, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.32, | |
| "step": 12 | |
| }, | |
| { | |
| "loss": 0.135, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.34, | |
| "step": 13 | |
| }, | |
| { | |
| "loss": 0.0468, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.37, | |
| "step": 14 | |
| }, | |
| { | |
| "loss": 0.2461, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.39, | |
| "step": 15 | |
| }, | |
| { | |
| "loss": 0.1158, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.42, | |
| "step": 16 | |
| }, | |
| { | |
| "loss": 0.3144, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.45, | |
| "step": 17 | |
| }, | |
| { | |
| "loss": 0.1785, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.47, | |
| "step": 18 | |
| }, | |
| { | |
| "loss": 0.1156, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.5, | |
| "step": 19 | |
| }, | |
| { | |
| "loss": 0.0616, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.53, | |
| "step": 20 | |
| }, | |
| { | |
| "loss": 0.0447, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.55, | |
| "step": 21 | |
| }, | |
| { | |
| "loss": 0.0044, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.58, | |
| "step": 22 | |
| }, | |
| { | |
| "loss": 0.0612, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.61, | |
| "step": 23 | |
| }, | |
| { | |
| "loss": 0.0515, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.63, | |
| "step": 24 | |
| }, | |
| { | |
| "loss": 0.0108, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.66, | |
| "step": 25 | |
| }, | |
| { | |
| "eval_code_low_quality_loss": 0.010171000845730305, | |
| "eval_code_low_quality_score": -0.0019669600296765566, | |
| "eval_code_low_quality_brier_score": 0.0019669600296765566, | |
| "eval_code_low_quality_average_probability": 0.9910862445831299, | |
| "eval_code_low_quality_accuracy": 1.0, | |
| "eval_code_low_quality_probabilities": [ | |
| 0.9999998807907104, | |
| 0.9999998807907104, | |
| 0.9999916553497314, | |
| 0.9999791383743286, | |
| 0.9999998807907104, | |
| 0.9999997615814209, | |
| 0.9999990463256836, | |
| 0.9999992847442627, | |
| 0.9999996423721313, | |
| 0.9999985694885254, | |
| 0.9999996423721313, | |
| 0.9999994039535522, | |
| 0.9999995231628418, | |
| 0.9999998807907104, | |
| 0.9999997615814209, | |
| 0.9999998807907104, | |
| 0.9999974966049194, | |
| 0.9999810457229614, | |
| 0.9999998807907104, | |
| 0.9999997615814209, | |
| 0.9999979734420776, | |
| 0.9999966621398926, | |
| 0.9999923706054688, | |
| 0.9999973773956299, | |
| 0.9998645782470703, | |
| 0.9999245405197144, | |
| 0.9626507759094238, | |
| 0.9710566401481628, | |
| 0.9999980926513672, | |
| 0.9999955892562866, | |
| 0.9980201721191406, | |
| 0.9999994039535522, | |
| 0.9999995231628418, | |
| 0.9999991655349731, | |
| 0.999997615814209, | |
| 0.9999970197677612, | |
| 0.999995231628418, | |
| 0.999994158744812, | |
| 0.9999849796295166, | |
| 0.9999797344207764, | |
| 0.9999872446060181, | |
| 0.9999929666519165, | |
| 0.9999995231628418, | |
| 0.9999985694885254, | |
| 0.99998939037323, | |
| 0.9999997615814209, | |
| 0.9999953508377075, | |
| 0.999991774559021, | |
| 0.9996731281280518, | |
| 0.9995961785316467, | |
| 0.9999998807907104, | |
| 0.9999998807907104, | |
| 0.9999982118606567, | |
| 0.9999980926513672, | |
| 0.9999994039535522, | |
| 0.9999996423721313, | |
| 0.9999988079071045, | |
| 0.9999992847442627, | |
| 0.9999977350234985, | |
| 0.9999911785125732, | |
| 0.9999998807907104, | |
| 0.9999998807907104, | |
| 0.9999996423721313, | |
| 0.9999990463256836, | |
| 0.9917247295379639, | |
| 0.9974627494812012, | |
| 1.0, | |
| 0.9999998807907104, | |
| 0.9999998807907104, | |
| 0.9999995231628418, | |
| 0.9999998807907104, | |
| 1.0, | |
| 0.9999978542327881, | |
| 0.9999996423721313, | |
| 0.9999998807907104, | |
| 0.9999998807907104, | |
| 0.9999954700469971, | |
| 0.9999988079071045, | |
| 0.8898673057556152, | |
| 0.95624178647995, | |
| 0.9999982118606567, | |
| 0.9999994039535522, | |
| 0.9999997615814209, | |
| 0.9999995231628418, | |
| 0.9999998807907104, | |
| 0.9999997615814209, | |
| 0.7369291186332703, | |
| 0.6688874363899231, | |
| 0.9999933242797852, | |
| 0.9999909400939941, | |
| 0.9999688863754272, | |
| 0.9999462366104126, | |
| 0.9999872446060181, | |
| 0.9999003410339355, | |
| 0.9898979663848877, | |
| 0.9894485473632812, | |
| 0.9999990463256836, | |
| 0.9999994039535522, | |
| 0.9648559093475342, | |
| 0.992939829826355 | |
| ], | |
| "eval_code_low_quality_runtime": 108.3354, | |
| "eval_code_low_quality_samples_per_second": 0.923, | |
| "eval_code_low_quality_steps_per_second": 0.037, | |
| "epoch": 0.66, | |
| "step": 25 | |
| }, | |
| { | |
| "eval_code_loss": 0.775557279586792, | |
| "eval_code_score": -0.21216197311878204, | |
| "eval_code_brier_score": 0.21216197311878204, | |
| "eval_code_average_probability": 0.6170614361763, | |
| "eval_code_accuracy": 0.77, | |
| "eval_code_probabilities": [ | |
| 0.0018926338525488973, | |
| 0.012711296789348125, | |
| 0.007091669365763664, | |
| 0.6062625646591187, | |
| 0.9943353533744812, | |
| 0.5690382719039917, | |
| 0.6241586208343506, | |
| 0.662219226360321, | |
| 0.5325962901115417, | |
| 0.5391229391098022, | |
| 0.7178332805633545, | |
| 0.6171442866325378, | |
| 0.577951967716217, | |
| 0.8548311591148376, | |
| 0.7104359865188599, | |
| 0.5026382803916931, | |
| 0.5293322801589966, | |
| 0.5492123365402222, | |
| 0.6345873475074768, | |
| 0.7990339398384094, | |
| 0.5863059163093567, | |
| 0.48554468154907227, | |
| 0.6499708294868469, | |
| 0.5989818572998047, | |
| 0.2676376402378082, | |
| 0.2834436595439911, | |
| 0.28170374035835266, | |
| 0.8311360478401184, | |
| 0.9110060334205627, | |
| 0.9641320109367371, | |
| 0.45280739665031433, | |
| 0.7613933086395264, | |
| 0.5464147329330444, | |
| 0.01752450130879879, | |
| 0.005836487282067537, | |
| 0.006046702619642019, | |
| 0.5162467956542969, | |
| 0.5298649668693542, | |
| 0.5247464179992676, | |
| 0.9592331647872925, | |
| 0.8196842670440674, | |
| 0.7410209774971008, | |
| 0.796080470085144, | |
| 0.9008417725563049, | |
| 0.6857371926307678, | |
| 0.5978904962539673, | |
| 0.9823793768882751, | |
| 0.9868221282958984, | |
| 0.5604033470153809, | |
| 0.5046380758285522, | |
| 0.999763548374176, | |
| 0.9999983310699463, | |
| 0.9999935626983643, | |
| 0.9927141070365906, | |
| 0.516162097454071, | |
| 0.521334171295166, | |
| 0.513815701007843, | |
| 0.5127142667770386, | |
| 0.5125176906585693, | |
| 0.5335236191749573, | |
| 0.3885745108127594, | |
| 0.449074923992157, | |
| 0.43242695927619934, | |
| 0.42709216475486755, | |
| 0.509745180606842, | |
| 0.5419602394104004, | |
| 0.9643940329551697, | |
| 0.46200674772262573, | |
| 0.44968515634536743, | |
| 0.7517949342727661, | |
| 0.35403740406036377, | |
| 0.9996168613433838, | |
| 0.43991619348526, | |
| 0.2799178659915924, | |
| 0.6076914072036743, | |
| 0.9999991655349731, | |
| 0.9997984766960144, | |
| 0.9999959468841553, | |
| 0.9999561309814453, | |
| 0.6099094748497009, | |
| 0.6852646470069885, | |
| 0.8096278309822083, | |
| 0.5049552321434021, | |
| 0.818763017654419, | |
| 0.6465492248535156, | |
| 0.5962660312652588, | |
| 0.9850568175315857, | |
| 0.9976211190223694, | |
| 0.9992263317108154, | |
| 0.6331233978271484, | |
| 0.6343858242034912, | |
| 0.49390336871147156, | |
| 0.5998658537864685, | |
| 0.5048991441726685, | |
| 0.507156252861023, | |
| 0.5149410367012024, | |
| 0.9476234316825867, | |
| 0.39861536026000977, | |
| 0.34747856855392456, | |
| 0.5127823948860168 | |
| ], | |
| "eval_code_runtime": 105.3963, | |
| "eval_code_samples_per_second": 0.949, | |
| "eval_code_steps_per_second": 0.038, | |
| "epoch": 0.66, | |
| "step": 25 | |
| }, | |
| { | |
| "loss": 0.0077, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.68, | |
| "step": 26 | |
| }, | |
| { | |
| "loss": 0.0157, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.71, | |
| "step": 27 | |
| }, | |
| { | |
| "loss": 0.0055, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.74, | |
| "step": 28 | |
| }, | |
| { | |
| "loss": 0.0043, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.76, | |
| "step": 29 | |
| }, | |
| { | |
| "loss": 0.0007, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.79, | |
| "step": 30 | |
| }, | |
| { | |
| "loss": 0.0017, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.82, | |
| "step": 31 | |
| }, | |
| { | |
| "loss": 0.0046, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.84, | |
| "step": 32 | |
| }, | |
| { | |
| "loss": 0.0002, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.87, | |
| "step": 33 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.89, | |
| "step": 34 | |
| }, | |
| { | |
| "loss": 0.0148, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.92, | |
| "step": 35 | |
| }, | |
| { | |
| "loss": 0.0026, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.95, | |
| "step": 36 | |
| }, | |
| { | |
| "loss": 0.0006, | |
| "learning_rate": 0.0002, | |
| "epoch": 0.97, | |
| "step": 37 | |
| }, | |
| { | |
| "loss": 0.0043, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.0, | |
| "step": 38 | |
| }, | |
| { | |
| "loss": 0.0002, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.03, | |
| "step": 39 | |
| }, | |
| { | |
| "loss": 0.0004, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.05, | |
| "step": 40 | |
| }, | |
| { | |
| "loss": 0.0003, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.08, | |
| "step": 41 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.11, | |
| "step": 42 | |
| }, | |
| { | |
| "loss": 0.0095, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.13, | |
| "step": 43 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.16, | |
| "step": 44 | |
| }, | |
| { | |
| "loss": 0.2013, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.18, | |
| "step": 45 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.21, | |
| "step": 46 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.24, | |
| "step": 47 | |
| }, | |
| { | |
| "loss": 0.0047, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.26, | |
| "step": 48 | |
| }, | |
| { | |
| "loss": 0.0004, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.29, | |
| "step": 49 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.32, | |
| "step": 50 | |
| }, | |
| { | |
| "eval_code_low_quality_loss": 0.001378062181174755, | |
| "eval_code_low_quality_score": -5.075635272078216e-05, | |
| "eval_code_low_quality_brier_score": 5.075635272078216e-05, | |
| "eval_code_low_quality_average_probability": 0.9987315535545349, | |
| "eval_code_low_quality_accuracy": 1.0, | |
| "eval_code_low_quality_probabilities": [ | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999997615814209, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999840259552002, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.967201828956604, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9908334612846375, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999980926513672, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 0.999922513961792, | |
| 0.9999967813491821, | |
| 0.9999996423721313, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9702784419059753, | |
| 0.9449317455291748, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999991655349731, | |
| 1.0 | |
| ], | |
| "eval_code_low_quality_runtime": 108.1154, | |
| "eval_code_low_quality_samples_per_second": 0.925, | |
| "eval_code_low_quality_steps_per_second": 0.037, | |
| "epoch": 1.32, | |
| "step": 50 | |
| }, | |
| { | |
| "eval_code_loss": 1.3461368083953857, | |
| "eval_code_score": -0.22116898000240326, | |
| "eval_code_brier_score": 0.22116898000240326, | |
| "eval_code_average_probability": 0.5982358455657959, | |
| "eval_code_accuracy": 0.8, | |
| "eval_code_probabilities": [ | |
| 4.050308746172959e-07, | |
| 2.979102418976254e-06, | |
| 2.6617096864356427e-06, | |
| 0.5738264918327332, | |
| 0.8691526651382446, | |
| 0.5516966581344604, | |
| 0.5616106986999512, | |
| 0.5491132140159607, | |
| 0.5290331244468689, | |
| 0.49235308170318604, | |
| 0.5810630321502686, | |
| 0.5722699761390686, | |
| 0.5287314057350159, | |
| 0.6949906349182129, | |
| 0.5635644197463989, | |
| 0.5054471492767334, | |
| 0.4994816780090332, | |
| 0.5129610896110535, | |
| 0.6220285296440125, | |
| 0.6764118671417236, | |
| 0.5921300649642944, | |
| 0.503677248954773, | |
| 0.5439413785934448, | |
| 0.5423399806022644, | |
| 0.431194007396698, | |
| 0.42188534140586853, | |
| 0.42363011837005615, | |
| 0.9709718227386475, | |
| 0.9995226860046387, | |
| 0.9999279975891113, | |
| 0.4847673773765564, | |
| 0.5603877305984497, | |
| 0.5247597694396973, | |
| 3.816174285020679e-06, | |
| 1.9298215647722827e-06, | |
| 1.9306407921249047e-06, | |
| 0.527335524559021, | |
| 0.5305987596511841, | |
| 0.5162070393562317, | |
| 0.946389377117157, | |
| 0.8050153255462646, | |
| 0.8141985535621643, | |
| 0.5671536326408386, | |
| 0.6023316383361816, | |
| 0.5614919066429138, | |
| 0.5858514904975891, | |
| 0.9122728705406189, | |
| 0.9817299842834473, | |
| 0.532357931137085, | |
| 0.5182923674583435, | |
| 0.9870670437812805, | |
| 0.999982476234436, | |
| 0.9999992847442627, | |
| 0.9999778270721436, | |
| 0.5067487359046936, | |
| 0.5095696449279785, | |
| 0.5025925040245056, | |
| 0.4237653911113739, | |
| 0.5117032527923584, | |
| 0.4223073124885559, | |
| 0.6444336175918579, | |
| 0.6726469993591309, | |
| 0.6397074460983276, | |
| 0.7292462587356567, | |
| 0.5063377618789673, | |
| 0.5283511281013489, | |
| 0.706869900226593, | |
| 0.46199607849121094, | |
| 0.4430694580078125, | |
| 0.9500992894172668, | |
| 0.22525879740715027, | |
| 0.9999823570251465, | |
| 0.47554466128349304, | |
| 0.51363205909729, | |
| 0.6031032800674438, | |
| 0.9999370574951172, | |
| 0.658456563949585, | |
| 0.9959049820899963, | |
| 0.902746856212616, | |
| 0.5577074289321899, | |
| 0.5983836650848389, | |
| 0.7882758975028992, | |
| 0.5046991109848022, | |
| 0.8182088732719421, | |
| 0.549981951713562, | |
| 0.5202911496162415, | |
| 0.9605872631072998, | |
| 0.9999349117279053, | |
| 0.9999911785125732, | |
| 0.7577045559883118, | |
| 0.6290202736854553, | |
| 0.5034119486808777, | |
| 0.569599449634552, | |
| 0.503978431224823, | |
| 0.507115364074707, | |
| 0.5144593715667725, | |
| 0.770204484462738, | |
| 0.23782096803188324, | |
| 0.22504965960979462, | |
| 0.5020108222961426 | |
| ], | |
| "eval_code_runtime": 105.4075, | |
| "eval_code_samples_per_second": 0.949, | |
| "eval_code_steps_per_second": 0.038, | |
| "epoch": 1.32, | |
| "step": 50 | |
| }, | |
| { | |
| "loss": 0.0015, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.34, | |
| "step": 51 | |
| }, | |
| { | |
| "loss": 0.0049, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.37, | |
| "step": 52 | |
| }, | |
| { | |
| "loss": 0.0119, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.39, | |
| "step": 53 | |
| }, | |
| { | |
| "loss": 0.0028, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.42, | |
| "step": 54 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.45, | |
| "step": 55 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.47, | |
| "step": 56 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.5, | |
| "step": 57 | |
| }, | |
| { | |
| "loss": 0.0024, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.53, | |
| "step": 58 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.55, | |
| "step": 59 | |
| }, | |
| { | |
| "loss": 0.0002, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.58, | |
| "step": 60 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.61, | |
| "step": 61 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.63, | |
| "step": 62 | |
| }, | |
| { | |
| "loss": 0.0017, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.66, | |
| "step": 63 | |
| }, | |
| { | |
| "loss": 0.0018, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.68, | |
| "step": 64 | |
| }, | |
| { | |
| "loss": 0.0008, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.71, | |
| "step": 65 | |
| }, | |
| { | |
| "loss": 0.0068, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.74, | |
| "step": 66 | |
| }, | |
| { | |
| "loss": 0.001, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.76, | |
| "step": 67 | |
| }, | |
| { | |
| "loss": 0.0002, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.79, | |
| "step": 68 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.82, | |
| "step": 69 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.84, | |
| "step": 70 | |
| }, | |
| { | |
| "loss": 0.0006, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.87, | |
| "step": 71 | |
| }, | |
| { | |
| "loss": 0.0003, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.89, | |
| "step": 72 | |
| }, | |
| { | |
| "loss": 0.1335, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.92, | |
| "step": 73 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.95, | |
| "step": 74 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 1.97, | |
| "step": 75 | |
| }, | |
| { | |
| "eval_code_low_quality_loss": 0.0005032618064433336, | |
| "eval_code_low_quality_score": -1.0583773473626934e-05, | |
| "eval_code_low_quality_brier_score": 1.0583773473626934e-05, | |
| "eval_code_low_quality_average_probability": 0.9995136857032776, | |
| "eval_code_low_quality_accuracy": 1.0, | |
| "eval_code_low_quality_probabilities": [ | |
| 1.0, | |
| 0.9999967813491821, | |
| 0.9999997615814209, | |
| 0.9983976483345032, | |
| 1.0, | |
| 0.9999837875366211, | |
| 1.0, | |
| 0.9997871518135071, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9918645620346069, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9998249411582947, | |
| 0.998837411403656, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999996423721313, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9688511490821838, | |
| 0.9999998807907104, | |
| 1.0, | |
| 0.9999991655349731, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 0.9999998807907104, | |
| 1.0, | |
| 0.999982476234436, | |
| 0.9999701976776123, | |
| 0.995941698551178, | |
| 0.9999995231628418, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999868869781494, | |
| 0.9999997615814209, | |
| 0.9999061822891235, | |
| 1.0, | |
| 1.0, | |
| 0.9999092817306519, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999996423721313, | |
| 0.9999997615814209, | |
| 1.0, | |
| 0.9999204874038696, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9989272952079773, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 0.9994589686393738, | |
| 1.0, | |
| 0.9999996423721313, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999737739562988, | |
| 0.999944806098938, | |
| 0.9999998807907104, | |
| 0.9999788999557495, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999411106109619, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999876022338867, | |
| 1.0 | |
| ], | |
| "eval_code_low_quality_runtime": 108.2376, | |
| "eval_code_low_quality_samples_per_second": 0.924, | |
| "eval_code_low_quality_steps_per_second": 0.037, | |
| "epoch": 1.97, | |
| "step": 75 | |
| }, | |
| { | |
| "eval_code_loss": 1.5990806818008423, | |
| "eval_code_score": -0.2409353256225586, | |
| "eval_code_brier_score": 0.2409353256225586, | |
| "eval_code_average_probability": 0.5683663487434387, | |
| "eval_code_accuracy": 0.8, | |
| "eval_code_probabilities": [ | |
| 1.1873796168515582e-08, | |
| 5.058638308241825e-08, | |
| 6.313541689451085e-08, | |
| 0.5709640979766846, | |
| 0.6853320002555847, | |
| 0.5568627715110779, | |
| 0.5487821102142334, | |
| 0.5347866415977478, | |
| 0.5317322611808777, | |
| 0.512122631072998, | |
| 0.5734414458274841, | |
| 0.5738123059272766, | |
| 0.5303495526313782, | |
| 0.6757323741912842, | |
| 0.6369258165359497, | |
| 0.5054691433906555, | |
| 0.4862286150455475, | |
| 0.4997119903564453, | |
| 0.5902368426322937, | |
| 0.6018257737159729, | |
| 0.541638970375061, | |
| 0.5033149123191833, | |
| 0.5362597703933716, | |
| 0.5289673209190369, | |
| 0.24309313297271729, | |
| 0.22363527119159698, | |
| 0.22765608131885529, | |
| 0.7798057794570923, | |
| 0.9960242509841919, | |
| 0.9997923970222473, | |
| 0.5013885498046875, | |
| 0.528499186038971, | |
| 0.5185747146606445, | |
| 4.462568199414818e-07, | |
| 2.2847591196750727e-07, | |
| 2.316882046216051e-07, | |
| 0.5187056660652161, | |
| 0.5277567505836487, | |
| 0.510230541229248, | |
| 0.9069125056266785, | |
| 0.8473342061042786, | |
| 0.8101637363433838, | |
| 0.537501335144043, | |
| 0.5229093432426453, | |
| 0.5179290175437927, | |
| 0.594524621963501, | |
| 0.8149073123931885, | |
| 0.9026350378990173, | |
| 0.5351212024688721, | |
| 0.5195194482803345, | |
| 0.9832677245140076, | |
| 0.9752768874168396, | |
| 0.9901442527770996, | |
| 0.9911841154098511, | |
| 0.5086742043495178, | |
| 0.5045136213302612, | |
| 0.5005779266357422, | |
| 0.4479965567588806, | |
| 0.5039933919906616, | |
| 0.44930532574653625, | |
| 0.5485993027687073, | |
| 0.6136952042579651, | |
| 0.5874925255775452, | |
| 0.6819684505462646, | |
| 0.5115750432014465, | |
| 0.5058901309967041, | |
| 0.7632222771644592, | |
| 0.3942977488040924, | |
| 0.3785106837749481, | |
| 0.8528256416320801, | |
| 0.5036994814872742, | |
| 0.9950182437896729, | |
| 0.48869040608406067, | |
| 0.5160850882530212, | |
| 0.5451788306236267, | |
| 0.9758601188659668, | |
| 0.44595080614089966, | |
| 0.8039615750312805, | |
| 0.8271895051002502, | |
| 0.5377886891365051, | |
| 0.5619093775749207, | |
| 0.8048967123031616, | |
| 0.502302885055542, | |
| 0.766408383846283, | |
| 0.5268206000328064, | |
| 0.5031132102012634, | |
| 0.8771815896034241, | |
| 0.9855904579162598, | |
| 0.9990859031677246, | |
| 0.6270195841789246, | |
| 0.55865478515625, | |
| 0.5030545592308044, | |
| 0.5426568984985352, | |
| 0.5039815306663513, | |
| 0.5092061758041382, | |
| 0.5093463659286499, | |
| 0.4080256521701813, | |
| 0.24740169942378998, | |
| 0.2555961608886719, | |
| 0.5028347373008728 | |
| ], | |
| "eval_code_runtime": 105.2631, | |
| "eval_code_samples_per_second": 0.95, | |
| "eval_code_steps_per_second": 0.038, | |
| "epoch": 1.97, | |
| "step": 75 | |
| }, | |
| { | |
| "loss": 0.012, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.0, | |
| "step": 76 | |
| }, | |
| { | |
| "loss": 0.0006, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.03, | |
| "step": 77 | |
| }, | |
| { | |
| "loss": 0.0006, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.05, | |
| "step": 78 | |
| }, | |
| { | |
| "loss": 0.0006, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.08, | |
| "step": 79 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.11, | |
| "step": 80 | |
| }, | |
| { | |
| "loss": 0.005, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.13, | |
| "step": 81 | |
| }, | |
| { | |
| "loss": 0.0007, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.16, | |
| "step": 82 | |
| }, | |
| { | |
| "loss": 0.0002, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.18, | |
| "step": 83 | |
| }, | |
| { | |
| "loss": 0.0019, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.21, | |
| "step": 84 | |
| }, | |
| { | |
| "loss": 0.0007, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.24, | |
| "step": 85 | |
| }, | |
| { | |
| "loss": 0.0014, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.26, | |
| "step": 86 | |
| }, | |
| { | |
| "loss": 0.0005, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.29, | |
| "step": 87 | |
| }, | |
| { | |
| "loss": 0.001, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.32, | |
| "step": 88 | |
| }, | |
| { | |
| "loss": 0.0006, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.34, | |
| "step": 89 | |
| }, | |
| { | |
| "loss": 0.0004, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.37, | |
| "step": 90 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.39, | |
| "step": 91 | |
| }, | |
| { | |
| "loss": 0.0006, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.42, | |
| "step": 92 | |
| }, | |
| { | |
| "loss": 0.0028, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.45, | |
| "step": 93 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.47, | |
| "step": 94 | |
| }, | |
| { | |
| "loss": 0.0024, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.5, | |
| "step": 95 | |
| }, | |
| { | |
| "loss": 0.0059, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.53, | |
| "step": 96 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.55, | |
| "step": 97 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.58, | |
| "step": 98 | |
| }, | |
| { | |
| "loss": 0.0003, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.61, | |
| "step": 99 | |
| }, | |
| { | |
| "loss": 0.0003, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.63, | |
| "step": 100 | |
| }, | |
| { | |
| "eval_code_low_quality_loss": 6.671607116004452e-05, | |
| "eval_code_low_quality_score": -3.4999186482309597e-07, | |
| "eval_code_low_quality_brier_score": 3.4999186482309597e-07, | |
| "eval_code_low_quality_average_probability": 0.9999365210533142, | |
| "eval_code_low_quality_accuracy": 1.0, | |
| "eval_code_low_quality_probabilities": [ | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.999998927116394, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999990463256836, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9996960163116455, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9940925240516663, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999995231628418, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999983310699463, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999991655349731, | |
| 1.0, | |
| 0.9999901056289673, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999704360961914, | |
| 0.999913215637207, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0 | |
| ], | |
| "eval_code_low_quality_runtime": 108.4514, | |
| "eval_code_low_quality_samples_per_second": 0.922, | |
| "eval_code_low_quality_steps_per_second": 0.037, | |
| "epoch": 2.63, | |
| "step": 100 | |
| }, | |
| { | |
| "eval_code_loss": 1.2588822841644287, | |
| "eval_code_score": -0.24486389756202698, | |
| "eval_code_brier_score": 0.24486389756202698, | |
| "eval_code_average_probability": 0.6122177839279175, | |
| "eval_code_accuracy": 0.78, | |
| "eval_code_probabilities": [ | |
| 3.716594960678776e-07, | |
| 4.86033532069996e-05, | |
| 5.94538141740486e-05, | |
| 0.7322285175323486, | |
| 0.992759108543396, | |
| 0.6937164068222046, | |
| 0.6719813346862793, | |
| 0.5284847021102905, | |
| 0.5714943408966064, | |
| 0.5305595397949219, | |
| 0.7621225118637085, | |
| 0.7049319744110107, | |
| 0.5994599461555481, | |
| 0.9482231736183167, | |
| 0.9427314400672913, | |
| 0.5233908295631409, | |
| 0.5151730179786682, | |
| 0.5592909455299377, | |
| 0.6389124989509583, | |
| 0.7489423155784607, | |
| 0.5400505661964417, | |
| 0.4894372224807739, | |
| 0.7627068758010864, | |
| 0.676575243473053, | |
| 0.001497809775173664, | |
| 0.0012255371548235416, | |
| 0.0013199239037930965, | |
| 0.9070805907249451, | |
| 0.9999668598175049, | |
| 0.9999922513961792, | |
| 0.48677918314933777, | |
| 0.6579598784446716, | |
| 0.5528249740600586, | |
| 0.0031468200031667948, | |
| 0.0008608169737271965, | |
| 0.0007525159744545817, | |
| 0.628882110118866, | |
| 0.5596430897712708, | |
| 0.5554695725440979, | |
| 0.9984580278396606, | |
| 0.989458441734314, | |
| 0.9929828643798828, | |
| 0.7459701895713806, | |
| 0.8483384251594543, | |
| 0.5955826044082642, | |
| 0.8648329377174377, | |
| 0.9960275888442993, | |
| 0.9993523955345154, | |
| 0.5829755067825317, | |
| 0.6307886838912964, | |
| 0.994866132736206, | |
| 0.9999991655349731, | |
| 0.9999984502792358, | |
| 0.9999934434890747, | |
| 0.5436527132987976, | |
| 0.5340330600738525, | |
| 0.5099152326583862, | |
| 0.5169093608856201, | |
| 0.5082399249076843, | |
| 0.5305851697921753, | |
| 0.0689636766910553, | |
| 0.09695249050855637, | |
| 0.09122244268655777, | |
| 0.4549616277217865, | |
| 0.5240060091018677, | |
| 0.539696216583252, | |
| 0.9665416479110718, | |
| 0.2522982358932495, | |
| 0.24534465372562408, | |
| 0.905021071434021, | |
| 0.31865352392196655, | |
| 0.999656081199646, | |
| 0.4672524631023407, | |
| 0.5117397308349609, | |
| 0.5817976593971252, | |
| 0.9999037981033325, | |
| 0.9686040282249451, | |
| 0.9996315240859985, | |
| 0.996566653251648, | |
| 0.7026336789131165, | |
| 0.7814198732376099, | |
| 0.8912621140480042, | |
| 0.5140696167945862, | |
| 0.9321841597557068, | |
| 0.673382580280304, | |
| 0.6223154664039612, | |
| 0.9992823004722595, | |
| 0.9998123049736023, | |
| 0.9999938011169434, | |
| 0.697952926158905, | |
| 0.7329107522964478, | |
| 0.4842481017112732, | |
| 0.6284154057502747, | |
| 0.5115850567817688, | |
| 0.525327205657959, | |
| 0.5679951310157776, | |
| 0.5145466923713684, | |
| 0.02526971884071827, | |
| 0.02999242953956127, | |
| 0.5247264504432678 | |
| ], | |
| "eval_code_runtime": 105.3153, | |
| "eval_code_samples_per_second": 0.95, | |
| "eval_code_steps_per_second": 0.038, | |
| "epoch": 2.63, | |
| "step": 100 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.66, | |
| "step": 101 | |
| }, | |
| { | |
| "loss": 0.0009, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.68, | |
| "step": 102 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.71, | |
| "step": 103 | |
| }, | |
| { | |
| "loss": 0.0002, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.74, | |
| "step": 104 | |
| }, | |
| { | |
| "loss": 0.0016, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.76, | |
| "step": 105 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.79, | |
| "step": 106 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.82, | |
| "step": 107 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.84, | |
| "step": 108 | |
| }, | |
| { | |
| "loss": 0.0005, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.87, | |
| "step": 109 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.89, | |
| "step": 110 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.92, | |
| "step": 111 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.95, | |
| "step": 112 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 2.97, | |
| "step": 113 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.0, | |
| "step": 114 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.03, | |
| "step": 115 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.05, | |
| "step": 116 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.08, | |
| "step": 117 | |
| }, | |
| { | |
| "loss": 0.0002, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.11, | |
| "step": 118 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.13, | |
| "step": 119 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.16, | |
| "step": 120 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.18, | |
| "step": 121 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.21, | |
| "step": 122 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.24, | |
| "step": 123 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.26, | |
| "step": 124 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.29, | |
| "step": 125 | |
| }, | |
| { | |
| "eval_code_low_quality_loss": 0.0007014500442892313, | |
| "eval_code_low_quality_score": -3.61457969120238e-05, | |
| "eval_code_low_quality_brier_score": 3.61457969120238e-05, | |
| "eval_code_low_quality_average_probability": 0.9993457198143005, | |
| "eval_code_low_quality_accuracy": 1.0, | |
| "eval_code_low_quality_probabilities": [ | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999996423721313, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999995231628418, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9399757981300354, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.99994957447052, | |
| 0.9999979734420776, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999996423721313, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9985740184783936, | |
| 0.9999673366546631, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9990741014480591, | |
| 0.9970368146896362, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 0.9999984502792358, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0 | |
| ], | |
| "eval_code_low_quality_runtime": 108.4065, | |
| "eval_code_low_quality_samples_per_second": 0.922, | |
| "eval_code_low_quality_steps_per_second": 0.037, | |
| "epoch": 3.29, | |
| "step": 125 | |
| }, | |
| { | |
| "eval_code_loss": 1.043724775314331, | |
| "eval_code_score": -0.21790370345115662, | |
| "eval_code_brier_score": 0.21790370345115662, | |
| "eval_code_average_probability": 0.6578189134597778, | |
| "eval_code_accuracy": 0.77, | |
| "eval_code_probabilities": [ | |
| 2.9980761610204354e-05, | |
| 0.16327866911888123, | |
| 0.1223980113863945, | |
| 0.8630220293998718, | |
| 0.9999371767044067, | |
| 0.8081788420677185, | |
| 0.7690643668174744, | |
| 0.4431692361831665, | |
| 0.6145693063735962, | |
| 0.5692129731178284, | |
| 0.8545891046524048, | |
| 0.7837128043174744, | |
| 0.678038477897644, | |
| 0.9840186238288879, | |
| 0.9795506000518799, | |
| 0.541788637638092, | |
| 0.5379593372344971, | |
| 0.6108262538909912, | |
| 0.6568173766136169, | |
| 0.9312652349472046, | |
| 0.5693832039833069, | |
| 0.491776704788208, | |
| 0.865976095199585, | |
| 0.7813358306884766, | |
| 1.2309145859035198e-05, | |
| 9.09055961528793e-06, | |
| 1.0214143912889995e-05, | |
| 0.9485948085784912, | |
| 0.9997069239616394, | |
| 0.999749481678009, | |
| 0.45955172181129456, | |
| 0.8172199726104736, | |
| 0.5752690434455872, | |
| 0.6527258157730103, | |
| 0.2048613727092743, | |
| 0.13845929503440857, | |
| 0.7823963761329651, | |
| 0.6123839616775513, | |
| 0.6217948198318481, | |
| 0.9999850988388062, | |
| 0.999450147151947, | |
| 0.9998420476913452, | |
| 0.9847567677497864, | |
| 0.9996198415756226, | |
| 0.6785285472869873, | |
| 0.9706732630729675, | |
| 0.9999459981918335, | |
| 0.9999982118606567, | |
| 0.6881040930747986, | |
| 0.7350975871086121, | |
| 0.9948760867118835, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.5983561873435974, | |
| 0.5580247640609741, | |
| 0.5120639801025391, | |
| 0.5918711423873901, | |
| 0.5148324370384216, | |
| 0.6228303909301758, | |
| 0.006977998651564121, | |
| 0.011295206844806671, | |
| 0.012422475032508373, | |
| 0.4554630219936371, | |
| 0.5428009033203125, | |
| 0.5566087961196899, | |
| 0.9991586208343506, | |
| 0.11367473751306534, | |
| 0.12123917788267136, | |
| 0.9770430326461792, | |
| 0.1478639841079712, | |
| 0.9995866417884827, | |
| 0.4416849911212921, | |
| 0.491413414478302, | |
| 0.6343856453895569, | |
| 0.9999972581863403, | |
| 0.9927133917808533, | |
| 0.9999967813491821, | |
| 0.9998946189880371, | |
| 0.8279895186424255, | |
| 0.914436936378479, | |
| 0.9620551466941833, | |
| 0.5265487432479858, | |
| 0.9861032962799072, | |
| 0.8208467960357666, | |
| 0.7353063821792603, | |
| 0.9999938011169434, | |
| 0.9998844861984253, | |
| 0.999961256980896, | |
| 0.8301354050636292, | |
| 0.8745093941688538, | |
| 0.46109309792518616, | |
| 0.7134401798248291, | |
| 0.5036332011222839, | |
| 0.5366954207420349, | |
| 0.6171916127204895, | |
| 0.5420334339141846, | |
| 0.0013571635354310274, | |
| 0.0021216413006186485, | |
| 0.5408289432525635 | |
| ], | |
| "eval_code_runtime": 105.5069, | |
| "eval_code_samples_per_second": 0.948, | |
| "eval_code_steps_per_second": 0.038, | |
| "epoch": 3.29, | |
| "step": 125 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.32, | |
| "step": 126 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.34, | |
| "step": 127 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.37, | |
| "step": 128 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.39, | |
| "step": 129 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.42, | |
| "step": 130 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.45, | |
| "step": 131 | |
| }, | |
| { | |
| "loss": 0.0004, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.47, | |
| "step": 132 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.5, | |
| "step": 133 | |
| }, | |
| { | |
| "loss": 0.08, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.53, | |
| "step": 134 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.55, | |
| "step": 135 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.58, | |
| "step": 136 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.61, | |
| "step": 137 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.63, | |
| "step": 138 | |
| }, | |
| { | |
| "loss": 0.001, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.66, | |
| "step": 139 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.68, | |
| "step": 140 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.71, | |
| "step": 141 | |
| }, | |
| { | |
| "loss": 0.0, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.74, | |
| "step": 142 | |
| }, | |
| { | |
| "loss": 0.0003, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.76, | |
| "step": 143 | |
| }, | |
| { | |
| "loss": 0.0114, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.79, | |
| "step": 144 | |
| }, | |
| { | |
| "loss": 0.006, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.82, | |
| "step": 145 | |
| }, | |
| { | |
| "loss": 0.0011, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.84, | |
| "step": 146 | |
| }, | |
| { | |
| "loss": 0.0042, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.87, | |
| "step": 147 | |
| }, | |
| { | |
| "loss": 0.0015, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.89, | |
| "step": 148 | |
| }, | |
| { | |
| "loss": 0.0003, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.92, | |
| "step": 149 | |
| }, | |
| { | |
| "loss": 0.0001, | |
| "learning_rate": 0.0002, | |
| "epoch": 3.95, | |
| "step": 150 | |
| }, | |
| { | |
| "eval_code_low_quality_loss": 0.00038435429451055825, | |
| "eval_code_low_quality_score": -6.823713192716241e-06, | |
| "eval_code_low_quality_brier_score": 6.823713192716241e-06, | |
| "eval_code_low_quality_average_probability": 0.9996289014816284, | |
| "eval_code_low_quality_accuracy": 1.0, | |
| "eval_code_low_quality_probabilities": [ | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999984502792358, | |
| 1.0, | |
| 1.0, | |
| 0.9999983310699463, | |
| 0.9999969005584717, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999916553497314, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999995231628418, | |
| 0.9999638795852661, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999983310699463, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9766356945037842, | |
| 0.9999997615814209, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9885169267654419, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999992847442627, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999996423721313, | |
| 1.0, | |
| 0.9999995231628418, | |
| 1.0, | |
| 0.9999998807907104, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999713897705078, | |
| 0.9978513717651367, | |
| 0.9999997615814209, | |
| 0.9999988079071045, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999997615814209, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 1.0, | |
| 0.9999719858169556, | |
| 1.0 | |
| ], | |
| "eval_code_low_quality_runtime": 108.3342, | |
| "eval_code_low_quality_samples_per_second": 0.923, | |
| "eval_code_low_quality_steps_per_second": 0.037, | |
| "epoch": 3.95, | |
| "step": 150 | |
| }, | |
| { | |
| "eval_code_loss": 2.0963048934936523, | |
| "eval_code_score": -0.2217760533094406, | |
| "eval_code_brier_score": 0.2217760533094406, | |
| "eval_code_average_probability": 0.6159726977348328, | |
| "eval_code_accuracy": 0.76, | |
| "eval_code_probabilities": [ | |
| 3.5287172489573138e-12, | |
| 5.817486076198364e-11, | |
| 1.8693878389708374e-10, | |
| 0.765636146068573, | |
| 0.9234081506729126, | |
| 0.7391408085823059, | |
| 0.659432590007782, | |
| 0.6729235053062439, | |
| 0.5623210668563843, | |
| 0.5150139331817627, | |
| 0.8085805177688599, | |
| 0.7596898674964905, | |
| 0.5972597002983093, | |
| 0.9820079803466797, | |
| 0.9745085835456848, | |
| 0.5273155570030212, | |
| 0.5324531197547913, | |
| 0.5789834260940552, | |
| 0.7247386574745178, | |
| 0.7544905543327332, | |
| 0.5884762406349182, | |
| 0.4842914938926697, | |
| 0.8123393058776855, | |
| 0.7054367661476135, | |
| 0.09308263659477234, | |
| 0.08973666280508041, | |
| 0.09202855080366135, | |
| 0.7089231014251709, | |
| 0.9720393419265747, | |
| 0.9964279532432556, | |
| 0.49923038482666016, | |
| 0.6134451031684875, | |
| 0.5499404072761536, | |
| 6.11895881186264e-11, | |
| 1.4576943818678245e-11, | |
| 1.735799351476608e-11, | |
| 0.6023713946342468, | |
| 0.553157389163971, | |
| 0.5503317713737488, | |
| 0.9796992540359497, | |
| 0.9182886481285095, | |
| 0.8607842922210693, | |
| 0.6422979831695557, | |
| 0.6638745665550232, | |
| 0.6075322031974792, | |
| 0.7293029427528381, | |
| 0.9844130873680115, | |
| 0.993526816368103, | |
| 0.547633707523346, | |
| 0.6227739453315735, | |
| 0.9998313188552856, | |
| 0.9999940395355225, | |
| 0.9999951124191284, | |
| 0.9999775886535645, | |
| 0.5366966128349304, | |
| 0.5250415802001953, | |
| 0.5051754117012024, | |
| 0.48833295702934265, | |
| 0.5131838321685791, | |
| 0.5317294597625732, | |
| 0.29897043108940125, | |
| 0.3597976565361023, | |
| 0.32535555958747864, | |
| 0.4676964282989502, | |
| 0.526648998260498, | |
| 0.548362672328949, | |
| 0.6692071557044983, | |
| 0.35373201966285706, | |
| 0.3534887731075287, | |
| 0.6637941002845764, | |
| 0.47728481888771057, | |
| 0.9986295700073242, | |
| 0.46758249402046204, | |
| 0.5160676836967468, | |
| 0.5609508156776428, | |
| 0.9999833106994629, | |
| 0.9855866432189941, | |
| 0.9997468590736389, | |
| 0.9985565543174744, | |
| 0.7168160080909729, | |
| 0.7617760300636292, | |
| 0.7155187726020813, | |
| 0.4970121681690216, | |
| 0.8666588664054871, | |
| 0.6338189840316772, | |
| 0.5993514060974121, | |
| 0.9967523813247681, | |
| 0.9662074446678162, | |
| 0.9995986819267273, | |
| 0.5130647420883179, | |
| 0.7217807173728943, | |
| 0.4925132691860199, | |
| 0.5792981386184692, | |
| 0.5104650259017944, | |
| 0.5129127502441406, | |
| 0.5114725828170776, | |
| 0.8539605140686035, | |
| 0.19493471086025238, | |
| 0.22762958705425262, | |
| 0.5150301456451416 | |
| ], | |
| "eval_code_runtime": 105.5057, | |
| "eval_code_samples_per_second": 0.948, | |
| "eval_code_steps_per_second": 0.038, | |
| "epoch": 3.95, | |
| "step": 150 | |
| }, | |
| { | |
| "train_runtime": 14494.0652, | |
| "train_samples_per_second": 0.331, | |
| "train_steps_per_second": 0.01, | |
| "total_flos": 0.0, | |
| "train_loss": 0.03708522860984015, | |
| "epoch": 3.95, | |
| "step": 150 | |
| } | |
| ] |