| { | |
| "step": [ | |
| 50, | |
| 100, | |
| 150, | |
| 200, | |
| 250, | |
| 300, | |
| 350, | |
| 400, | |
| 450, | |
| 500, | |
| 550, | |
| 600, | |
| 650, | |
| 700, | |
| 750, | |
| 800, | |
| 850, | |
| 900 | |
| ], | |
| "train_loss": [ | |
| 1.229721450805664, | |
| 1.1041190230846405, | |
| 1.025876224040985, | |
| 1.0216933679580689, | |
| 0.9389291417598724, | |
| 0.9820241594314575, | |
| 0.971408588886261, | |
| 0.9302374482154846, | |
| 0.9171168172359466, | |
| 0.921946108341217, | |
| 0.9294362807273865, | |
| 0.9058246970176697, | |
| 0.8852759146690369, | |
| 0.9285594654083252, | |
| 0.9111053240299225, | |
| 0.8563614284992218, | |
| 0.8970540463924408, | |
| 0.882376617193222 | |
| ], | |
| "val_nll": [ | |
| 1.245873212814331, | |
| 1.1079651455084483, | |
| 1.0574054757754008, | |
| 1.024699628353119, | |
| 1.0064872364203135, | |
| 0.9878634532292684, | |
| 0.9754222611586253, | |
| 0.9647026916344961, | |
| 0.9550074140230814, | |
| 0.9492202738920847, | |
| 0.9425136148929596, | |
| 0.93640163342158, | |
| 0.9316958208878835, | |
| 0.9284021159013113, | |
| 0.9264170686403911, | |
| 0.9249595264593761, | |
| 0.9239107569058737, | |
| 0.9228900790214538 | |
| ], | |
| "val_ppl": [ | |
| 3.475968734949889, | |
| 3.0281901944508567, | |
| 2.8788919363026415, | |
| 2.786258421829991, | |
| 2.735973287632187, | |
| 2.685490662172586, | |
| 2.652286932311601, | |
| 2.6240074011406005, | |
| 2.598689849594626, | |
| 2.58369429980331, | |
| 2.5664243198423558, | |
| 2.55078622052022, | |
| 2.5388108976642356, | |
| 2.530462559579264, | |
| 2.525444454042619, | |
| 2.521766193486182, | |
| 2.519122828264174, | |
| 2.516552927049002 | |
| ], | |
| "lr": [ | |
| 0.00019998312416333227, | |
| 0.0001979649067087574, | |
| 0.00019264940672148018, | |
| 0.00018421553219875658, | |
| 0.0001729471487418621, | |
| 0.00015922352526649803, | |
| 0.00014350656864820733, | |
| 0.00012632527695645993, | |
| 0.00010825793454723325, | |
| 8.991264828797319e-05, | |
| 7.190688002264308e-05, | |
| 5.484666416891109e-05, | |
| 3.9306209937284346e-05, | |
| 2.5808574716471856e-05, | |
| 1.4808059116167305e-05, | |
| 1e-05, | |
| 1e-05, | |
| 1e-05 | |
| ], | |
| "grad_norm": [ | |
| 0.3591911792755127, | |
| 0.36388659477233887, | |
| 0.37539058923721313, | |
| 0.3457748591899872, | |
| 0.29278653860092163, | |
| 0.3325034976005554, | |
| 0.31695958971977234, | |
| 0.31593164801597595, | |
| 0.31353333592414856, | |
| 0.3333532512187958, | |
| 0.3345634937286377, | |
| 0.31411102414131165, | |
| 0.29149293899536133, | |
| 0.3208323121070862, | |
| 0.2993287742137909, | |
| 0.30689114332199097, | |
| 0.3200317621231079, | |
| 0.30858248472213745 | |
| ], | |
| "tok_per_sec": [ | |
| 6706.525285452902, | |
| 6700.058062558346, | |
| 6697.280101536737, | |
| 6680.071604788786, | |
| 6683.553221953783, | |
| 6685.66879995729, | |
| 6679.849924100408, | |
| 6681.899978577697, | |
| 6684.255805925504, | |
| 6681.92172154577, | |
| 6684.531310449166, | |
| 6686.6788334140565, | |
| 6684.5712078021825, | |
| 6686.219542291029, | |
| 6687.095210911167, | |
| 6685.0861424049535, | |
| 6686.302034296362, | |
| 6687.162565026619 | |
| ], | |
| "vram_gb": [ | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224, | |
| 31.77780224 | |
| ], | |
| "elapsed_hr": [ | |
| 0.13572188032997978, | |
| 0.27170577141973706, | |
| 0.40772770815425446, | |
| 0.5450374044312372, | |
| 0.6809418523311614, | |
| 0.8168716543912887, | |
| 0.9538471115297741, | |
| 1.089776530795627, | |
| 1.2255665010213852, | |
| 1.3622162308295567, | |
| 1.4978528754578697, | |
| 1.633496529261271, | |
| 1.7701791963974636, | |
| 1.9058768606848187, | |
| 2.041743522816234, | |
| 2.1785142697228324, | |
| 2.314250492784712, | |
| 2.4500675496790145 | |
| ] | |
| } |