{"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 12000, "epoch": 0, "val_loss": 3.9863175749778748, "val_ppl": 53.85620233572836, "is_best": false, "timestamp": "2026-05-04T20:59:59.504631"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 12500, "epoch": 0, "val_loss": 3.9993658542633055, "val_ppl": 54.5635378248214, "is_best": false, "timestamp": "2026-05-04T21:03:40.210750"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 13000, "epoch": 0, "val_loss": 3.8980185985565186, "val_ppl": 49.30465993335737, "is_best": false, "timestamp": "2026-05-04T21:07:20.539646"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 13500, "epoch": 0, "val_loss": 4.0108379364013675, "val_ppl": 55.193099499479665, "is_best": false, "timestamp": "2026-05-04T21:11:00.351397"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 14000, "epoch": 0, "val_loss": 3.996466362476349, "val_ppl": 54.4055604327834, "is_best": false, "timestamp": "2026-05-04T21:14:41.071787"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 14500, "epoch": 0, "val_loss": 3.812811541557312, "val_ppl": 45.277559820706834, "is_best": true, "timestamp": "2026-05-04T21:18:21.800499"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 15000, "epoch": 0, "val_loss": 3.832418644428253, "val_ppl": 46.17408197361166, "is_best": false, "timestamp": "2026-05-04T21:21:59.680798"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 15500, "epoch": 0, "val_loss": 3.8438140153884888, "val_ppl": 46.70326214225701, "is_best": false, "timestamp": "2026-05-04T21:25:35.963292"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 16000, "epoch": 0, "val_loss": 3.849898660182953, "val_ppl": 46.98830120444446, "is_best": false, "timestamp": "2026-05-04T21:29:11.938730"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 16500, "epoch": 0, "val_loss": 3.909795415401459, "val_ppl": 49.88874446053632, "is_best": false, "timestamp": "2026-05-04T21:32:49.678245"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 17000, "epoch": 0, "val_loss": 3.8968958020210267, "val_ppl": 49.24933189887585, "is_best": false, "timestamp": "2026-05-04T21:36:27.607090"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 17500, "epoch": 0, "val_loss": 4.013467276096344, "val_ppl": 55.33841186094534, "is_best": false, "timestamp": "2026-05-04T21:40:03.896723"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 18000, "epoch": 0, "val_loss": 3.816865837574005, "val_ppl": 45.46150107532316, "is_best": false, "timestamp": "2026-05-04T21:43:39.397578"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 18500, "epoch": 0, "val_loss": 3.7777989864349366, "val_ppl": 43.71970808806943, "is_best": true, "timestamp": "2026-05-04T21:47:16.012613"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 19000, "epoch": 0, "val_loss": 3.772597849369049, "val_ppl": 43.49290621891045, "is_best": true, "timestamp": "2026-05-04T21:50:52.340681"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 19500, "epoch": 0, "val_loss": 3.804729461669922, "val_ppl": 44.91309775478298, "is_best": false, "timestamp": "2026-05-04T21:54:29.858721"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 20000, "epoch": 0, "val_loss": 3.7609264254570007, "val_ppl": 42.988232930167364, "is_best": true, "timestamp": "2026-05-04T21:58:05.590810"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 20500, "epoch": 0, "val_loss": 3.844603657722473, "val_ppl": 46.74015557957265, "is_best": false, "timestamp": "2026-05-04T22:01:41.893882"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 21000, "epoch": 0, "val_loss": 3.8787616729736327, "val_ppl": 48.36428716991975, "is_best": false, "timestamp": "2026-05-04T22:05:18.243747"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 21500, "epoch": 0, "val_loss": 3.85902978181839, "val_ppl": 47.41932195485685, "is_best": false, "timestamp": "2026-05-04T22:08:54.100097"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 22000, "epoch": 0, "val_loss": 3.7951119422912596, "val_ppl": 44.48321567991365, "is_best": false, "timestamp": "2026-05-04T22:12:34.826759"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 22500, "epoch": 0, "val_loss": 3.793329083919525, "val_ppl": 44.403979061259854, "is_best": false, "timestamp": "2026-05-04T22:16:16.250257"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 23000, "epoch": 0, "val_loss": 3.802736735343933, "val_ppl": 44.823687357318825, "is_best": false, "timestamp": "2026-05-04T22:19:56.618702"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 23500, "epoch": 0, "val_loss": 3.743816339969635, "val_ppl": 42.258957364917784, "is_best": true, "timestamp": "2026-05-04T22:23:37.079401"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 24000, "epoch": 0, "val_loss": 3.8505793809890747, "val_ppl": 47.02029800792802, "is_best": false, "timestamp": "2026-05-04T22:27:13.809411"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 24500, "epoch": 0, "val_loss": 3.6836650729179383, "val_ppl": 39.79196760363053, "is_best": true, "timestamp": "2026-05-04T22:30:49.533366"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 25000, "epoch": 0, "val_loss": 3.790373718738556, "val_ppl": 44.272942813003034, "is_best": false, "timestamp": "2026-05-04T22:34:25.781566"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 25500, "epoch": 0, "val_loss": 3.772153317928314, "val_ppl": 43.47357655128801, "is_best": false, "timestamp": "2026-05-04T22:38:00.959868"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 26000, "epoch": 0, "val_loss": 3.8301936626434325, "val_ppl": 46.07145969098069, "is_best": false, "timestamp": "2026-05-04T22:41:35.514732"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 26500, "epoch": 0, "val_loss": 3.786704921722412, "val_ppl": 44.11081196695457, "is_best": false, "timestamp": "2026-05-04T22:45:11.828341"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 27000, "epoch": 0, "val_loss": 3.7141265153884886, "val_ppl": 41.02273869918982, "is_best": false, "timestamp": "2026-05-04T22:48:48.977554"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 27500, "epoch": 0, "val_loss": 3.8283850073814394, "val_ppl": 45.98820761283225, "is_best": false, "timestamp": "2026-05-04T22:52:23.338057"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 28000, "epoch": 0, "val_loss": 3.715892422199249, "val_ppl": 41.09524503372762, "is_best": false, "timestamp": "2026-05-04T22:55:57.343896"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 28500, "epoch": 0, "val_loss": 3.7689138054847717, "val_ppl": 43.33297122839589, "is_best": false, "timestamp": "2026-05-04T22:59:35.084593"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 29000, "epoch": 0, "val_loss": 3.803325188159943, "val_ppl": 44.85007174459031, "is_best": false, "timestamp": "2026-05-04T23:03:12.043553"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 29500, "epoch": 0, "val_loss": 3.666334068775177, "val_ppl": 39.10827450516796, "is_best": true, "timestamp": "2026-05-04T23:06:47.310567"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 30000, "epoch": 0, "val_loss": 3.7948907256126403, "val_ppl": 44.473376339039916, "is_best": false, "timestamp": "2026-05-04T23:10:23.410240"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 30500, "epoch": 0, "val_loss": 3.812023639678955, "val_ppl": 45.241899596500296, "is_best": false, "timestamp": "2026-05-04T23:13:58.332153"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 31000, "epoch": 0, "val_loss": 3.675893270969391, "val_ppl": 39.483910940532915, "is_best": false, "timestamp": "2026-05-04T23:17:34.037102"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 31500, "epoch": 0, "val_loss": 3.738007938861847, "val_ppl": 42.01421186824429, "is_best": false, "timestamp": "2026-05-04T23:21:09.271499"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 32000, "epoch": 0, "val_loss": 3.8809256076812746, "val_ppl": 48.469057646889524, "is_best": false, "timestamp": "2026-05-04T23:24:45.122386"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 32500, "epoch": 0, "val_loss": 3.8831029653549196, "val_ppl": 48.57470709807361, "is_best": false, "timestamp": "2026-05-04T23:28:19.588133"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 33000, "epoch": 0, "val_loss": 3.782689297199249, "val_ppl": 43.93403468183204, "is_best": false, "timestamp": "2026-05-04T23:31:54.513127"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 33500, "epoch": 0, "val_loss": 3.7974807739257814, "val_ppl": 44.588713832770054, "is_best": false, "timestamp": "2026-05-04T23:35:31.287826"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 34000, "epoch": 0, "val_loss": 3.755391275882721, "val_ppl": 42.75094395179436, "is_best": false, "timestamp": "2026-05-04T23:39:06.900594"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 34500, "epoch": 0, "val_loss": 3.6980305790901182, "val_ppl": 40.36772498147992, "is_best": false, "timestamp": "2026-05-04T23:42:45.306237"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 35000, "epoch": 0, "val_loss": 3.748930037021637, "val_ppl": 42.47561034735333, "is_best": false, "timestamp": "2026-05-04T23:46:22.382235"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 35500, "epoch": 0, "val_loss": 3.8731701374053955, "val_ppl": 48.094611192011875, "is_best": false, "timestamp": "2026-05-04T23:50:00.736529"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 36000, "epoch": 0, "val_loss": 3.8187678933143614, "val_ppl": 45.54805367224632, "is_best": false, "timestamp": "2026-05-04T23:53:38.469138"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 36500, "epoch": 0, "val_loss": 3.642268753051758, "val_ppl": 38.17835580431779, "is_best": true, "timestamp": "2026-05-04T23:57:14.388749"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 37000, "epoch": 0, "val_loss": 3.6575311541557314, "val_ppl": 38.76551854290175, "is_best": false, "timestamp": "2026-05-05T00:00:51.741991"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 37500, "epoch": 0, "val_loss": 3.639414060115814, "val_ppl": 38.069523736673105, "is_best": true, "timestamp": "2026-05-05T00:04:27.830597"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 38000, "epoch": 0, "val_loss": 3.7348302245140075, "val_ppl": 41.88091460685559, "is_best": false, "timestamp": "2026-05-05T00:08:03.818764"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 38500, "epoch": 0, "val_loss": 3.76340229511261, "val_ppl": 43.09479805787405, "is_best": false, "timestamp": "2026-05-05T00:11:38.899989"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 39000, "epoch": 0, "val_loss": 3.663316512107849, "val_ppl": 38.99044094482259, "is_best": false, "timestamp": "2026-05-05T00:15:13.596636"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 39500, "epoch": 0, "val_loss": 3.6712753891944887, "val_ppl": 39.30199925439836, "is_best": false, "timestamp": "2026-05-05T00:18:48.089176"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 40000, "epoch": 0, "val_loss": 3.722728192806244, "val_ppl": 41.37712503770513, "is_best": false, "timestamp": "2026-05-05T00:22:22.673948"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 40500, "epoch": 0, "val_loss": 3.770984923839569, "val_ppl": 43.42281194373766, "is_best": false, "timestamp": "2026-05-05T00:25:57.668102"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 41000, "epoch": 0, "val_loss": 3.552431809902191, "val_ppl": 34.898079879036295, "is_best": true, "timestamp": "2026-05-05T00:29:32.958417"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 41500, "epoch": 0, "val_loss": 3.747627294063568, "val_ppl": 42.420311572948926, "is_best": false, "timestamp": "2026-05-05T00:33:08.355133"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 42000, "epoch": 0, "val_loss": 3.6810667157173156, "val_ppl": 39.68870806875473, "is_best": false, "timestamp": "2026-05-05T00:36:42.580968"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 42500, "epoch": 0, "val_loss": 3.7633370995521545, "val_ppl": 43.09198855994634, "is_best": false, "timestamp": "2026-05-05T00:40:17.011458"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 43000, "epoch": 0, "val_loss": 3.615912067890167, "val_ppl": 37.185245932545655, "is_best": false, "timestamp": "2026-05-05T00:43:51.844020"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 43500, "epoch": 0, "val_loss": 3.6781845092773438, "val_ppl": 39.57448170981275, "is_best": false, "timestamp": "2026-05-05T00:47:26.919631"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 44000, "epoch": 0, "val_loss": 3.6713991284370424, "val_ppl": 39.30686275491367, "is_best": false, "timestamp": "2026-05-05T00:51:04.835836"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 44500, "epoch": 0, "val_loss": 3.699683153629303, "val_ppl": 40.43449080854727, "is_best": false, "timestamp": "2026-05-05T00:54:40.453262"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 45000, "epoch": 0, "val_loss": 3.7241574883461, "val_ppl": 41.43630746248623, "is_best": false, "timestamp": "2026-05-05T00:58:17.458978"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 45500, "epoch": 0, "val_loss": 3.7611931204795837, "val_ppl": 42.99969920685097, "is_best": false, "timestamp": "2026-05-05T01:01:54.445349"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 46000, "epoch": 0, "val_loss": 3.7802424907684324, "val_ppl": 43.82666800953869, "is_best": false, "timestamp": "2026-05-05T01:05:28.095918"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 46500, "epoch": 0, "val_loss": 3.654506039619446, "val_ppl": 38.648425608316444, "is_best": false, "timestamp": "2026-05-05T01:09:01.956376"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 47000, "epoch": 0, "val_loss": 3.791075897216797, "val_ppl": 44.304041237659206, "is_best": false, "timestamp": "2026-05-05T01:12:35.113869"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 47500, "epoch": 0, "val_loss": 3.765990149974823, "val_ppl": 43.206465567898896, "is_best": false, "timestamp": "2026-05-05T01:16:07.821939"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 48000, "epoch": 0, "val_loss": 3.6301537990570067, "val_ppl": 37.71861725886971, "is_best": false, "timestamp": "2026-05-05T01:19:41.674618"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 48500, "epoch": 0, "val_loss": 3.85994348526001, "val_ppl": 47.46266895266112, "is_best": false, "timestamp": "2026-05-05T01:23:14.931355"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 49000, "epoch": 0, "val_loss": 3.7905235290527344, "val_ppl": 44.279575853311975, "is_best": false, "timestamp": "2026-05-05T01:26:48.890788"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 49500, "epoch": 0, "val_loss": 3.7553041696548464, "val_ppl": 42.74722024051022, "is_best": false, "timestamp": "2026-05-05T01:30:22.140454"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 50000, "epoch": 0, "val_loss": 3.718538928031921, "val_ppl": 41.204147881852954, "is_best": false, "timestamp": "2026-05-05T01:33:56.237159"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 50500, "epoch": 0, "val_loss": 3.7871594190597535, "val_ppl": 44.13086477016917, "is_best": false, "timestamp": "2026-05-05T01:37:29.804904"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 51000, "epoch": 0, "val_loss": 3.6975579500198363, "val_ppl": 40.34865052907795, "is_best": false, "timestamp": "2026-05-05T01:41:03.626884"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 51500, "epoch": 0, "val_loss": 3.7123099088668825, "val_ppl": 40.948284172299644, "is_best": false, "timestamp": "2026-05-05T01:44:36.590819"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 52000, "epoch": 0, "val_loss": 3.6105751514434816, "val_ppl": 36.98732000880116, "is_best": false, "timestamp": "2026-05-05T01:48:10.949076"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 52500, "epoch": 0, "val_loss": 3.748972177505493, "val_ppl": 42.47740032784051, "is_best": false, "timestamp": "2026-05-05T01:51:44.887522"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 53000, "epoch": 0, "val_loss": 3.536519932746887, "val_ppl": 34.347180464321134, "is_best": true, "timestamp": "2026-05-05T01:55:19.914524"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 53500, "epoch": 0, "val_loss": 3.7042893409729003, "val_ppl": 40.62116925624361, "is_best": false, "timestamp": "2026-05-05T01:58:56.094996"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 54000, "epoch": 0, "val_loss": 3.528304159641266, "val_ppl": 34.06614785367218, "is_best": true, "timestamp": "2026-05-05T02:02:36.543228"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 54500, "epoch": 0, "val_loss": 3.688965547084808, "val_ppl": 40.00344386707912, "is_best": false, "timestamp": "2026-05-05T02:06:13.936633"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 55000, "epoch": 0, "val_loss": 3.687112832069397, "val_ppl": 39.92939750054665, "is_best": false, "timestamp": "2026-05-05T02:09:49.921760"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 55500, "epoch": 0, "val_loss": 3.707573747634888, "val_ppl": 40.75480503215183, "is_best": false, "timestamp": "2026-05-05T02:13:25.278363"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 56000, "epoch": 0, "val_loss": 3.724093532562256, "val_ppl": 41.4336574557054, "is_best": false, "timestamp": "2026-05-05T02:17:00.358077"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 56500, "epoch": 0, "val_loss": 3.6532342433929443, "val_ppl": 38.59930392947151, "is_best": false, "timestamp": "2026-05-05T02:20:34.406624"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 57000, "epoch": 0, "val_loss": 3.6039551854133607, "val_ppl": 36.743273886571934, "is_best": false, "timestamp": "2026-05-05T02:24:08.529184"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 57500, "epoch": 0, "val_loss": 3.690984618663788, "val_ppl": 40.08429527857909, "is_best": false, "timestamp": "2026-05-05T02:27:42.348235"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 58000, "epoch": 0, "val_loss": 3.7980252385139464, "val_ppl": 44.61299741866023, "is_best": false, "timestamp": "2026-05-05T02:31:15.494315"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 58500, "epoch": 0, "val_loss": 3.7596939325332643, "val_ppl": 42.935282874264374, "is_best": false, "timestamp": "2026-05-05T02:34:49.636452"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 59000, "epoch": 0, "val_loss": 3.7567172765731813, "val_ppl": 42.80766933362843, "is_best": false, "timestamp": "2026-05-05T02:38:23.899072"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 59500, "epoch": 0, "val_loss": 3.6661568880081177, "val_ppl": 39.101345884920015, "is_best": false, "timestamp": "2026-05-05T02:41:58.314158"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 60000, "epoch": 0, "val_loss": 3.829219877719879, "val_ppl": 46.02661783483271, "is_best": false, "timestamp": "2026-05-05T02:45:33.015118"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 60500, "epoch": 0, "val_loss": 3.6592538833618162, "val_ppl": 38.8323585910055, "is_best": false, "timestamp": "2026-05-05T02:49:07.008367"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 61000, "epoch": 0, "val_loss": 3.6369224905967714, "val_ppl": 37.974788939901174, "is_best": false, "timestamp": "2026-05-05T02:52:41.826436"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 61500, "epoch": 0, "val_loss": 3.640268337726593, "val_ppl": 38.10205957379428, "is_best": false, "timestamp": "2026-05-05T02:56:17.487129"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 62000, "epoch": 0, "val_loss": 3.7314751744270325, "val_ppl": 41.740637490620905, "is_best": false, "timestamp": "2026-05-05T02:59:52.254509"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 62500, "epoch": 0, "val_loss": 3.607824993133545, "val_ppl": 36.88573876958596, "is_best": false, "timestamp": "2026-05-05T03:03:27.488521"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 63000, "epoch": 0, "val_loss": 3.497276210784912, "val_ppl": 33.02537517856575, "is_best": true, "timestamp": "2026-05-05T03:07:01.428002"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 63500, "epoch": 0, "val_loss": 3.751301980018616, "val_ppl": 42.57647965469087, "is_best": false, "timestamp": "2026-05-05T03:10:39.967541"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 64000, "epoch": 0, "val_loss": 3.785206985473633, "val_ppl": 44.04478624625217, "is_best": false, "timestamp": "2026-05-05T03:14:09.552152"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 64500, "epoch": 0, "val_loss": 3.6670176506042482, "val_ppl": 39.13501735040617, "is_best": false, "timestamp": "2026-05-05T03:17:40.120467"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 65000, "epoch": 0, "val_loss": 3.6048176407814028, "val_ppl": 36.774976989665426, "is_best": false, "timestamp": "2026-05-05T03:21:09.621984"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 65500, "epoch": 0, "val_loss": 3.68316490650177, "val_ppl": 39.77206997427974, "is_best": false, "timestamp": "2026-05-05T03:24:39.232220"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 66000, "epoch": 0, "val_loss": 3.6640037536621093, "val_ppl": 39.017246005779675, "is_best": false, "timestamp": "2026-05-05T03:28:09.790645"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 66500, "epoch": 0, "val_loss": 3.5959048748016356, "val_ppl": 36.44866655023838, "is_best": false, "timestamp": "2026-05-05T03:31:40.643166"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 67000, "epoch": 0, "val_loss": 3.7562708497047423, "val_ppl": 42.78856310494689, "is_best": false, "timestamp": "2026-05-05T03:35:11.086634"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 67500, "epoch": 0, "val_loss": 3.5145472645759583, "val_ppl": 33.600712247137416, "is_best": false, "timestamp": "2026-05-05T03:38:41.101123"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 68000, "epoch": 0, "val_loss": 3.6910828351974487, "val_ppl": 40.08823241245824, "is_best": false, "timestamp": "2026-05-05T03:42:10.953259"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 68500, "epoch": 0, "val_loss": 3.8013942003250123, "val_ppl": 44.7635503644065, "is_best": false, "timestamp": "2026-05-05T03:45:40.080018"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 69000, "epoch": 0, "val_loss": 3.658419907093048, "val_ppl": 38.79998682599847, "is_best": false, "timestamp": "2026-05-05T03:49:08.561564"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 69500, "epoch": 0, "val_loss": 3.8823310852050783, "val_ppl": 48.53722771253796, "is_best": false, "timestamp": "2026-05-05T03:52:37.799746"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 70000, "epoch": 0, "val_loss": 3.713327670097351, "val_ppl": 40.989980963473904, "is_best": false, "timestamp": "2026-05-05T03:56:07.108614"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 70500, "epoch": 0, "val_loss": 3.6645475745201113, "val_ppl": 39.03847016852754, "is_best": false, "timestamp": "2026-05-05T03:59:35.499171"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 71000, "epoch": 0, "val_loss": 3.6358020663261414, "val_ppl": 37.93226489163729, "is_best": false, "timestamp": "2026-05-05T04:03:04.490368"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 71500, "epoch": 0, "val_loss": 3.714549744129181, "val_ppl": 41.04010437579673, "is_best": false, "timestamp": "2026-05-05T04:06:33.754519"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 72000, "epoch": 0, "val_loss": 3.724819552898407, "val_ppl": 41.463750056217506, "is_best": false, "timestamp": "2026-05-05T04:10:02.950489"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 72500, "epoch": 0, "val_loss": 3.706956958770752, "val_ppl": 40.72967567279914, "is_best": false, "timestamp": "2026-05-05T04:13:32.753044"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 73000, "epoch": 0, "val_loss": 3.720665693283081, "val_ppl": 41.291872683735996, "is_best": false, "timestamp": "2026-05-05T04:17:02.264757"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 73500, "epoch": 0, "val_loss": 3.7619191646575927, "val_ppl": 43.03093022429351, "is_best": false, "timestamp": "2026-05-05T04:20:31.644524"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 74000, "epoch": 0, "val_loss": 3.7080879330635073, "val_ppl": 40.77576594748239, "is_best": false, "timestamp": "2026-05-05T04:24:01.396289"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 74500, "epoch": 0, "val_loss": 3.668335270881653, "val_ppl": 39.18661642935482, "is_best": false, "timestamp": "2026-05-05T04:27:30.551942"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 75000, "epoch": 0, "val_loss": 3.646988558769226, "val_ppl": 38.35897613746714, "is_best": false, "timestamp": "2026-05-05T04:30:59.989095"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 75500, "epoch": 0, "val_loss": 3.7617430686950684, "val_ppl": 43.023353318368194, "is_best": false, "timestamp": "2026-05-05T04:34:29.068254"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 76000, "epoch": 0, "val_loss": 3.541844880580902, "val_ppl": 34.53056523237709, "is_best": false, "timestamp": "2026-05-05T04:37:59.028500"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 76500, "epoch": 0, "val_loss": 3.680254328250885, "val_ppl": 39.656478552960735, "is_best": false, "timestamp": "2026-05-05T04:41:28.477721"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 77000, "epoch": 0, "val_loss": 3.645061802864075, "val_ppl": 38.285138909678764, "is_best": false, "timestamp": "2026-05-05T04:44:57.542724"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 77500, "epoch": 0, "val_loss": 3.615162217617035, "val_ppl": 37.157373017289224, "is_best": false, "timestamp": "2026-05-05T04:48:26.395231"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 78000, "epoch": 0, "val_loss": 3.667114770412445, "val_ppl": 39.138818320356776, "is_best": false, "timestamp": "2026-05-05T04:51:55.154634"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 78500, "epoch": 0, "val_loss": 3.6738196134567263, "val_ppl": 39.40211966483728, "is_best": false, "timestamp": "2026-05-05T04:55:24.168296"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 79000, "epoch": 0, "val_loss": 3.5766518473625184, "val_ppl": 35.75363160589735, "is_best": false, "timestamp": "2026-05-05T04:58:53.097006"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 79500, "epoch": 0, "val_loss": 3.6736133217811586, "val_ppl": 39.393992173896386, "is_best": false, "timestamp": "2026-05-05T05:02:22.534742"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 80000, "epoch": 0, "val_loss": 3.7694395780563354, "val_ppl": 43.355760506575855, "is_best": false, "timestamp": "2026-05-05T05:05:51.139952"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 80500, "epoch": 0, "val_loss": 3.673647201061249, "val_ppl": 39.3953268365997, "is_best": false, "timestamp": "2026-05-05T05:09:20.334475"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 81000, "epoch": 0, "val_loss": 3.5661979794502257, "val_ppl": 35.38181471216213, "is_best": false, "timestamp": "2026-05-05T05:12:50.088072"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 81500, "epoch": 0, "val_loss": 3.662993311882019, "val_ppl": 38.9778412617239, "is_best": false, "timestamp": "2026-05-05T05:16:17.663732"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 82000, "epoch": 0, "val_loss": 4.2208603620529175, "val_ppl": 68.09204290482313, "is_best": false, "timestamp": "2026-05-05T05:19:45.079006"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 82500, "epoch": 0, "val_loss": 3.5309290766716, "val_ppl": 34.155686129192006, "is_best": false, "timestamp": "2026-05-05T05:23:12.931143"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 83000, "epoch": 0, "val_loss": 3.5450966119766236, "val_ppl": 34.64303211239782, "is_best": false, "timestamp": "2026-05-05T05:26:40.835777"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 83500, "epoch": 0, "val_loss": 3.542018008232117, "val_ppl": 34.53654394555625, "is_best": false, "timestamp": "2026-05-05T05:30:09.353422"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 84000, "epoch": 0, "val_loss": 3.658814322948456, "val_ppl": 38.81529317432707, "is_best": false, "timestamp": "2026-05-05T05:33:37.801618"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 84500, "epoch": 0, "val_loss": 3.653587245941162, "val_ppl": 38.6129319873461, "is_best": false, "timestamp": "2026-05-05T05:37:07.033376"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 85000, "epoch": 0, "val_loss": 3.6783868193626406, "val_ppl": 39.58248883651697, "is_best": false, "timestamp": "2026-05-05T05:40:34.896439"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 85500, "epoch": 0, "val_loss": 3.6223838329315186, "val_ppl": 37.42668051850112, "is_best": false, "timestamp": "2026-05-05T05:44:04.198255"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 86000, "epoch": 0, "val_loss": 3.662233901023865, "val_ppl": 38.94825230235286, "is_best": false, "timestamp": "2026-05-05T05:47:32.314224"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 86500, "epoch": 0, "val_loss": 3.6114082098007203, "val_ppl": 37.01814544275634, "is_best": false, "timestamp": "2026-05-05T05:51:01.125909"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 87000, "epoch": 0, "val_loss": 3.571852457523346, "val_ppl": 35.582447108813014, "is_best": false, "timestamp": "2026-05-05T05:54:29.829229"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 87500, "epoch": 0, "val_loss": 3.487281250953674, "val_ppl": 32.69693200268292, "is_best": true, "timestamp": "2026-05-05T05:57:59.390664"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 88000, "epoch": 0, "val_loss": 3.5826083183288575, "val_ppl": 35.96723259701156, "is_best": false, "timestamp": "2026-05-05T06:01:29.039685"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 88500, "epoch": 0, "val_loss": 3.3613099455833435, "val_ppl": 28.826927863984967, "is_best": true, "timestamp": "2026-05-05T06:04:58.135293"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 89000, "epoch": 0, "val_loss": 3.720856249332428, "val_ppl": 41.29974184959951, "is_best": false, "timestamp": "2026-05-05T06:08:27.479708"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 89500, "epoch": 0, "val_loss": 3.411408472061157, "val_ppl": 30.307902044460747, "is_best": false, "timestamp": "2026-05-05T06:11:56.256241"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 90000, "epoch": 0, "val_loss": 3.502420389652252, "val_ppl": 33.19570133414478, "is_best": false, "timestamp": "2026-05-05T06:15:23.843460"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 90500, "epoch": 0, "val_loss": 3.470740056037903, "val_ppl": 32.16053423758203, "is_best": false, "timestamp": "2026-05-05T06:18:52.013161"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 91000, "epoch": 0, "val_loss": 3.6083788871765137, "val_ppl": 36.90617521985247, "is_best": false, "timestamp": "2026-05-05T06:22:20.694699"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 91500, "epoch": 0, "val_loss": 3.5298542261123655, "val_ppl": 34.11899359388364, "is_best": false, "timestamp": "2026-05-05T06:25:49.341306"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 92000, "epoch": 0, "val_loss": 3.536409044265747, "val_ppl": 34.34337196881105, "is_best": false, "timestamp": "2026-05-05T06:29:17.886483"} {"run_name": "c2", "stage": "pretraining", "event": "eval", "step": 92500, "epoch": 0, "val_loss": 3.567478024959564, "val_ppl": 35.42713404441251, "is_best": false, "timestamp": "2026-05-05T06:32:46.611475"}