{"run_name": "c2", "stage": "pretraining", "event": "model_summary", "total_params": 38227520, "trainable_params": 38227520, "weight_tied_lm_head": true, "timestamp": "2026-05-04T20:51:34.748590"} {"run_name": "c2", "stage": "pretraining", "event": "config", "model": {"vocab_size": 50304, "n_layers": 18, "n_heads": 5, "n_kv_heads": 1, "n_embd": 320, "embedding_dim": null, "tie_embeddings": true, "context_len": 1024, "dropout": 0.0, "bias": false, "norm_type": "rmsnorm", "norm_eps": 1e-05, "positional_embedding": "rope", "rope_theta": 10000.0, "rope_fraction": 1.0, "mlp_type": "swiglu", "mlp_hidden_mult": 4.0, "mlp_hidden_dim": 1024, "qk_norm": false, "block_style": "sequential"}, "training": {"seed": 0, "learning_rate": 0.0012, "min_lr": 0.00012, "weight_decay": 0.03, "beta1": 0.9, "beta2": 0.95, "grad_clip": 1.0, "max_iters": 11586, "warmup_steps": 116, "lr_schedule": "wsd", "wsd_stable_frac": 0.85, "batch_size": 4, "gradient_accumulation_steps": 16, "dtype": "float16", "device": "cuda", "eval_step_interval": 500, "eval_batches": 20, "log_interval": 10, "max_checkpoints": 5}, "distributed": {"enabled": false, "backend": "nccl"}, "timestamp": "2026-05-04T20:51:34.748853"} {"run_name": "c2", "stage": "pretraining", "event": "model_summary", "total_params": 38227520, "trainable_params": 38227520, "weight_tied_lm_head": true, "timestamp": "2026-05-04T20:55:51.114602"} {"run_name": "c2", "stage": "pretraining", "event": "config", "model": {"vocab_size": 50304, "n_layers": 18, "n_heads": 5, "n_kv_heads": 1, "n_embd": 320, "embedding_dim": null, "tie_embeddings": true, "context_len": 1024, "dropout": 0.0, "bias": false, "norm_type": "rmsnorm", "norm_eps": 1e-05, "positional_embedding": "rope", "rope_theta": 10000.0, "rope_fraction": 1.0, "mlp_type": "swiglu", "mlp_hidden_mult": 4.0, "mlp_hidden_dim": 1024, "qk_norm": false, "block_style": "sequential"}, "training": {"seed": 0, "learning_rate": 0.0012, "min_lr": 0.00012, "weight_decay": 0.03, "beta1": 0.9, "beta2": 0.95, "grad_clip": 1.0, "max_iters": 92685, "warmup_steps": 116, "lr_schedule": "wsd", "wsd_stable_frac": 0.85, "batch_size": 4, "gradient_accumulation_steps": 16, "dtype": "float16", "device": "cuda", "eval_step_interval": 500, "eval_batches": 20, "log_interval": 10, "max_checkpoints": 5}, "distributed": {"enabled": false, "backend": "nccl"}, "timestamp": "2026-05-04T20:55:51.114804"} {"run_name": "c2", "stage": "pretraining", "event": "resume", "checkpoint": "artifacts/c2/checkpoints/ckpt_step0011586.pt", "step": 11586, "best_val_loss": 3.8527660250663756, "timestamp": "2026-05-04T20:55:51.578050"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 12000, "path": "artifacts/c2/checkpoints/ckpt_step0012000.pt", "timestamp": "2026-05-04T21:00:00.110473"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 12500, "path": "artifacts/c2/checkpoints/ckpt_step0012500.pt", "timestamp": "2026-05-04T21:03:40.818712"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 13000, "path": "artifacts/c2/checkpoints/ckpt_step0013000.pt", "timestamp": "2026-05-04T21:07:21.158528"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 13500, "path": "artifacts/c2/checkpoints/ckpt_step0013500.pt", "timestamp": "2026-05-04T21:11:00.953139"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 14000, "path": "artifacts/c2/checkpoints/ckpt_step0014000.pt", "timestamp": "2026-05-04T21:14:41.734550"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 14500, "path": "artifacts/c2/checkpoints/ckpt_step0014500.pt", "timestamp": "2026-05-04T21:18:22.458649"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 14500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:18:23.064434"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 15000, "path": "artifacts/c2/checkpoints/ckpt_step0015000.pt", "timestamp": "2026-05-04T21:22:00.340468"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 15500, "path": "artifacts/c2/checkpoints/ckpt_step0015500.pt", "timestamp": "2026-05-04T21:25:36.621906"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 16000, "path": "artifacts/c2/checkpoints/ckpt_step0016000.pt", "timestamp": "2026-05-04T21:29:12.590050"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 16500, "path": "artifacts/c2/checkpoints/ckpt_step0016500.pt", "timestamp": "2026-05-04T21:32:50.330606"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 17000, "path": "artifacts/c2/checkpoints/ckpt_step0017000.pt", "timestamp": "2026-05-04T21:36:28.262577"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 17500, "path": "artifacts/c2/checkpoints/ckpt_step0017500.pt", "timestamp": "2026-05-04T21:40:04.551108"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 18000, "path": "artifacts/c2/checkpoints/ckpt_step0018000.pt", "timestamp": "2026-05-04T21:43:40.067927"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 18500, "path": "artifacts/c2/checkpoints/ckpt_step0018500.pt", "timestamp": "2026-05-04T21:47:16.668622"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 18500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:47:17.560815"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 19000, "path": "artifacts/c2/checkpoints/ckpt_step0019000.pt", "timestamp": "2026-05-04T21:50:52.991139"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 19000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:50:53.852840"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 19500, "path": "artifacts/c2/checkpoints/ckpt_step0019500.pt", "timestamp": "2026-05-04T21:54:30.514043"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 20000, "path": "artifacts/c2/checkpoints/ckpt_step0020000.pt", "timestamp": "2026-05-04T21:58:06.244586"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 20000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:58:07.169029"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 20500, "path": "artifacts/c2/checkpoints/ckpt_step0020500.pt", "timestamp": "2026-05-04T22:01:42.547664"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 21000, "path": "artifacts/c2/checkpoints/ckpt_step0021000.pt", "timestamp": "2026-05-04T22:05:18.903445"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 21500, "path": "artifacts/c2/checkpoints/ckpt_step0021500.pt", "timestamp": "2026-05-04T22:08:54.759245"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 22000, "path": "artifacts/c2/checkpoints/ckpt_step0022000.pt", "timestamp": "2026-05-04T22:12:35.490777"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 22500, "path": "artifacts/c2/checkpoints/ckpt_step0022500.pt", "timestamp": "2026-05-04T22:16:16.910153"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 23000, "path": "artifacts/c2/checkpoints/ckpt_step0023000.pt", "timestamp": "2026-05-04T22:19:57.275761"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 23500, "path": "artifacts/c2/checkpoints/ckpt_step0023500.pt", "timestamp": "2026-05-04T22:23:37.733214"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 23500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T22:23:38.692307"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 24000, "path": "artifacts/c2/checkpoints/ckpt_step0024000.pt", "timestamp": "2026-05-04T22:27:14.462120"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 24500, "path": "artifacts/c2/checkpoints/ckpt_step0024500.pt", "timestamp": "2026-05-04T22:30:50.186765"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 24500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T22:30:51.110454"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 25000, "path": "artifacts/c2/checkpoints/ckpt_step0025000.pt", "timestamp": "2026-05-04T22:34:26.435459"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 25500, "path": "artifacts/c2/checkpoints/ckpt_step0025500.pt", "timestamp": "2026-05-04T22:38:01.616826"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 26000, "path": "artifacts/c2/checkpoints/ckpt_step0026000.pt", "timestamp": "2026-05-04T22:41:36.171027"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 26500, "path": "artifacts/c2/checkpoints/ckpt_step0026500.pt", "timestamp": "2026-05-04T22:45:12.480833"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 27000, "path": "artifacts/c2/checkpoints/ckpt_step0027000.pt", "timestamp": "2026-05-04T22:48:49.630829"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 27500, "path": "artifacts/c2/checkpoints/ckpt_step0027500.pt", "timestamp": "2026-05-04T22:52:23.987911"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 28000, "path": "artifacts/c2/checkpoints/ckpt_step0028000.pt", "timestamp": "2026-05-04T22:55:57.996561"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 28500, "path": "artifacts/c2/checkpoints/ckpt_step0028500.pt", "timestamp": "2026-05-04T22:59:35.749865"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 29000, "path": "artifacts/c2/checkpoints/ckpt_step0029000.pt", "timestamp": "2026-05-04T23:03:12.706823"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 29500, "path": "artifacts/c2/checkpoints/ckpt_step0029500.pt", "timestamp": "2026-05-04T23:06:47.965913"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 29500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T23:06:48.838561"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 30000, "path": "artifacts/c2/checkpoints/ckpt_step0030000.pt", "timestamp": "2026-05-04T23:10:24.061996"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 30500, "path": "artifacts/c2/checkpoints/ckpt_step0030500.pt", "timestamp": "2026-05-04T23:13:58.988561"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 31000, "path": "artifacts/c2/checkpoints/ckpt_step0031000.pt", "timestamp": "2026-05-04T23:17:34.697407"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 31500, "path": "artifacts/c2/checkpoints/ckpt_step0031500.pt", "timestamp": "2026-05-04T23:21:09.933172"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 32000, "path": "artifacts/c2/checkpoints/ckpt_step0032000.pt", "timestamp": "2026-05-04T23:24:45.779797"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 32500, "path": "artifacts/c2/checkpoints/ckpt_step0032500.pt", "timestamp": "2026-05-04T23:28:20.241536"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 33000, "path": "artifacts/c2/checkpoints/ckpt_step0033000.pt", "timestamp": "2026-05-04T23:31:55.169163"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 33500, "path": "artifacts/c2/checkpoints/ckpt_step0033500.pt", "timestamp": "2026-05-04T23:35:31.951568"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 34000, "path": "artifacts/c2/checkpoints/ckpt_step0034000.pt", "timestamp": "2026-05-04T23:39:07.554608"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 34500, "path": "artifacts/c2/checkpoints/ckpt_step0034500.pt", "timestamp": "2026-05-04T23:42:45.963040"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 35000, "path": "artifacts/c2/checkpoints/ckpt_step0035000.pt", "timestamp": "2026-05-04T23:46:23.037806"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 35500, "path": "artifacts/c2/checkpoints/ckpt_step0035500.pt", "timestamp": "2026-05-04T23:50:01.391079"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 36000, "path": "artifacts/c2/checkpoints/ckpt_step0036000.pt", "timestamp": "2026-05-04T23:53:39.123535"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 36500, "path": "artifacts/c2/checkpoints/ckpt_step0036500.pt", "timestamp": "2026-05-04T23:57:15.042471"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 36500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T23:57:15.986028"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 37000, "path": "artifacts/c2/checkpoints/ckpt_step0037000.pt", "timestamp": "2026-05-05T00:00:52.397532"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 37500, "path": "artifacts/c2/checkpoints/ckpt_step0037500.pt", "timestamp": "2026-05-05T00:04:28.488179"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 37500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T00:04:29.328242"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 38000, "path": "artifacts/c2/checkpoints/ckpt_step0038000.pt", "timestamp": "2026-05-05T00:08:04.476478"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 38500, "path": "artifacts/c2/checkpoints/ckpt_step0038500.pt", "timestamp": "2026-05-05T00:11:39.556054"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 39000, "path": "artifacts/c2/checkpoints/ckpt_step0039000.pt", "timestamp": "2026-05-05T00:15:14.254304"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 39500, "path": "artifacts/c2/checkpoints/ckpt_step0039500.pt", "timestamp": "2026-05-05T00:18:48.741599"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 40000, "path": "artifacts/c2/checkpoints/ckpt_step0040000.pt", "timestamp": "2026-05-05T00:22:23.329858"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 40500, "path": "artifacts/c2/checkpoints/ckpt_step0040500.pt", "timestamp": "2026-05-05T00:25:58.324698"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 41000, "path": "artifacts/c2/checkpoints/ckpt_step0041000.pt", "timestamp": "2026-05-05T00:29:33.613999"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 41000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T00:29:34.493359"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 41500, "path": "artifacts/c2/checkpoints/ckpt_step0041500.pt", "timestamp": "2026-05-05T00:33:09.011262"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 42000, "path": "artifacts/c2/checkpoints/ckpt_step0042000.pt", "timestamp": "2026-05-05T00:36:43.234279"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 42500, "path": "artifacts/c2/checkpoints/ckpt_step0042500.pt", "timestamp": "2026-05-05T00:40:17.669807"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 43000, "path": "artifacts/c2/checkpoints/ckpt_step0043000.pt", "timestamp": "2026-05-05T00:43:52.501341"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 43500, "path": "artifacts/c2/checkpoints/ckpt_step0043500.pt", "timestamp": "2026-05-05T00:47:27.576226"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 44000, "path": "artifacts/c2/checkpoints/ckpt_step0044000.pt", "timestamp": "2026-05-05T00:51:05.492518"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 44500, "path": "artifacts/c2/checkpoints/ckpt_step0044500.pt", "timestamp": "2026-05-05T00:54:41.107238"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 45000, "path": "artifacts/c2/checkpoints/ckpt_step0045000.pt", "timestamp": "2026-05-05T00:58:18.115880"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 45500, "path": "artifacts/c2/checkpoints/ckpt_step0045500.pt", "timestamp": "2026-05-05T01:01:55.098593"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 46000, "path": "artifacts/c2/checkpoints/ckpt_step0046000.pt", "timestamp": "2026-05-05T01:05:28.750126"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 46500, "path": "artifacts/c2/checkpoints/ckpt_step0046500.pt", "timestamp": "2026-05-05T01:09:02.610840"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 47000, "path": "artifacts/c2/checkpoints/ckpt_step0047000.pt", "timestamp": "2026-05-05T01:12:35.776226"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 47500, "path": "artifacts/c2/checkpoints/ckpt_step0047500.pt", "timestamp": "2026-05-05T01:16:08.472641"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 48000, "path": "artifacts/c2/checkpoints/ckpt_step0048000.pt", "timestamp": "2026-05-05T01:19:42.326766"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 48500, "path": "artifacts/c2/checkpoints/ckpt_step0048500.pt", "timestamp": "2026-05-05T01:23:15.584520"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 49000, "path": "artifacts/c2/checkpoints/ckpt_step0049000.pt", "timestamp": "2026-05-05T01:26:49.541401"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 49500, "path": "artifacts/c2/checkpoints/ckpt_step0049500.pt", "timestamp": "2026-05-05T01:30:22.798284"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 50000, "path": "artifacts/c2/checkpoints/ckpt_step0050000.pt", "timestamp": "2026-05-05T01:33:56.893241"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 50500, "path": "artifacts/c2/checkpoints/ckpt_step0050500.pt", "timestamp": "2026-05-05T01:37:30.457284"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 51000, "path": "artifacts/c2/checkpoints/ckpt_step0051000.pt", "timestamp": "2026-05-05T01:41:04.277657"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 51500, "path": "artifacts/c2/checkpoints/ckpt_step0051500.pt", "timestamp": "2026-05-05T01:44:37.249519"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 52000, "path": "artifacts/c2/checkpoints/ckpt_step0052000.pt", "timestamp": "2026-05-05T01:48:11.602737"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 52500, "path": "artifacts/c2/checkpoints/ckpt_step0052500.pt", "timestamp": "2026-05-05T01:51:45.550140"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 53000, "path": "artifacts/c2/checkpoints/ckpt_step0053000.pt", "timestamp": "2026-05-05T01:55:20.569368"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 53000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T01:55:21.509022"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 53500, "path": "artifacts/c2/checkpoints/ckpt_step0053500.pt", "timestamp": "2026-05-05T01:58:56.759123"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 54000, "path": "artifacts/c2/checkpoints/ckpt_step0054000.pt", "timestamp": "2026-05-05T02:02:37.198236"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 54000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T02:02:38.124472"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 54500, "path": "artifacts/c2/checkpoints/ckpt_step0054500.pt", "timestamp": "2026-05-05T02:06:14.593044"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 55000, "path": "artifacts/c2/checkpoints/ckpt_step0055000.pt", "timestamp": "2026-05-05T02:09:50.577235"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 55500, "path": "artifacts/c2/checkpoints/ckpt_step0055500.pt", "timestamp": "2026-05-05T02:13:25.929470"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 56000, "path": "artifacts/c2/checkpoints/ckpt_step0056000.pt", "timestamp": "2026-05-05T02:17:01.005635"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 56500, "path": "artifacts/c2/checkpoints/ckpt_step0056500.pt", "timestamp": "2026-05-05T02:20:35.058409"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 57000, "path": "artifacts/c2/checkpoints/ckpt_step0057000.pt", "timestamp": "2026-05-05T02:24:09.182984"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 57500, "path": "artifacts/c2/checkpoints/ckpt_step0057500.pt", "timestamp": "2026-05-05T02:27:43.001859"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 58000, "path": "artifacts/c2/checkpoints/ckpt_step0058000.pt", "timestamp": "2026-05-05T02:31:16.149978"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 58500, "path": "artifacts/c2/checkpoints/ckpt_step0058500.pt", "timestamp": "2026-05-05T02:34:50.291544"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 59000, "path": "artifacts/c2/checkpoints/ckpt_step0059000.pt", "timestamp": "2026-05-05T02:38:24.555747"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 59500, "path": "artifacts/c2/checkpoints/ckpt_step0059500.pt", "timestamp": "2026-05-05T02:41:58.967242"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 60000, "path": "artifacts/c2/checkpoints/ckpt_step0060000.pt", "timestamp": "2026-05-05T02:45:33.668284"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 60500, "path": "artifacts/c2/checkpoints/ckpt_step0060500.pt", "timestamp": "2026-05-05T02:49:07.661930"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 61000, "path": "artifacts/c2/checkpoints/ckpt_step0061000.pt", "timestamp": "2026-05-05T02:52:42.478664"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 61500, "path": "artifacts/c2/checkpoints/ckpt_step0061500.pt", "timestamp": "2026-05-05T02:56:18.138931"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 62000, "path": "artifacts/c2/checkpoints/ckpt_step0062000.pt", "timestamp": "2026-05-05T02:59:52.909119"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 62500, "path": "artifacts/c2/checkpoints/ckpt_step0062500.pt", "timestamp": "2026-05-05T03:03:28.146235"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 63000, "path": "artifacts/c2/checkpoints/ckpt_step0063000.pt", "timestamp": "2026-05-05T03:07:02.081683"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 63000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T03:07:02.997468"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 63500, "path": "artifacts/c2/checkpoints/ckpt_step0063500.pt", "timestamp": "2026-05-05T03:10:40.623001"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 64000, "path": "artifacts/c2/checkpoints/ckpt_step0064000.pt", "timestamp": "2026-05-05T03:14:10.206324"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 64500, "path": "artifacts/c2/checkpoints/ckpt_step0064500.pt", "timestamp": "2026-05-05T03:17:40.773151"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 65000, "path": "artifacts/c2/checkpoints/ckpt_step0065000.pt", "timestamp": "2026-05-05T03:21:10.271135"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 65500, "path": "artifacts/c2/checkpoints/ckpt_step0065500.pt", "timestamp": "2026-05-05T03:24:39.893399"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 66000, "path": "artifacts/c2/checkpoints/ckpt_step0066000.pt", "timestamp": "2026-05-05T03:28:10.440559"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 66500, "path": "artifacts/c2/checkpoints/ckpt_step0066500.pt", "timestamp": "2026-05-05T03:31:41.292818"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 67000, "path": "artifacts/c2/checkpoints/ckpt_step0067000.pt", "timestamp": "2026-05-05T03:35:11.743968"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 67500, "path": "artifacts/c2/checkpoints/ckpt_step0067500.pt", "timestamp": "2026-05-05T03:38:41.753218"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 68000, "path": "artifacts/c2/checkpoints/ckpt_step0068000.pt", "timestamp": "2026-05-05T03:42:11.607967"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 68500, "path": "artifacts/c2/checkpoints/ckpt_step0068500.pt", "timestamp": "2026-05-05T03:45:40.732238"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 69000, "path": "artifacts/c2/checkpoints/ckpt_step0069000.pt", "timestamp": "2026-05-05T03:49:09.216500"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 69500, "path": "artifacts/c2/checkpoints/ckpt_step0069500.pt", "timestamp": "2026-05-05T03:52:38.451307"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 70000, "path": "artifacts/c2/checkpoints/ckpt_step0070000.pt", "timestamp": "2026-05-05T03:56:07.767576"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 70500, "path": "artifacts/c2/checkpoints/ckpt_step0070500.pt", "timestamp": "2026-05-05T03:59:36.145726"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 71000, "path": "artifacts/c2/checkpoints/ckpt_step0071000.pt", "timestamp": "2026-05-05T04:03:05.144792"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 71500, "path": "artifacts/c2/checkpoints/ckpt_step0071500.pt", "timestamp": "2026-05-05T04:06:34.400719"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 72000, "path": "artifacts/c2/checkpoints/ckpt_step0072000.pt", "timestamp": "2026-05-05T04:10:03.602582"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 72500, "path": "artifacts/c2/checkpoints/ckpt_step0072500.pt", "timestamp": "2026-05-05T04:13:33.400362"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 73000, "path": "artifacts/c2/checkpoints/ckpt_step0073000.pt", "timestamp": "2026-05-05T04:17:02.914126"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 73500, "path": "artifacts/c2/checkpoints/ckpt_step0073500.pt", "timestamp": "2026-05-05T04:20:32.300875"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 74000, "path": "artifacts/c2/checkpoints/ckpt_step0074000.pt", "timestamp": "2026-05-05T04:24:02.049636"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 74500, "path": "artifacts/c2/checkpoints/ckpt_step0074500.pt", "timestamp": "2026-05-05T04:27:31.200827"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 75000, "path": "artifacts/c2/checkpoints/ckpt_step0075000.pt", "timestamp": "2026-05-05T04:31:00.636999"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 75500, "path": "artifacts/c2/checkpoints/ckpt_step0075500.pt", "timestamp": "2026-05-05T04:34:29.719933"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 76000, "path": "artifacts/c2/checkpoints/ckpt_step0076000.pt", "timestamp": "2026-05-05T04:37:59.679950"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 76500, "path": "artifacts/c2/checkpoints/ckpt_step0076500.pt", "timestamp": "2026-05-05T04:41:29.125304"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 77000, "path": "artifacts/c2/checkpoints/ckpt_step0077000.pt", "timestamp": "2026-05-05T04:44:58.189302"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 77500, "path": "artifacts/c2/checkpoints/ckpt_step0077500.pt", "timestamp": "2026-05-05T04:48:27.045411"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 78000, "path": "artifacts/c2/checkpoints/ckpt_step0078000.pt", "timestamp": "2026-05-05T04:51:55.803709"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 78500, "path": "artifacts/c2/checkpoints/ckpt_step0078500.pt", "timestamp": "2026-05-05T04:55:24.816039"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 79000, "path": "artifacts/c2/checkpoints/ckpt_step0079000.pt", "timestamp": "2026-05-05T04:58:53.749490"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 79500, "path": "artifacts/c2/checkpoints/ckpt_step0079500.pt", "timestamp": "2026-05-05T05:02:23.187466"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 80000, "path": "artifacts/c2/checkpoints/ckpt_step0080000.pt", "timestamp": "2026-05-05T05:05:51.789635"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 80500, "path": "artifacts/c2/checkpoints/ckpt_step0080500.pt", "timestamp": "2026-05-05T05:09:20.988700"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 81000, "path": "artifacts/c2/checkpoints/ckpt_step0081000.pt", "timestamp": "2026-05-05T05:12:50.742366"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 81500, "path": "artifacts/c2/checkpoints/ckpt_step0081500.pt", "timestamp": "2026-05-05T05:16:18.314073"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 82000, "path": "artifacts/c2/checkpoints/ckpt_step0082000.pt", "timestamp": "2026-05-05T05:19:45.731644"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 82500, "path": "artifacts/c2/checkpoints/ckpt_step0082500.pt", "timestamp": "2026-05-05T05:23:13.590769"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 83000, "path": "artifacts/c2/checkpoints/ckpt_step0083000.pt", "timestamp": "2026-05-05T05:26:41.488695"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 83500, "path": "artifacts/c2/checkpoints/ckpt_step0083500.pt", "timestamp": "2026-05-05T05:30:10.015029"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 84000, "path": "artifacts/c2/checkpoints/ckpt_step0084000.pt", "timestamp": "2026-05-05T05:33:38.459867"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 84500, "path": "artifacts/c2/checkpoints/ckpt_step0084500.pt", "timestamp": "2026-05-05T05:37:07.695034"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 85000, "path": "artifacts/c2/checkpoints/ckpt_step0085000.pt", "timestamp": "2026-05-05T05:40:35.566712"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 85500, "path": "artifacts/c2/checkpoints/ckpt_step0085500.pt", "timestamp": "2026-05-05T05:44:04.855637"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 86000, "path": "artifacts/c2/checkpoints/ckpt_step0086000.pt", "timestamp": "2026-05-05T05:47:32.968873"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 86500, "path": "artifacts/c2/checkpoints/ckpt_step0086500.pt", "timestamp": "2026-05-05T05:51:01.778350"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 87000, "path": "artifacts/c2/checkpoints/ckpt_step0087000.pt", "timestamp": "2026-05-05T05:54:30.481515"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 87500, "path": "artifacts/c2/checkpoints/ckpt_step0087500.pt", "timestamp": "2026-05-05T05:58:00.050529"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 87500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T05:58:00.987741"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 88000, "path": "artifacts/c2/checkpoints/ckpt_step0088000.pt", "timestamp": "2026-05-05T06:01:29.694602"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 88500, "path": "artifacts/c2/checkpoints/ckpt_step0088500.pt", "timestamp": "2026-05-05T06:04:58.783944"} {"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 88500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T06:04:59.598538"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 89000, "path": "artifacts/c2/checkpoints/ckpt_step0089000.pt", "timestamp": "2026-05-05T06:08:28.132788"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 89500, "path": "artifacts/c2/checkpoints/ckpt_step0089500.pt", "timestamp": "2026-05-05T06:11:56.919763"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 90000, "path": "artifacts/c2/checkpoints/ckpt_step0090000.pt", "timestamp": "2026-05-05T06:15:24.500092"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 90500, "path": "artifacts/c2/checkpoints/ckpt_step0090500.pt", "timestamp": "2026-05-05T06:18:52.669982"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 91000, "path": "artifacts/c2/checkpoints/ckpt_step0091000.pt", "timestamp": "2026-05-05T06:22:21.345356"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 91500, "path": "artifacts/c2/checkpoints/ckpt_step0091500.pt", "timestamp": "2026-05-05T06:25:49.995493"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 92000, "path": "artifacts/c2/checkpoints/ckpt_step0092000.pt", "timestamp": "2026-05-05T06:29:18.544358"} {"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 92500, "path": "artifacts/c2/checkpoints/ckpt_step0092500.pt", "timestamp": "2026-05-05T06:32:47.267711"} {"run_name": "c2", "stage": "pretraining", "event": "final_checkpoint_saved", "step": 92685, "path": "artifacts/c2/checkpoints/ckpt_step0092685.pt", "best_val_loss_so_far": 3.3613099455833435, "timestamp": "2026-05-05T06:34:04.509790"} {"run_name": "c2", "stage": "pretraining", "event": "metrics_plot_saved", "path": "artifacts/c2/metrics.png", "timestamp": "2026-05-05T06:34:06.673898"} {"run_name": "c2", "stage": "pretraining", "event": "results_doc_saved", "path": "artifacts/c2/results.md", "timestamp": "2026-05-05T06:34:06.674076"}