{"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "model_summary", "total_params": 39600320, "trainable_params": 39600320, "weight_tied_lm_head": true, "timestamp": "2026-05-04T20:23:12.168209"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "config", "model": {"vocab_size": 50304, "n_layers": 18, "n_heads": 7, "n_kv_heads": 1, "n_embd": 448, "embedding_dim": 128, "tie_embeddings": true, "context_len": 1024, "dropout": 0.0, "bias": false, "norm_type": "rmsnorm", "norm_eps": 1e-05, "positional_embedding": "rope", "rope_theta": 10000.0, "rope_fraction": 1.0, "mlp_type": "swiglu", "mlp_hidden_mult": 4.0, "mlp_hidden_dim": 1024, "qk_norm": false, "block_style": "sequential"}, "training": {"seed": 0, "learning_rate": 0.00056, "min_lr": 5.6e-05, "weight_decay": 0.03, "beta1": 0.9, "beta2": 0.95, "grad_clip": 1.0, "max_iters": 92686, "warmup_steps": 927, "lr_schedule": "wsd", "wsd_stable_frac": 0.85, "batch_size": 4, "gradient_accumulation_steps": 16, "dtype": "float16", "device": "cuda", "eval_step_interval": 500, "eval_batches": 20, "log_interval": 10, "max_checkpoints": 5}, "distributed": {"enabled": false, "backend": "nccl"}, "timestamp": "2026-05-04T20:23:12.168449"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0000500.pt", "timestamp": "2026-05-04T20:27:55.142009"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T20:27:55.674592"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 1000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0001000.pt", "timestamp": "2026-05-04T20:31:37.784420"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 1000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T20:31:39.079554"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 1500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0001500.pt", "timestamp": "2026-05-04T20:35:21.748891"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 1500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T20:35:22.495767"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 2000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0002000.pt", "timestamp": "2026-05-04T20:39:05.235280"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 2000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T20:39:06.079682"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 2500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0002500.pt", "timestamp": "2026-05-04T20:42:49.397222"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 2500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T20:42:50.184288"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 3000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0003000.pt", "timestamp": "2026-05-04T20:46:32.806904"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 3000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T20:46:33.663517"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 3500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0003500.pt", "timestamp": "2026-05-04T20:50:17.256089"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 3500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T20:50:17.991782"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 4000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0004000.pt", "timestamp": "2026-05-04T20:54:01.211358"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 4000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T20:54:02.040620"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 4500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0004500.pt", "timestamp": "2026-05-04T20:57:45.611498"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 4500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T20:57:46.435646"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 5000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0005000.pt", "timestamp": "2026-05-04T21:01:30.398224"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 5000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:01:31.268647"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 5500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0005500.pt", "timestamp": "2026-05-04T21:05:14.470089"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 6000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0006000.pt", "timestamp": "2026-05-04T21:09:00.046189"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 6000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:09:00.910129"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 6500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0006500.pt", "timestamp": "2026-05-04T21:12:45.525830"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 6500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:12:46.240077"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 7000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0007000.pt", "timestamp": "2026-05-04T21:16:30.762666"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 7000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:16:31.487818"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 7500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0007500.pt", "timestamp": "2026-05-04T21:20:15.466466"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 8000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0008000.pt", "timestamp": "2026-05-04T21:23:59.541998"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 8500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0008500.pt", "timestamp": "2026-05-04T21:27:42.146634"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 8500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:27:43.006611"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 9000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0009000.pt", "timestamp": "2026-05-04T21:31:26.420950"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 9000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:31:27.199869"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 9500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0009500.pt", "timestamp": "2026-05-04T21:35:10.308016"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 10000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0010000.pt", "timestamp": "2026-05-04T21:38:53.645793"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 10500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0010500.pt", "timestamp": "2026-05-04T21:42:37.288633"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 11000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0011000.pt", "timestamp": "2026-05-04T21:46:21.254017"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 11500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0011500.pt", "timestamp": "2026-05-04T21:50:04.813045"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 12000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0012000.pt", "timestamp": "2026-05-04T21:53:48.282459"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 12000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:53:49.142946"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 12500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0012500.pt", "timestamp": "2026-05-04T21:57:33.671171"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 12500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:57:34.499659"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 13000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0013000.pt", "timestamp": "2026-05-04T22:01:17.566365"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 13000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T22:01:18.348870"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 13500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0013500.pt", "timestamp": "2026-05-04T22:05:02.478445"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 14000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0014000.pt", "timestamp": "2026-05-04T22:08:48.864326"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 14000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T22:08:49.694977"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 14500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0014500.pt", "timestamp": "2026-05-04T22:12:35.376898"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 15000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0015000.pt", "timestamp": "2026-05-04T22:16:18.886662"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 15500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0015500.pt", "timestamp": "2026-05-04T22:20:02.473041"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 16000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0016000.pt", "timestamp": "2026-05-04T22:23:46.768017"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 16500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0016500.pt", "timestamp": "2026-05-04T22:27:30.730754"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 17000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0017000.pt", "timestamp": "2026-05-04T22:31:13.461759"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 17500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0017500.pt", "timestamp": "2026-05-04T22:34:57.513738"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 17500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T22:34:58.366234"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 18000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0018000.pt", "timestamp": "2026-05-04T22:38:42.642444"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 18500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0018500.pt", "timestamp": "2026-05-04T22:42:26.155660"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 18500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T22:42:26.989819"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 19000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0019000.pt", "timestamp": "2026-05-04T22:46:10.970413"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 19500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0019500.pt", "timestamp": "2026-05-04T22:49:54.141197"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 20000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0020000.pt", "timestamp": "2026-05-04T22:53:36.432026"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 20500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0020500.pt", "timestamp": "2026-05-04T22:57:19.755532"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 21000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0021000.pt", "timestamp": "2026-05-04T23:01:02.902949"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 21500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0021500.pt", "timestamp": "2026-05-04T23:04:46.134141"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 22000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0022000.pt", "timestamp": "2026-05-04T23:08:28.289934"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 22500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0022500.pt", "timestamp": "2026-05-04T23:12:09.084311"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 23000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0023000.pt", "timestamp": "2026-05-04T23:15:49.337428"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 23500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0023500.pt", "timestamp": "2026-05-04T23:19:27.612330"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 23500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T23:19:28.500798"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 24000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0024000.pt", "timestamp": "2026-05-04T23:23:08.327686"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 24500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0024500.pt", "timestamp": "2026-05-04T23:26:48.315534"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 25000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0025000.pt", "timestamp": "2026-05-04T23:30:27.637895"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 25500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0025500.pt", "timestamp": "2026-05-04T23:34:08.369594"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 26000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0026000.pt", "timestamp": "2026-05-04T23:37:48.643020"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 26500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0026500.pt", "timestamp": "2026-05-04T23:41:28.086547"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 27000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0027000.pt", "timestamp": "2026-05-04T23:45:07.427421"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 27500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0027500.pt", "timestamp": "2026-05-04T23:48:47.235165"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 28000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0028000.pt", "timestamp": "2026-05-04T23:52:27.863464"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 28500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0028500.pt", "timestamp": "2026-05-04T23:56:07.434743"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 29000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0029000.pt", "timestamp": "2026-05-04T23:59:47.594114"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 29500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0029500.pt", "timestamp": "2026-05-05T00:03:27.187288"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 30000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0030000.pt", "timestamp": "2026-05-05T00:07:06.850956"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 30500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0030500.pt", "timestamp": "2026-05-05T00:10:46.574964"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 30500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T00:10:47.367391"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 31000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0031000.pt", "timestamp": "2026-05-05T00:14:27.656088"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 31500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0031500.pt", "timestamp": "2026-05-05T00:18:06.221326"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 31500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T00:18:06.950297"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 32000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0032000.pt", "timestamp": "2026-05-05T00:21:47.104745"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 32500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0032500.pt", "timestamp": "2026-05-05T00:25:26.563043"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 33000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0033000.pt", "timestamp": "2026-05-05T00:29:05.205611"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 33500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0033500.pt", "timestamp": "2026-05-05T00:32:44.824956"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 34000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0034000.pt", "timestamp": "2026-05-05T00:36:28.060636"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 34500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0034500.pt", "timestamp": "2026-05-05T00:40:12.862947"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 35000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0035000.pt", "timestamp": "2026-05-05T00:43:57.193009"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 35000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T00:43:58.038836"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 35500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0035500.pt", "timestamp": "2026-05-05T00:47:44.153795"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 36000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0036000.pt", "timestamp": "2026-05-05T00:51:27.226601"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 36500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0036500.pt", "timestamp": "2026-05-05T00:55:08.951275"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 37000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0037000.pt", "timestamp": "2026-05-05T00:58:52.771809"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 37500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0037500.pt", "timestamp": "2026-05-05T01:02:34.694434"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 38000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0038000.pt", "timestamp": "2026-05-05T01:06:17.444903"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 38500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0038500.pt", "timestamp": "2026-05-05T01:09:58.817959"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 39000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0039000.pt", "timestamp": "2026-05-05T01:13:40.692232"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 39500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0039500.pt", "timestamp": "2026-05-05T01:17:24.540333"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 40000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0040000.pt", "timestamp": "2026-05-05T01:21:09.425055"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 40500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0040500.pt", "timestamp": "2026-05-05T01:24:53.777562"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 41000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0041000.pt", "timestamp": "2026-05-05T01:28:40.001870"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 41500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0041500.pt", "timestamp": "2026-05-05T01:32:35.932718"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 42000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0042000.pt", "timestamp": "2026-05-05T01:36:22.039981"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 42500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0042500.pt", "timestamp": "2026-05-05T01:39:58.825436"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 43000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0043000.pt", "timestamp": "2026-05-05T01:43:35.723431"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 43500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0043500.pt", "timestamp": "2026-05-05T01:47:11.869682"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 44000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0044000.pt", "timestamp": "2026-05-05T01:50:48.179937"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 44500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0044500.pt", "timestamp": "2026-05-05T01:54:24.821694"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 45000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0045000.pt", "timestamp": "2026-05-05T01:58:06.137172"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 45500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0045500.pt", "timestamp": "2026-05-05T02:01:45.125545"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 46000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0046000.pt", "timestamp": "2026-05-05T02:05:23.635521"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 46500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0046500.pt", "timestamp": "2026-05-05T02:09:03.114618"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 47000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0047000.pt", "timestamp": "2026-05-05T02:12:41.875799"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 47500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0047500.pt", "timestamp": "2026-05-05T02:16:20.816540"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 48000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0048000.pt", "timestamp": "2026-05-05T02:20:01.557036"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 48000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T02:20:02.417409"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 48500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0048500.pt", "timestamp": "2026-05-05T02:23:56.818047"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 49000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0049000.pt", "timestamp": "2026-05-05T02:27:52.586887"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 49500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0049500.pt", "timestamp": "2026-05-05T02:31:36.694970"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 50000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0050000.pt", "timestamp": "2026-05-05T02:35:19.252969"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 50500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0050500.pt", "timestamp": "2026-05-05T02:39:03.203667"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 51000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0051000.pt", "timestamp": "2026-05-05T02:42:47.148243"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 51500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0051500.pt", "timestamp": "2026-05-05T02:46:32.381090"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 52000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0052000.pt", "timestamp": "2026-05-05T02:50:14.178725"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 52500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0052500.pt", "timestamp": "2026-05-05T02:53:53.819559"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 53000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0053000.pt", "timestamp": "2026-05-05T02:57:33.936652"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 53500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0053500.pt", "timestamp": "2026-05-05T03:01:13.652286"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 54000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0054000.pt", "timestamp": "2026-05-05T03:04:54.105166"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 54500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0054500.pt", "timestamp": "2026-05-05T03:08:33.487983"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 55000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0055000.pt", "timestamp": "2026-05-05T03:12:14.358738"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 55500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0055500.pt", "timestamp": "2026-05-05T03:15:54.254161"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 56000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0056000.pt", "timestamp": "2026-05-05T03:19:33.793544"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 56500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0056500.pt", "timestamp": "2026-05-05T03:23:13.771491"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 57000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0057000.pt", "timestamp": "2026-05-05T03:26:53.469058"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 57000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T03:26:54.341420"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 57500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0057500.pt", "timestamp": "2026-05-05T03:30:33.446072"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 58000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0058000.pt", "timestamp": "2026-05-05T03:34:13.152873"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 58500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0058500.pt", "timestamp": "2026-05-05T03:37:53.327885"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 59000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0059000.pt", "timestamp": "2026-05-05T03:41:32.540956"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 59500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0059500.pt", "timestamp": "2026-05-05T03:45:12.532444"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 60000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0060000.pt", "timestamp": "2026-05-05T03:48:52.226913"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 60500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0060500.pt", "timestamp": "2026-05-05T03:52:31.586998"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 61000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0061000.pt", "timestamp": "2026-05-05T03:56:11.326634"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 61500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0061500.pt", "timestamp": "2026-05-05T03:59:51.203878"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 62000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0062000.pt", "timestamp": "2026-05-05T04:03:30.545906"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 62500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0062500.pt", "timestamp": "2026-05-05T04:07:09.692297"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 63000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0063000.pt", "timestamp": "2026-05-05T04:10:49.106917"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 63500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0063500.pt", "timestamp": "2026-05-05T04:14:29.016982"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 64000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0064000.pt", "timestamp": "2026-05-05T04:18:07.911777"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 64500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0064500.pt", "timestamp": "2026-05-05T04:21:48.475087"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 65000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0065000.pt", "timestamp": "2026-05-05T04:25:28.513958"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 65500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0065500.pt", "timestamp": "2026-05-05T04:29:07.265608"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 66000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0066000.pt", "timestamp": "2026-05-05T04:32:46.847495"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 66500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0066500.pt", "timestamp": "2026-05-05T04:36:24.923896"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 67000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0067000.pt", "timestamp": "2026-05-05T04:40:03.766688"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 67500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0067500.pt", "timestamp": "2026-05-05T04:43:42.041000"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 68000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0068000.pt", "timestamp": "2026-05-05T04:47:27.158883"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 68500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0068500.pt", "timestamp": "2026-05-05T04:51:13.186825"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 69000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0069000.pt", "timestamp": "2026-05-05T04:54:51.573719"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 69500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0069500.pt", "timestamp": "2026-05-05T04:58:32.360592"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 70000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0070000.pt", "timestamp": "2026-05-05T05:02:15.737319"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 70500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0070500.pt", "timestamp": "2026-05-05T05:05:58.407409"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 71000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0071000.pt", "timestamp": "2026-05-05T05:09:50.715130"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 71500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0071500.pt", "timestamp": "2026-05-05T05:13:37.066771"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 72000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0072000.pt", "timestamp": "2026-05-05T05:17:21.731464"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 72500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0072500.pt", "timestamp": "2026-05-05T05:21:04.726329"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 73000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0073000.pt", "timestamp": "2026-05-05T05:24:50.415666"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 73500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0073500.pt", "timestamp": "2026-05-05T05:28:41.057138"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 74000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0074000.pt", "timestamp": "2026-05-05T05:32:27.257197"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 74500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0074500.pt", "timestamp": "2026-05-05T05:36:12.911282"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 75000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0075000.pt", "timestamp": "2026-05-05T05:39:57.344755"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 75500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0075500.pt", "timestamp": "2026-05-05T05:43:37.893156"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 76000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0076000.pt", "timestamp": "2026-05-05T05:47:18.749116"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 76500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0076500.pt", "timestamp": "2026-05-05T05:51:00.211835"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 77000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0077000.pt", "timestamp": "2026-05-05T05:54:40.648385"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 77500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0077500.pt", "timestamp": "2026-05-05T05:58:22.044456"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 78000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0078000.pt", "timestamp": "2026-05-05T06:02:03.752411"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 78500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0078500.pt", "timestamp": "2026-05-05T06:05:44.608926"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 79000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0079000.pt", "timestamp": "2026-05-05T06:09:28.209139"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 79500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0079500.pt", "timestamp": "2026-05-05T06:13:10.261698"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 80000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0080000.pt", "timestamp": "2026-05-05T06:16:52.513796"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 80500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0080500.pt", "timestamp": "2026-05-05T06:20:33.317844"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 81000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0081000.pt", "timestamp": "2026-05-05T06:24:15.152909"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 81500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0081500.pt", "timestamp": "2026-05-05T06:27:55.567231"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 82000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0082000.pt", "timestamp": "2026-05-05T06:31:36.360876"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 82500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0082500.pt", "timestamp": "2026-05-05T06:35:17.554042"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 82500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T06:35:18.435622"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 83000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0083000.pt", "timestamp": "2026-05-05T06:39:00.458592"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 83500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0083500.pt", "timestamp": "2026-05-05T06:42:40.425625"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 84000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0084000.pt", "timestamp": "2026-05-05T06:46:21.367398"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 84500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0084500.pt", "timestamp": "2026-05-05T06:50:02.511036"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 85000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0085000.pt", "timestamp": "2026-05-05T06:53:43.595710"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 85500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0085500.pt", "timestamp": "2026-05-05T06:57:25.241455"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 86000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0086000.pt", "timestamp": "2026-05-05T07:01:05.689244"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 86500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0086500.pt", "timestamp": "2026-05-05T07:04:47.457926"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 87000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0087000.pt", "timestamp": "2026-05-05T07:08:29.630627"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 87000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T07:08:30.499959"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 87500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0087500.pt", "timestamp": "2026-05-05T07:12:12.779069"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 87500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T07:12:13.610148"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 88000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0088000.pt", "timestamp": "2026-05-05T07:15:54.800233"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 88500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0088500.pt", "timestamp": "2026-05-05T07:19:34.729921"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 89000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0089000.pt", "timestamp": "2026-05-05T07:23:16.671092"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 89500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0089500.pt", "timestamp": "2026-05-05T07:26:57.079676"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 90000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0090000.pt", "timestamp": "2026-05-05T07:30:37.571535"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 90500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0090500.pt", "timestamp": "2026-05-05T07:34:17.830813"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 91000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0091000.pt", "timestamp": "2026-05-05T07:37:58.831705"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 91500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0091500.pt", "timestamp": "2026-05-05T07:41:39.322051"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 92000, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0092000.pt", "timestamp": "2026-05-05T07:45:19.858410"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "checkpoint_saved", "step": 92500, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0092500.pt", "timestamp": "2026-05-05T07:49:01.417994"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "final_checkpoint_saved", "step": 92686, "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/checkpoints/ckpt_step0092686.pt", "best_val_loss_so_far": 3.466200029850006, "timestamp": "2026-05-05T07:50:24.812833"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "metrics_plot_saved", "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/metrics.png", "timestamp": "2026-05-05T07:50:26.359232"} {"run_name": "final_c6_18l448_factorized_aggressive", "stage": "pretraining", "event": "results_doc_saved", "path": "artifacts/final_c6/final_c6_18l448_factorized_aggressive/results.md", "timestamp": "2026-05-05T07:50:26.359400"}