fullrun / c2 /events.jsonl
huiting tang
Add files using upload-large-folder tool
9edca3c verified
{"run_name": "c2", "stage": "pretraining", "event": "model_summary", "total_params": 38227520, "trainable_params": 38227520, "weight_tied_lm_head": true, "timestamp": "2026-05-04T20:51:34.748590"}
{"run_name": "c2", "stage": "pretraining", "event": "config", "model": {"vocab_size": 50304, "n_layers": 18, "n_heads": 5, "n_kv_heads": 1, "n_embd": 320, "embedding_dim": null, "tie_embeddings": true, "context_len": 1024, "dropout": 0.0, "bias": false, "norm_type": "rmsnorm", "norm_eps": 1e-05, "positional_embedding": "rope", "rope_theta": 10000.0, "rope_fraction": 1.0, "mlp_type": "swiglu", "mlp_hidden_mult": 4.0, "mlp_hidden_dim": 1024, "qk_norm": false, "block_style": "sequential"}, "training": {"seed": 0, "learning_rate": 0.0012, "min_lr": 0.00012, "weight_decay": 0.03, "beta1": 0.9, "beta2": 0.95, "grad_clip": 1.0, "max_iters": 11586, "warmup_steps": 116, "lr_schedule": "wsd", "wsd_stable_frac": 0.85, "batch_size": 4, "gradient_accumulation_steps": 16, "dtype": "float16", "device": "cuda", "eval_step_interval": 500, "eval_batches": 20, "log_interval": 10, "max_checkpoints": 5}, "distributed": {"enabled": false, "backend": "nccl"}, "timestamp": "2026-05-04T20:51:34.748853"}
{"run_name": "c2", "stage": "pretraining", "event": "model_summary", "total_params": 38227520, "trainable_params": 38227520, "weight_tied_lm_head": true, "timestamp": "2026-05-04T20:55:51.114602"}
{"run_name": "c2", "stage": "pretraining", "event": "config", "model": {"vocab_size": 50304, "n_layers": 18, "n_heads": 5, "n_kv_heads": 1, "n_embd": 320, "embedding_dim": null, "tie_embeddings": true, "context_len": 1024, "dropout": 0.0, "bias": false, "norm_type": "rmsnorm", "norm_eps": 1e-05, "positional_embedding": "rope", "rope_theta": 10000.0, "rope_fraction": 1.0, "mlp_type": "swiglu", "mlp_hidden_mult": 4.0, "mlp_hidden_dim": 1024, "qk_norm": false, "block_style": "sequential"}, "training": {"seed": 0, "learning_rate": 0.0012, "min_lr": 0.00012, "weight_decay": 0.03, "beta1": 0.9, "beta2": 0.95, "grad_clip": 1.0, "max_iters": 92685, "warmup_steps": 116, "lr_schedule": "wsd", "wsd_stable_frac": 0.85, "batch_size": 4, "gradient_accumulation_steps": 16, "dtype": "float16", "device": "cuda", "eval_step_interval": 500, "eval_batches": 20, "log_interval": 10, "max_checkpoints": 5}, "distributed": {"enabled": false, "backend": "nccl"}, "timestamp": "2026-05-04T20:55:51.114804"}
{"run_name": "c2", "stage": "pretraining", "event": "resume", "checkpoint": "artifacts/c2/checkpoints/ckpt_step0011586.pt", "step": 11586, "best_val_loss": 3.8527660250663756, "timestamp": "2026-05-04T20:55:51.578050"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 12000, "path": "artifacts/c2/checkpoints/ckpt_step0012000.pt", "timestamp": "2026-05-04T21:00:00.110473"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 12500, "path": "artifacts/c2/checkpoints/ckpt_step0012500.pt", "timestamp": "2026-05-04T21:03:40.818712"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 13000, "path": "artifacts/c2/checkpoints/ckpt_step0013000.pt", "timestamp": "2026-05-04T21:07:21.158528"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 13500, "path": "artifacts/c2/checkpoints/ckpt_step0013500.pt", "timestamp": "2026-05-04T21:11:00.953139"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 14000, "path": "artifacts/c2/checkpoints/ckpt_step0014000.pt", "timestamp": "2026-05-04T21:14:41.734550"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 14500, "path": "artifacts/c2/checkpoints/ckpt_step0014500.pt", "timestamp": "2026-05-04T21:18:22.458649"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 14500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:18:23.064434"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 15000, "path": "artifacts/c2/checkpoints/ckpt_step0015000.pt", "timestamp": "2026-05-04T21:22:00.340468"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 15500, "path": "artifacts/c2/checkpoints/ckpt_step0015500.pt", "timestamp": "2026-05-04T21:25:36.621906"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 16000, "path": "artifacts/c2/checkpoints/ckpt_step0016000.pt", "timestamp": "2026-05-04T21:29:12.590050"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 16500, "path": "artifacts/c2/checkpoints/ckpt_step0016500.pt", "timestamp": "2026-05-04T21:32:50.330606"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 17000, "path": "artifacts/c2/checkpoints/ckpt_step0017000.pt", "timestamp": "2026-05-04T21:36:28.262577"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 17500, "path": "artifacts/c2/checkpoints/ckpt_step0017500.pt", "timestamp": "2026-05-04T21:40:04.551108"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 18000, "path": "artifacts/c2/checkpoints/ckpt_step0018000.pt", "timestamp": "2026-05-04T21:43:40.067927"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 18500, "path": "artifacts/c2/checkpoints/ckpt_step0018500.pt", "timestamp": "2026-05-04T21:47:16.668622"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 18500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:47:17.560815"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 19000, "path": "artifacts/c2/checkpoints/ckpt_step0019000.pt", "timestamp": "2026-05-04T21:50:52.991139"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 19000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:50:53.852840"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 19500, "path": "artifacts/c2/checkpoints/ckpt_step0019500.pt", "timestamp": "2026-05-04T21:54:30.514043"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 20000, "path": "artifacts/c2/checkpoints/ckpt_step0020000.pt", "timestamp": "2026-05-04T21:58:06.244586"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 20000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T21:58:07.169029"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 20500, "path": "artifacts/c2/checkpoints/ckpt_step0020500.pt", "timestamp": "2026-05-04T22:01:42.547664"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 21000, "path": "artifacts/c2/checkpoints/ckpt_step0021000.pt", "timestamp": "2026-05-04T22:05:18.903445"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 21500, "path": "artifacts/c2/checkpoints/ckpt_step0021500.pt", "timestamp": "2026-05-04T22:08:54.759245"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 22000, "path": "artifacts/c2/checkpoints/ckpt_step0022000.pt", "timestamp": "2026-05-04T22:12:35.490777"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 22500, "path": "artifacts/c2/checkpoints/ckpt_step0022500.pt", "timestamp": "2026-05-04T22:16:16.910153"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 23000, "path": "artifacts/c2/checkpoints/ckpt_step0023000.pt", "timestamp": "2026-05-04T22:19:57.275761"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 23500, "path": "artifacts/c2/checkpoints/ckpt_step0023500.pt", "timestamp": "2026-05-04T22:23:37.733214"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 23500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T22:23:38.692307"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 24000, "path": "artifacts/c2/checkpoints/ckpt_step0024000.pt", "timestamp": "2026-05-04T22:27:14.462120"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 24500, "path": "artifacts/c2/checkpoints/ckpt_step0024500.pt", "timestamp": "2026-05-04T22:30:50.186765"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 24500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T22:30:51.110454"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 25000, "path": "artifacts/c2/checkpoints/ckpt_step0025000.pt", "timestamp": "2026-05-04T22:34:26.435459"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 25500, "path": "artifacts/c2/checkpoints/ckpt_step0025500.pt", "timestamp": "2026-05-04T22:38:01.616826"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 26000, "path": "artifacts/c2/checkpoints/ckpt_step0026000.pt", "timestamp": "2026-05-04T22:41:36.171027"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 26500, "path": "artifacts/c2/checkpoints/ckpt_step0026500.pt", "timestamp": "2026-05-04T22:45:12.480833"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 27000, "path": "artifacts/c2/checkpoints/ckpt_step0027000.pt", "timestamp": "2026-05-04T22:48:49.630829"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 27500, "path": "artifacts/c2/checkpoints/ckpt_step0027500.pt", "timestamp": "2026-05-04T22:52:23.987911"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 28000, "path": "artifacts/c2/checkpoints/ckpt_step0028000.pt", "timestamp": "2026-05-04T22:55:57.996561"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 28500, "path": "artifacts/c2/checkpoints/ckpt_step0028500.pt", "timestamp": "2026-05-04T22:59:35.749865"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 29000, "path": "artifacts/c2/checkpoints/ckpt_step0029000.pt", "timestamp": "2026-05-04T23:03:12.706823"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 29500, "path": "artifacts/c2/checkpoints/ckpt_step0029500.pt", "timestamp": "2026-05-04T23:06:47.965913"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 29500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T23:06:48.838561"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 30000, "path": "artifacts/c2/checkpoints/ckpt_step0030000.pt", "timestamp": "2026-05-04T23:10:24.061996"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 30500, "path": "artifacts/c2/checkpoints/ckpt_step0030500.pt", "timestamp": "2026-05-04T23:13:58.988561"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 31000, "path": "artifacts/c2/checkpoints/ckpt_step0031000.pt", "timestamp": "2026-05-04T23:17:34.697407"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 31500, "path": "artifacts/c2/checkpoints/ckpt_step0031500.pt", "timestamp": "2026-05-04T23:21:09.933172"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 32000, "path": "artifacts/c2/checkpoints/ckpt_step0032000.pt", "timestamp": "2026-05-04T23:24:45.779797"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 32500, "path": "artifacts/c2/checkpoints/ckpt_step0032500.pt", "timestamp": "2026-05-04T23:28:20.241536"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 33000, "path": "artifacts/c2/checkpoints/ckpt_step0033000.pt", "timestamp": "2026-05-04T23:31:55.169163"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 33500, "path": "artifacts/c2/checkpoints/ckpt_step0033500.pt", "timestamp": "2026-05-04T23:35:31.951568"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 34000, "path": "artifacts/c2/checkpoints/ckpt_step0034000.pt", "timestamp": "2026-05-04T23:39:07.554608"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 34500, "path": "artifacts/c2/checkpoints/ckpt_step0034500.pt", "timestamp": "2026-05-04T23:42:45.963040"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 35000, "path": "artifacts/c2/checkpoints/ckpt_step0035000.pt", "timestamp": "2026-05-04T23:46:23.037806"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 35500, "path": "artifacts/c2/checkpoints/ckpt_step0035500.pt", "timestamp": "2026-05-04T23:50:01.391079"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 36000, "path": "artifacts/c2/checkpoints/ckpt_step0036000.pt", "timestamp": "2026-05-04T23:53:39.123535"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 36500, "path": "artifacts/c2/checkpoints/ckpt_step0036500.pt", "timestamp": "2026-05-04T23:57:15.042471"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 36500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-04T23:57:15.986028"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 37000, "path": "artifacts/c2/checkpoints/ckpt_step0037000.pt", "timestamp": "2026-05-05T00:00:52.397532"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 37500, "path": "artifacts/c2/checkpoints/ckpt_step0037500.pt", "timestamp": "2026-05-05T00:04:28.488179"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 37500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T00:04:29.328242"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 38000, "path": "artifacts/c2/checkpoints/ckpt_step0038000.pt", "timestamp": "2026-05-05T00:08:04.476478"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 38500, "path": "artifacts/c2/checkpoints/ckpt_step0038500.pt", "timestamp": "2026-05-05T00:11:39.556054"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 39000, "path": "artifacts/c2/checkpoints/ckpt_step0039000.pt", "timestamp": "2026-05-05T00:15:14.254304"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 39500, "path": "artifacts/c2/checkpoints/ckpt_step0039500.pt", "timestamp": "2026-05-05T00:18:48.741599"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 40000, "path": "artifacts/c2/checkpoints/ckpt_step0040000.pt", "timestamp": "2026-05-05T00:22:23.329858"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 40500, "path": "artifacts/c2/checkpoints/ckpt_step0040500.pt", "timestamp": "2026-05-05T00:25:58.324698"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 41000, "path": "artifacts/c2/checkpoints/ckpt_step0041000.pt", "timestamp": "2026-05-05T00:29:33.613999"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 41000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T00:29:34.493359"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 41500, "path": "artifacts/c2/checkpoints/ckpt_step0041500.pt", "timestamp": "2026-05-05T00:33:09.011262"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 42000, "path": "artifacts/c2/checkpoints/ckpt_step0042000.pt", "timestamp": "2026-05-05T00:36:43.234279"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 42500, "path": "artifacts/c2/checkpoints/ckpt_step0042500.pt", "timestamp": "2026-05-05T00:40:17.669807"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 43000, "path": "artifacts/c2/checkpoints/ckpt_step0043000.pt", "timestamp": "2026-05-05T00:43:52.501341"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 43500, "path": "artifacts/c2/checkpoints/ckpt_step0043500.pt", "timestamp": "2026-05-05T00:47:27.576226"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 44000, "path": "artifacts/c2/checkpoints/ckpt_step0044000.pt", "timestamp": "2026-05-05T00:51:05.492518"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 44500, "path": "artifacts/c2/checkpoints/ckpt_step0044500.pt", "timestamp": "2026-05-05T00:54:41.107238"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 45000, "path": "artifacts/c2/checkpoints/ckpt_step0045000.pt", "timestamp": "2026-05-05T00:58:18.115880"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 45500, "path": "artifacts/c2/checkpoints/ckpt_step0045500.pt", "timestamp": "2026-05-05T01:01:55.098593"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 46000, "path": "artifacts/c2/checkpoints/ckpt_step0046000.pt", "timestamp": "2026-05-05T01:05:28.750126"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 46500, "path": "artifacts/c2/checkpoints/ckpt_step0046500.pt", "timestamp": "2026-05-05T01:09:02.610840"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 47000, "path": "artifacts/c2/checkpoints/ckpt_step0047000.pt", "timestamp": "2026-05-05T01:12:35.776226"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 47500, "path": "artifacts/c2/checkpoints/ckpt_step0047500.pt", "timestamp": "2026-05-05T01:16:08.472641"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 48000, "path": "artifacts/c2/checkpoints/ckpt_step0048000.pt", "timestamp": "2026-05-05T01:19:42.326766"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 48500, "path": "artifacts/c2/checkpoints/ckpt_step0048500.pt", "timestamp": "2026-05-05T01:23:15.584520"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 49000, "path": "artifacts/c2/checkpoints/ckpt_step0049000.pt", "timestamp": "2026-05-05T01:26:49.541401"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 49500, "path": "artifacts/c2/checkpoints/ckpt_step0049500.pt", "timestamp": "2026-05-05T01:30:22.798284"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 50000, "path": "artifacts/c2/checkpoints/ckpt_step0050000.pt", "timestamp": "2026-05-05T01:33:56.893241"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 50500, "path": "artifacts/c2/checkpoints/ckpt_step0050500.pt", "timestamp": "2026-05-05T01:37:30.457284"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 51000, "path": "artifacts/c2/checkpoints/ckpt_step0051000.pt", "timestamp": "2026-05-05T01:41:04.277657"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 51500, "path": "artifacts/c2/checkpoints/ckpt_step0051500.pt", "timestamp": "2026-05-05T01:44:37.249519"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 52000, "path": "artifacts/c2/checkpoints/ckpt_step0052000.pt", "timestamp": "2026-05-05T01:48:11.602737"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 52500, "path": "artifacts/c2/checkpoints/ckpt_step0052500.pt", "timestamp": "2026-05-05T01:51:45.550140"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 53000, "path": "artifacts/c2/checkpoints/ckpt_step0053000.pt", "timestamp": "2026-05-05T01:55:20.569368"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 53000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T01:55:21.509022"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 53500, "path": "artifacts/c2/checkpoints/ckpt_step0053500.pt", "timestamp": "2026-05-05T01:58:56.759123"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 54000, "path": "artifacts/c2/checkpoints/ckpt_step0054000.pt", "timestamp": "2026-05-05T02:02:37.198236"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 54000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T02:02:38.124472"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 54500, "path": "artifacts/c2/checkpoints/ckpt_step0054500.pt", "timestamp": "2026-05-05T02:06:14.593044"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 55000, "path": "artifacts/c2/checkpoints/ckpt_step0055000.pt", "timestamp": "2026-05-05T02:09:50.577235"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 55500, "path": "artifacts/c2/checkpoints/ckpt_step0055500.pt", "timestamp": "2026-05-05T02:13:25.929470"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 56000, "path": "artifacts/c2/checkpoints/ckpt_step0056000.pt", "timestamp": "2026-05-05T02:17:01.005635"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 56500, "path": "artifacts/c2/checkpoints/ckpt_step0056500.pt", "timestamp": "2026-05-05T02:20:35.058409"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 57000, "path": "artifacts/c2/checkpoints/ckpt_step0057000.pt", "timestamp": "2026-05-05T02:24:09.182984"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 57500, "path": "artifacts/c2/checkpoints/ckpt_step0057500.pt", "timestamp": "2026-05-05T02:27:43.001859"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 58000, "path": "artifacts/c2/checkpoints/ckpt_step0058000.pt", "timestamp": "2026-05-05T02:31:16.149978"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 58500, "path": "artifacts/c2/checkpoints/ckpt_step0058500.pt", "timestamp": "2026-05-05T02:34:50.291544"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 59000, "path": "artifacts/c2/checkpoints/ckpt_step0059000.pt", "timestamp": "2026-05-05T02:38:24.555747"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 59500, "path": "artifacts/c2/checkpoints/ckpt_step0059500.pt", "timestamp": "2026-05-05T02:41:58.967242"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 60000, "path": "artifacts/c2/checkpoints/ckpt_step0060000.pt", "timestamp": "2026-05-05T02:45:33.668284"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 60500, "path": "artifacts/c2/checkpoints/ckpt_step0060500.pt", "timestamp": "2026-05-05T02:49:07.661930"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 61000, "path": "artifacts/c2/checkpoints/ckpt_step0061000.pt", "timestamp": "2026-05-05T02:52:42.478664"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 61500, "path": "artifacts/c2/checkpoints/ckpt_step0061500.pt", "timestamp": "2026-05-05T02:56:18.138931"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 62000, "path": "artifacts/c2/checkpoints/ckpt_step0062000.pt", "timestamp": "2026-05-05T02:59:52.909119"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 62500, "path": "artifacts/c2/checkpoints/ckpt_step0062500.pt", "timestamp": "2026-05-05T03:03:28.146235"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 63000, "path": "artifacts/c2/checkpoints/ckpt_step0063000.pt", "timestamp": "2026-05-05T03:07:02.081683"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 63000, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T03:07:02.997468"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 63500, "path": "artifacts/c2/checkpoints/ckpt_step0063500.pt", "timestamp": "2026-05-05T03:10:40.623001"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 64000, "path": "artifacts/c2/checkpoints/ckpt_step0064000.pt", "timestamp": "2026-05-05T03:14:10.206324"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 64500, "path": "artifacts/c2/checkpoints/ckpt_step0064500.pt", "timestamp": "2026-05-05T03:17:40.773151"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 65000, "path": "artifacts/c2/checkpoints/ckpt_step0065000.pt", "timestamp": "2026-05-05T03:21:10.271135"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 65500, "path": "artifacts/c2/checkpoints/ckpt_step0065500.pt", "timestamp": "2026-05-05T03:24:39.893399"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 66000, "path": "artifacts/c2/checkpoints/ckpt_step0066000.pt", "timestamp": "2026-05-05T03:28:10.440559"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 66500, "path": "artifacts/c2/checkpoints/ckpt_step0066500.pt", "timestamp": "2026-05-05T03:31:41.292818"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 67000, "path": "artifacts/c2/checkpoints/ckpt_step0067000.pt", "timestamp": "2026-05-05T03:35:11.743968"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 67500, "path": "artifacts/c2/checkpoints/ckpt_step0067500.pt", "timestamp": "2026-05-05T03:38:41.753218"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 68000, "path": "artifacts/c2/checkpoints/ckpt_step0068000.pt", "timestamp": "2026-05-05T03:42:11.607967"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 68500, "path": "artifacts/c2/checkpoints/ckpt_step0068500.pt", "timestamp": "2026-05-05T03:45:40.732238"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 69000, "path": "artifacts/c2/checkpoints/ckpt_step0069000.pt", "timestamp": "2026-05-05T03:49:09.216500"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 69500, "path": "artifacts/c2/checkpoints/ckpt_step0069500.pt", "timestamp": "2026-05-05T03:52:38.451307"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 70000, "path": "artifacts/c2/checkpoints/ckpt_step0070000.pt", "timestamp": "2026-05-05T03:56:07.767576"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 70500, "path": "artifacts/c2/checkpoints/ckpt_step0070500.pt", "timestamp": "2026-05-05T03:59:36.145726"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 71000, "path": "artifacts/c2/checkpoints/ckpt_step0071000.pt", "timestamp": "2026-05-05T04:03:05.144792"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 71500, "path": "artifacts/c2/checkpoints/ckpt_step0071500.pt", "timestamp": "2026-05-05T04:06:34.400719"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 72000, "path": "artifacts/c2/checkpoints/ckpt_step0072000.pt", "timestamp": "2026-05-05T04:10:03.602582"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 72500, "path": "artifacts/c2/checkpoints/ckpt_step0072500.pt", "timestamp": "2026-05-05T04:13:33.400362"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 73000, "path": "artifacts/c2/checkpoints/ckpt_step0073000.pt", "timestamp": "2026-05-05T04:17:02.914126"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 73500, "path": "artifacts/c2/checkpoints/ckpt_step0073500.pt", "timestamp": "2026-05-05T04:20:32.300875"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 74000, "path": "artifacts/c2/checkpoints/ckpt_step0074000.pt", "timestamp": "2026-05-05T04:24:02.049636"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 74500, "path": "artifacts/c2/checkpoints/ckpt_step0074500.pt", "timestamp": "2026-05-05T04:27:31.200827"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 75000, "path": "artifacts/c2/checkpoints/ckpt_step0075000.pt", "timestamp": "2026-05-05T04:31:00.636999"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 75500, "path": "artifacts/c2/checkpoints/ckpt_step0075500.pt", "timestamp": "2026-05-05T04:34:29.719933"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 76000, "path": "artifacts/c2/checkpoints/ckpt_step0076000.pt", "timestamp": "2026-05-05T04:37:59.679950"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 76500, "path": "artifacts/c2/checkpoints/ckpt_step0076500.pt", "timestamp": "2026-05-05T04:41:29.125304"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 77000, "path": "artifacts/c2/checkpoints/ckpt_step0077000.pt", "timestamp": "2026-05-05T04:44:58.189302"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 77500, "path": "artifacts/c2/checkpoints/ckpt_step0077500.pt", "timestamp": "2026-05-05T04:48:27.045411"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 78000, "path": "artifacts/c2/checkpoints/ckpt_step0078000.pt", "timestamp": "2026-05-05T04:51:55.803709"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 78500, "path": "artifacts/c2/checkpoints/ckpt_step0078500.pt", "timestamp": "2026-05-05T04:55:24.816039"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 79000, "path": "artifacts/c2/checkpoints/ckpt_step0079000.pt", "timestamp": "2026-05-05T04:58:53.749490"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 79500, "path": "artifacts/c2/checkpoints/ckpt_step0079500.pt", "timestamp": "2026-05-05T05:02:23.187466"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 80000, "path": "artifacts/c2/checkpoints/ckpt_step0080000.pt", "timestamp": "2026-05-05T05:05:51.789635"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 80500, "path": "artifacts/c2/checkpoints/ckpt_step0080500.pt", "timestamp": "2026-05-05T05:09:20.988700"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 81000, "path": "artifacts/c2/checkpoints/ckpt_step0081000.pt", "timestamp": "2026-05-05T05:12:50.742366"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 81500, "path": "artifacts/c2/checkpoints/ckpt_step0081500.pt", "timestamp": "2026-05-05T05:16:18.314073"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 82000, "path": "artifacts/c2/checkpoints/ckpt_step0082000.pt", "timestamp": "2026-05-05T05:19:45.731644"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 82500, "path": "artifacts/c2/checkpoints/ckpt_step0082500.pt", "timestamp": "2026-05-05T05:23:13.590769"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 83000, "path": "artifacts/c2/checkpoints/ckpt_step0083000.pt", "timestamp": "2026-05-05T05:26:41.488695"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 83500, "path": "artifacts/c2/checkpoints/ckpt_step0083500.pt", "timestamp": "2026-05-05T05:30:10.015029"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 84000, "path": "artifacts/c2/checkpoints/ckpt_step0084000.pt", "timestamp": "2026-05-05T05:33:38.459867"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 84500, "path": "artifacts/c2/checkpoints/ckpt_step0084500.pt", "timestamp": "2026-05-05T05:37:07.695034"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 85000, "path": "artifacts/c2/checkpoints/ckpt_step0085000.pt", "timestamp": "2026-05-05T05:40:35.566712"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 85500, "path": "artifacts/c2/checkpoints/ckpt_step0085500.pt", "timestamp": "2026-05-05T05:44:04.855637"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 86000, "path": "artifacts/c2/checkpoints/ckpt_step0086000.pt", "timestamp": "2026-05-05T05:47:32.968873"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 86500, "path": "artifacts/c2/checkpoints/ckpt_step0086500.pt", "timestamp": "2026-05-05T05:51:01.778350"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 87000, "path": "artifacts/c2/checkpoints/ckpt_step0087000.pt", "timestamp": "2026-05-05T05:54:30.481515"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 87500, "path": "artifacts/c2/checkpoints/ckpt_step0087500.pt", "timestamp": "2026-05-05T05:58:00.050529"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 87500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T05:58:00.987741"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 88000, "path": "artifacts/c2/checkpoints/ckpt_step0088000.pt", "timestamp": "2026-05-05T06:01:29.694602"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 88500, "path": "artifacts/c2/checkpoints/ckpt_step0088500.pt", "timestamp": "2026-05-05T06:04:58.783944"}
{"run_name": "c2", "stage": "pretraining", "event": "best_checkpoint_saved", "step": 88500, "path": "artifacts/c2/checkpoints/best_ckpt.pt", "timestamp": "2026-05-05T06:04:59.598538"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 89000, "path": "artifacts/c2/checkpoints/ckpt_step0089000.pt", "timestamp": "2026-05-05T06:08:28.132788"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 89500, "path": "artifacts/c2/checkpoints/ckpt_step0089500.pt", "timestamp": "2026-05-05T06:11:56.919763"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 90000, "path": "artifacts/c2/checkpoints/ckpt_step0090000.pt", "timestamp": "2026-05-05T06:15:24.500092"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 90500, "path": "artifacts/c2/checkpoints/ckpt_step0090500.pt", "timestamp": "2026-05-05T06:18:52.669982"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 91000, "path": "artifacts/c2/checkpoints/ckpt_step0091000.pt", "timestamp": "2026-05-05T06:22:21.345356"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 91500, "path": "artifacts/c2/checkpoints/ckpt_step0091500.pt", "timestamp": "2026-05-05T06:25:49.995493"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 92000, "path": "artifacts/c2/checkpoints/ckpt_step0092000.pt", "timestamp": "2026-05-05T06:29:18.544358"}
{"run_name": "c2", "stage": "pretraining", "event": "checkpoint_saved", "step": 92500, "path": "artifacts/c2/checkpoints/ckpt_step0092500.pt", "timestamp": "2026-05-05T06:32:47.267711"}
{"run_name": "c2", "stage": "pretraining", "event": "final_checkpoint_saved", "step": 92685, "path": "artifacts/c2/checkpoints/ckpt_step0092685.pt", "best_val_loss_so_far": 3.3613099455833435, "timestamp": "2026-05-05T06:34:04.509790"}
{"run_name": "c2", "stage": "pretraining", "event": "metrics_plot_saved", "path": "artifacts/c2/metrics.png", "timestamp": "2026-05-05T06:34:06.673898"}
{"run_name": "c2", "stage": "pretraining", "event": "results_doc_saved", "path": "artifacts/c2/results.md", "timestamp": "2026-05-05T06:34:06.674076"}