{ "final_checkpoint": "/home/seonho/arnold/dit_only_phase1_ckpt/checkpoints/100000", "last_grad_norm": 0.4453125, "last_loss_finite": true, "last_lr": 0.0, "last_policy_update_called": false, "last_scalars": { "loss": 0.01060287281870842 }, "loaded_pretrained_model_path": null, "method": "base", "phase": "phase2", "policy_type": "groot", "script_name": "train_groot_arnold_yaml.py", "steps_completed": 100000, "steps_requested": 100000 }