| { |
| "config": { |
| "rl_action": "train", |
| "model_type": "impala", |
| "lr": 5e-05, |
| "discount_rate": 0.99, |
| "num_rollout_steps": 64, |
| "grad_acc_per_chunk": 4, |
| "num_rollout_chunks": 1, |
| "cheese_loc": "any", |
| "env_layout": "open", |
| "alpha": 0.0, |
| "env_size": 13, |
| "num_levels": 9600, |
| "compile": true, |
| "use_prev_action": false, |
| "weight_restrictions": null, |
| "weight_restrictions_invert": false, |
| "use_bf16": false, |
| "use_wandb": true, |
| "no_tqdm": false, |
| "seed": 335466400, |
| "mask_type": "first_episode", |
| "ckpt_dir": "jaxgmg_fleet_test", |
| "vis_average_state": false, |
| "trim_episodes": false, |
| "num_total_env_steps": 9830400, |
| "eval_every": 1, |
| "eff_horizon": null, |
| "optim": "adam", |
| "env_rule": null, |
| "env_rule_mixture": null, |
| "hf_user": "timaeus", |
| "hf_collection": "davidquarel/jaxgmg", |
| "use_hf": true, |
| "num_hf_uploads": 1, |
| "use_log": true, |
| "log_optimizer_state": false, |
| "resume": null, |
| "resume_id": null, |
| "resume_optim": false, |
| "checkpoint": "DUMMY", |
| "wandb_project": "jaxgmg_fleet_test", |
| "eval_schedule": "0:1", |
| "render_sixel": false, |
| "sixel_idx": 60, |
| "live_monitor": false, |
| "run_id": 0, |
| "seed_formula": null, |
| "deterministic": true, |
| "penalize_time": false, |
| "f_str_ckpt": null, |
| "duplication_factor": -1, |
| "smoke": false, |
| "ntfy": "david_jaxgmg", |
| "num_chains": 6, |
| "num_draws": 3000, |
| "num_steps_bw_draws": 1, |
| "on_policy": true, |
| "llc_nbeta": 3000, |
| "localization": 10, |
| "exact_solver_each_draw": false, |
| "llc_optimizer": "sgld", |
| "iw_clip_eps": null, |
| "rmsprop_burnin_steps": 20, |
| "llc_data_file": "llc_scan_open_reinforce.pkl", |
| "llc_checkpoint_index": null, |
| "llc_checkpoint_number": null, |
| "sink": null, |
| "repo_id": "davidquarel/jaxgmg_ckpt_zip", |
| "use_shuffled_checkpoints": false, |
| "force_re_download": false, |
| "off_distribution_data": false, |
| "evaluate_every_position": false, |
| "num_prev_actions": 1, |
| "eff_acc_steps": 4, |
| "chunk_size": 9600, |
| "env_steps_per_microbatch": 153600, |
| "ckpt_path": "jaxgmg_fleet_test/DUMMY", |
| "env_steps_per_loop": 614400, |
| "total_loops": 16 |
| }, |
| "setup": { |
| "start_time_utc": "2026-03-25T23:54:22.083684Z", |
| "seed": 335466400, |
| "device": "cuda", |
| "python_version": "3.11.11", |
| "torch_version": "2.10.0+cu128", |
| "jax_version": "0.6.2", |
| "hostname": "3449f5e2b7d7", |
| "platform": "Linux-6.8.0-58-lowlatency-x86_64-with-glibc2.39", |
| "git_sha": null, |
| "git_branch": null, |
| "use_wandb": true |
| } |
| } |