davidquarel commited on
Commit
a36c818
·
verified ·
1 Parent(s): fb44126

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/action_logprobs.pth.gz +3 -0
  2. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/action_probs.tar.gz +3 -0
  3. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/checkpoints.tar.gz +3 -0
  4. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/config.cfg +84 -0
  5. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/config.json +86 -0
  6. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/eval.jsonl +0 -0
  7. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/eval.log +0 -0
  8. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/latest_train.json +12 -0
  9. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/optimizer_state.tar.gz +3 -0
  10. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/patterning.log +15 -0
  11. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/setup.json +101 -0
  12. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/setup.txt +8 -0
  13. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/state_counts.npy +3 -0
  14. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/train.jsonl +0 -0
  15. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/train.log +0 -0
  16. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/action_logprobs.pth.gz +3 -0
  17. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/action_probs.tar.gz +3 -0
  18. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/checkpoints.tar.gz +3 -0
  19. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/config.cfg +84 -0
  20. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/config.json +86 -0
  21. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/eval.jsonl +0 -0
  22. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/eval.log +0 -0
  23. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/latest_train.json +12 -0
  24. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/optimizer_state.tar.gz +3 -0
  25. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/patterning.log +15 -0
  26. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/setup.json +101 -0
  27. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/setup.txt +8 -0
  28. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/state_counts.npy +3 -0
  29. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/train.jsonl +0 -0
  30. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/train.log +0 -0
  31. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/action_logprobs.pth.gz +3 -0
  32. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/action_probs.tar.gz +3 -0
  33. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/checkpoints.tar.gz +3 -0
  34. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/config.cfg +84 -0
  35. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/config.json +86 -0
  36. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/eval.jsonl +0 -0
  37. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/eval.log +0 -0
  38. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/latest_train.json +12 -0
  39. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/optimizer_state.tar.gz +3 -0
  40. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/patterning.log +15 -0
  41. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/setup.json +101 -0
  42. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/setup.txt +8 -0
  43. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/state_counts.npy +3 -0
  44. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/train.jsonl +0 -0
  45. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/train.log +0 -0
  46. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42/action_logprobs.pth.gz +3 -0
  47. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42/action_probs.tar.gz +3 -0
  48. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42/checkpoints.tar.gz +3 -0
  49. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42/config.cfg +83 -0
  50. al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42/config.json +85 -0
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/action_logprobs.pth.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6df348f65eb8600440510d1ce6c80d9ffb84fa2a8f3e26861103631fff60148c
3
+ size 213015295
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/action_probs.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2845d72b4613764be1d3240dcfcf29f715a7be0a410cf0e0d5ae17239872cb56
3
+ size 120673169
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/checkpoints.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f5ed1f85f8f7000743ff20f9766d9374a0799d72b5d653491487cf609f32ee8
3
+ size 1225772629
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/config.cfg ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ rl_action=train
2
+ model_type=impala
3
+ lr=5e-05
4
+ discount_rate=0.98
5
+ num_rollout_steps=64
6
+ grad_acc_per_chunk=4
7
+ num_rollout_chunks=1
8
+ cheese_loc=any
9
+ env_layout=open
10
+ alpha=1.0
11
+ env_size=13
12
+ num_levels=9600
13
+ compile=True
14
+ use_prev_action=False
15
+ weight_restrictions=None
16
+ weight_restrictions_invert=False
17
+ use_bf16=False
18
+ use_wandb=True
19
+ seed=42
20
+ mask_type=first_episode
21
+ ckpt_dir=jaxgmg2_3phase_optim_state_patt
22
+ vis_average_state=False
23
+ trim_episodes=False
24
+ num_total_env_steps=7372800000
25
+ eval_every=1
26
+ eff_horizon=None
27
+ optim=adam
28
+ env_rule=None
29
+ hf_user=davidquarel
30
+ hf_collection=None
31
+ use_hf=True
32
+ num_hf_uploads=1
33
+ use_log=True
34
+ log_optimizer_state=True
35
+ resume=jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019
36
+ resume_id=1330
37
+ resume_optim=True
38
+ checkpoint=al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000
39
+ wandb_project=jaxgmg2_patt
40
+ eval_schedule=0:1,250:2,500:5,2000:10
41
+ render_sixel=False
42
+ sixel_idx=60
43
+ live_monitor=False
44
+ run_id=0
45
+ seed_formula=None
46
+ deterministic=True
47
+ penalize_time=False
48
+ f_str_ckpt=None
49
+ duplication_factor=-1
50
+ smoke=False
51
+ ntfy=None
52
+ num_chains=6
53
+ num_draws=3000
54
+ num_steps_bw_draws=1
55
+ on_policy=True
56
+ llc_nbeta=3000
57
+ localization=10
58
+ exact_solver_each_draw=False
59
+ llc_optimizer=sgld
60
+ iw_clip_eps=None
61
+ rmsprop_burnin_steps=20
62
+ llc_data_file=llc_scan_open_reinforce.pkl
63
+ llc_checkpoint_index=None
64
+ llc_checkpoint_number=None
65
+ sink=None
66
+ repo_id=davidquarel/jaxgmg_ckpt_zip
67
+ use_shuffled_checkpoints=False
68
+ force_re_download=False
69
+ off_distribution_data=False
70
+ evaluate_every_position=False
71
+ num_prev_actions=1
72
+ eff_acc_steps=4
73
+ chunk_size=9600
74
+ env_steps_per_microbatch=153600
75
+ ckpt_path=jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000
76
+ env_steps_per_loop=614400
77
+ total_loops=12000
78
+ patt_mode=mp-inv
79
+ patt_h=0.0
80
+ patt_use_hmax=False
81
+ patt_t=0
82
+ patt_cluster=east
83
+ suscept_id=2000
84
+ model_id=al_1.0_g_0.98_id_19_seed_981019
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/config.json ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha": 1.0,
3
+ "checkpoint": "al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000",
4
+ "cheese_loc": "any",
5
+ "chunk_size": 9600,
6
+ "ckpt_dir": "jaxgmg2_3phase_optim_state_patt",
7
+ "ckpt_path": "jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000",
8
+ "compile": true,
9
+ "deterministic": true,
10
+ "discount_rate": 0.98,
11
+ "duplication_factor": -1,
12
+ "eff_acc_steps": 4,
13
+ "eff_horizon": null,
14
+ "env_layout": "open",
15
+ "env_rule": null,
16
+ "env_size": 13,
17
+ "env_steps_per_loop": 614400,
18
+ "env_steps_per_microbatch": 153600,
19
+ "eval_every": 1,
20
+ "eval_schedule": "0:1,250:2,500:5,2000:10",
21
+ "evaluate_every_position": false,
22
+ "exact_solver_each_draw": false,
23
+ "f_str_ckpt": null,
24
+ "force_re_download": false,
25
+ "grad_acc_per_chunk": 4,
26
+ "hf_collection": null,
27
+ "hf_user": "davidquarel",
28
+ "iw_clip_eps": null,
29
+ "live_monitor": false,
30
+ "llc_checkpoint_index": null,
31
+ "llc_checkpoint_number": null,
32
+ "llc_data_file": "llc_scan_open_reinforce.pkl",
33
+ "llc_nbeta": 3000,
34
+ "llc_optimizer": "sgld",
35
+ "localization": 10,
36
+ "log_optimizer_state": true,
37
+ "lr": 5e-05,
38
+ "mask_type": "first_episode",
39
+ "model_id": "al_1.0_g_0.98_id_19_seed_981019",
40
+ "model_type": "impala",
41
+ "ntfy": null,
42
+ "num_chains": 6,
43
+ "num_draws": 3000,
44
+ "num_hf_uploads": 1,
45
+ "num_levels": 9600,
46
+ "num_prev_actions": 1,
47
+ "num_rollout_chunks": 1,
48
+ "num_rollout_steps": 64,
49
+ "num_steps_bw_draws": 1,
50
+ "num_total_env_steps": 7372800000,
51
+ "off_distribution_data": false,
52
+ "on_policy": true,
53
+ "optim": "adam",
54
+ "patt_cluster": "east",
55
+ "patt_h": 0.0,
56
+ "patt_mode": "mp-inv",
57
+ "patt_t": 0,
58
+ "patt_use_hmax": false,
59
+ "penalize_time": false,
60
+ "render_sixel": false,
61
+ "repo_id": "davidquarel/jaxgmg_ckpt_zip",
62
+ "resume": "jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019",
63
+ "resume_id": 1330,
64
+ "resume_optim": true,
65
+ "rl_action": "train",
66
+ "rmsprop_burnin_steps": 20,
67
+ "run_id": 0,
68
+ "seed": 42,
69
+ "seed_formula": null,
70
+ "sink": null,
71
+ "sixel_idx": 60,
72
+ "smoke": false,
73
+ "suscept_id": 2000,
74
+ "total_loops": 12000,
75
+ "trim_episodes": false,
76
+ "use_bf16": false,
77
+ "use_hf": true,
78
+ "use_log": true,
79
+ "use_prev_action": false,
80
+ "use_shuffled_checkpoints": false,
81
+ "use_wandb": true,
82
+ "vis_average_state": false,
83
+ "wandb_project": "jaxgmg2_patt",
84
+ "weight_restrictions": null,
85
+ "weight_restrictions_invert": false
86
+ }
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/eval.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/eval.log ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/latest_train.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ts": "2026-03-05T19:56:01.816596Z",
3
+ "loop": 11999,
4
+ "env_steps": 7372799999,
5
+ "loss": 0.027530066668987274,
6
+ "avg_return": 0.8819411396980286,
7
+ "regret": 0.00022316505783237517,
8
+ "entropy": 0.10536854714155197,
9
+ "lr": 5e-05,
10
+ "discount_rate": 0.98,
11
+ "num_rollout_steps": 64
12
+ }
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/optimizer_state.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63104de909e3e93b5e529582f027eaf9e52447d03ee4bf5d55436886ac05f9dc
3
+ size 2208054834
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/patterning.log ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ============================================================
2
+ Patterning config summary
3
+ ============================================================
4
+ patt_mode: mp-inv
5
+ patt_h: 0.0
6
+ patt_cluster: east
7
+ alpha: 1.0
8
+ model_id: al_1.0_g_0.98_id_19_seed_981019
9
+ resume: jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019
10
+ resume_id: 1330
11
+ resume_optim: True
12
+ suscept_id: 2000
13
+ ckpt_path: jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000
14
+ smoke: False
15
+ ============================================================
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/setup.json ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config": {
3
+ "rl_action": "train",
4
+ "model_type": "impala",
5
+ "lr": 5e-05,
6
+ "discount_rate": 0.98,
7
+ "num_rollout_steps": 64,
8
+ "grad_acc_per_chunk": 4,
9
+ "num_rollout_chunks": 1,
10
+ "cheese_loc": "any",
11
+ "env_layout": "open",
12
+ "alpha": 1.0,
13
+ "env_size": 13,
14
+ "num_levels": 9600,
15
+ "compile": true,
16
+ "use_prev_action": false,
17
+ "weight_restrictions": null,
18
+ "weight_restrictions_invert": false,
19
+ "use_bf16": false,
20
+ "use_wandb": true,
21
+ "seed": 42,
22
+ "mask_type": "first_episode",
23
+ "ckpt_dir": "jaxgmg2_3phase_optim_state_patt",
24
+ "vis_average_state": false,
25
+ "trim_episodes": false,
26
+ "num_total_env_steps": 7372800000,
27
+ "eval_every": 1,
28
+ "eff_horizon": null,
29
+ "optim": "adam",
30
+ "env_rule": null,
31
+ "hf_user": "davidquarel",
32
+ "hf_collection": null,
33
+ "use_hf": true,
34
+ "num_hf_uploads": 1,
35
+ "use_log": true,
36
+ "log_optimizer_state": true,
37
+ "resume": "jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019",
38
+ "resume_id": 1330,
39
+ "resume_optim": true,
40
+ "checkpoint": "al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000",
41
+ "wandb_project": "jaxgmg2_patt",
42
+ "eval_schedule": "0:1,250:2,500:5,2000:10",
43
+ "render_sixel": false,
44
+ "sixel_idx": 60,
45
+ "live_monitor": false,
46
+ "run_id": 0,
47
+ "seed_formula": null,
48
+ "deterministic": true,
49
+ "penalize_time": false,
50
+ "f_str_ckpt": null,
51
+ "duplication_factor": -1,
52
+ "smoke": false,
53
+ "ntfy": null,
54
+ "num_chains": 6,
55
+ "num_draws": 3000,
56
+ "num_steps_bw_draws": 1,
57
+ "on_policy": true,
58
+ "llc_nbeta": 3000,
59
+ "localization": 10,
60
+ "exact_solver_each_draw": false,
61
+ "llc_optimizer": "sgld",
62
+ "iw_clip_eps": null,
63
+ "rmsprop_burnin_steps": 20,
64
+ "llc_data_file": "llc_scan_open_reinforce.pkl",
65
+ "llc_checkpoint_index": null,
66
+ "llc_checkpoint_number": null,
67
+ "sink": null,
68
+ "repo_id": "davidquarel/jaxgmg_ckpt_zip",
69
+ "use_shuffled_checkpoints": false,
70
+ "force_re_download": false,
71
+ "off_distribution_data": false,
72
+ "evaluate_every_position": false,
73
+ "num_prev_actions": 1,
74
+ "eff_acc_steps": 4,
75
+ "chunk_size": 9600,
76
+ "env_steps_per_microbatch": 153600,
77
+ "ckpt_path": "jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000",
78
+ "env_steps_per_loop": 614400,
79
+ "total_loops": 12000,
80
+ "patt_mode": "mp-inv",
81
+ "patt_h": 0.0,
82
+ "patt_use_hmax": false,
83
+ "patt_t": 0,
84
+ "patt_cluster": "east",
85
+ "suscept_id": 2000,
86
+ "model_id": "al_1.0_g_0.98_id_19_seed_981019"
87
+ },
88
+ "setup": {
89
+ "start_time_utc": "2026-03-05T17:08:14.446346Z",
90
+ "seed": 42,
91
+ "device": "cuda",
92
+ "python_version": "3.11.11",
93
+ "torch_version": "2.10.0+cu128",
94
+ "jax_version": "0.6.2",
95
+ "hostname": "e5babfa66034",
96
+ "platform": "Linux-6.8.0-60-generic-x86_64-with-glibc2.39",
97
+ "git_sha": null,
98
+ "git_branch": null,
99
+ "use_wandb": true
100
+ }
101
+ }
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/setup.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ Start: 2026-03-05T17:08:14.446346Z
2
+ Seed: 42
3
+ Device: cuda
4
+ Python: 3.11.11 | Torch: 2.10.0+cu128 | JAX: 0.6.2
5
+ Host: e5babfa66034
6
+ Platform: Linux-6.8.0-60-generic-x86_64-with-glibc2.39
7
+ Git: branch=None sha=None
8
+ use_wandb: True
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/state_counts.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f2e846ebe74d24c870871207d8d2f460d8355f6288e941990ee3766922f96e8
3
+ size 116288
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/train.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_1330_sus_2000_seed_42/train.log ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/action_logprobs.pth.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee3765aad71651cc3d62d3d6fb7ef4483c28a790b5b653560af33f73b905fc0d
3
+ size 211718989
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/action_probs.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57f82ecdab77005d57694b9705a3572c5bbded5a6f0dd8ec950f367abe232c28
3
+ size 151761320
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/checkpoints.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d63fd7fb6a922c9dbeac5a894a0abcfe94938aa29546b5548f9282619fdd1ec8
3
+ size 1225712169
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/config.cfg ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ rl_action=train
2
+ model_type=impala
3
+ lr=5e-05
4
+ discount_rate=0.98
5
+ num_rollout_steps=64
6
+ grad_acc_per_chunk=4
7
+ num_rollout_chunks=1
8
+ cheese_loc=any
9
+ env_layout=open
10
+ alpha=1.0
11
+ env_size=13
12
+ num_levels=9600
13
+ compile=True
14
+ use_prev_action=False
15
+ weight_restrictions=None
16
+ weight_restrictions_invert=False
17
+ use_bf16=False
18
+ use_wandb=True
19
+ seed=42
20
+ mask_type=first_episode
21
+ ckpt_dir=jaxgmg2_3phase_optim_state_patt
22
+ vis_average_state=False
23
+ trim_episodes=False
24
+ num_total_env_steps=7372800000
25
+ eval_every=1
26
+ eff_horizon=None
27
+ optim=adam
28
+ env_rule=None
29
+ hf_user=davidquarel
30
+ hf_collection=None
31
+ use_hf=True
32
+ num_hf_uploads=1
33
+ use_log=True
34
+ log_optimizer_state=True
35
+ resume=jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019
36
+ resume_id=175
37
+ resume_optim=True
38
+ checkpoint=al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000
39
+ wandb_project=jaxgmg2_patt
40
+ eval_schedule=0:1,250:2,500:5,2000:10
41
+ render_sixel=False
42
+ sixel_idx=60
43
+ live_monitor=False
44
+ run_id=0
45
+ seed_formula=None
46
+ deterministic=True
47
+ penalize_time=False
48
+ f_str_ckpt=None
49
+ duplication_factor=-1
50
+ smoke=False
51
+ ntfy=None
52
+ num_chains=6
53
+ num_draws=3000
54
+ num_steps_bw_draws=1
55
+ on_policy=True
56
+ llc_nbeta=3000
57
+ localization=10
58
+ exact_solver_each_draw=False
59
+ llc_optimizer=sgld
60
+ iw_clip_eps=None
61
+ rmsprop_burnin_steps=20
62
+ llc_data_file=llc_scan_open_reinforce.pkl
63
+ llc_checkpoint_index=None
64
+ llc_checkpoint_number=None
65
+ sink=None
66
+ repo_id=davidquarel/jaxgmg_ckpt_zip
67
+ use_shuffled_checkpoints=False
68
+ force_re_download=False
69
+ off_distribution_data=False
70
+ evaluate_every_position=False
71
+ num_prev_actions=1
72
+ eff_acc_steps=4
73
+ chunk_size=9600
74
+ env_steps_per_microbatch=153600
75
+ ckpt_path=jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000
76
+ env_steps_per_loop=614400
77
+ total_loops=12000
78
+ patt_mode=mp-inv
79
+ patt_h=0.0
80
+ patt_use_hmax=False
81
+ patt_t=0
82
+ patt_cluster=east
83
+ suscept_id=2000
84
+ model_id=al_1.0_g_0.98_id_19_seed_981019
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/config.json ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha": 1.0,
3
+ "checkpoint": "al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000",
4
+ "cheese_loc": "any",
5
+ "chunk_size": 9600,
6
+ "ckpt_dir": "jaxgmg2_3phase_optim_state_patt",
7
+ "ckpt_path": "jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000",
8
+ "compile": true,
9
+ "deterministic": true,
10
+ "discount_rate": 0.98,
11
+ "duplication_factor": -1,
12
+ "eff_acc_steps": 4,
13
+ "eff_horizon": null,
14
+ "env_layout": "open",
15
+ "env_rule": null,
16
+ "env_size": 13,
17
+ "env_steps_per_loop": 614400,
18
+ "env_steps_per_microbatch": 153600,
19
+ "eval_every": 1,
20
+ "eval_schedule": "0:1,250:2,500:5,2000:10",
21
+ "evaluate_every_position": false,
22
+ "exact_solver_each_draw": false,
23
+ "f_str_ckpt": null,
24
+ "force_re_download": false,
25
+ "grad_acc_per_chunk": 4,
26
+ "hf_collection": null,
27
+ "hf_user": "davidquarel",
28
+ "iw_clip_eps": null,
29
+ "live_monitor": false,
30
+ "llc_checkpoint_index": null,
31
+ "llc_checkpoint_number": null,
32
+ "llc_data_file": "llc_scan_open_reinforce.pkl",
33
+ "llc_nbeta": 3000,
34
+ "llc_optimizer": "sgld",
35
+ "localization": 10,
36
+ "log_optimizer_state": true,
37
+ "lr": 5e-05,
38
+ "mask_type": "first_episode",
39
+ "model_id": "al_1.0_g_0.98_id_19_seed_981019",
40
+ "model_type": "impala",
41
+ "ntfy": null,
42
+ "num_chains": 6,
43
+ "num_draws": 3000,
44
+ "num_hf_uploads": 1,
45
+ "num_levels": 9600,
46
+ "num_prev_actions": 1,
47
+ "num_rollout_chunks": 1,
48
+ "num_rollout_steps": 64,
49
+ "num_steps_bw_draws": 1,
50
+ "num_total_env_steps": 7372800000,
51
+ "off_distribution_data": false,
52
+ "on_policy": true,
53
+ "optim": "adam",
54
+ "patt_cluster": "east",
55
+ "patt_h": 0.0,
56
+ "patt_mode": "mp-inv",
57
+ "patt_t": 0,
58
+ "patt_use_hmax": false,
59
+ "penalize_time": false,
60
+ "render_sixel": false,
61
+ "repo_id": "davidquarel/jaxgmg_ckpt_zip",
62
+ "resume": "jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019",
63
+ "resume_id": 175,
64
+ "resume_optim": true,
65
+ "rl_action": "train",
66
+ "rmsprop_burnin_steps": 20,
67
+ "run_id": 0,
68
+ "seed": 42,
69
+ "seed_formula": null,
70
+ "sink": null,
71
+ "sixel_idx": 60,
72
+ "smoke": false,
73
+ "suscept_id": 2000,
74
+ "total_loops": 12000,
75
+ "trim_episodes": false,
76
+ "use_bf16": false,
77
+ "use_hf": true,
78
+ "use_log": true,
79
+ "use_prev_action": false,
80
+ "use_shuffled_checkpoints": false,
81
+ "use_wandb": true,
82
+ "vis_average_state": false,
83
+ "wandb_project": "jaxgmg2_patt",
84
+ "weight_restrictions": null,
85
+ "weight_restrictions_invert": false
86
+ }
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/eval.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/eval.log ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/latest_train.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ts": "2026-03-05T19:55:05.283675Z",
3
+ "loop": 11999,
4
+ "env_steps": 7372799999,
5
+ "loss": 0.026208939030766487,
6
+ "avg_return": 0.8814659118652344,
7
+ "regret": 0.00043080400791950524,
8
+ "entropy": 0.09881289303302765,
9
+ "lr": 5e-05,
10
+ "discount_rate": 0.98,
11
+ "num_rollout_steps": 64
12
+ }
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/optimizer_state.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6295d736bee455a06622ed134188c870ab7061a83c4363615ccf5035d18b87c1
3
+ size 2217353163
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/patterning.log ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ============================================================
2
+ Patterning config summary
3
+ ============================================================
4
+ patt_mode: mp-inv
5
+ patt_h: 0.0
6
+ patt_cluster: east
7
+ alpha: 1.0
8
+ model_id: al_1.0_g_0.98_id_19_seed_981019
9
+ resume: jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019
10
+ resume_id: 175
11
+ resume_optim: True
12
+ suscept_id: 2000
13
+ ckpt_path: jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000
14
+ smoke: False
15
+ ============================================================
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/setup.json ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config": {
3
+ "rl_action": "train",
4
+ "model_type": "impala",
5
+ "lr": 5e-05,
6
+ "discount_rate": 0.98,
7
+ "num_rollout_steps": 64,
8
+ "grad_acc_per_chunk": 4,
9
+ "num_rollout_chunks": 1,
10
+ "cheese_loc": "any",
11
+ "env_layout": "open",
12
+ "alpha": 1.0,
13
+ "env_size": 13,
14
+ "num_levels": 9600,
15
+ "compile": true,
16
+ "use_prev_action": false,
17
+ "weight_restrictions": null,
18
+ "weight_restrictions_invert": false,
19
+ "use_bf16": false,
20
+ "use_wandb": true,
21
+ "seed": 42,
22
+ "mask_type": "first_episode",
23
+ "ckpt_dir": "jaxgmg2_3phase_optim_state_patt",
24
+ "vis_average_state": false,
25
+ "trim_episodes": false,
26
+ "num_total_env_steps": 7372800000,
27
+ "eval_every": 1,
28
+ "eff_horizon": null,
29
+ "optim": "adam",
30
+ "env_rule": null,
31
+ "hf_user": "davidquarel",
32
+ "hf_collection": null,
33
+ "use_hf": true,
34
+ "num_hf_uploads": 1,
35
+ "use_log": true,
36
+ "log_optimizer_state": true,
37
+ "resume": "jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019",
38
+ "resume_id": 175,
39
+ "resume_optim": true,
40
+ "checkpoint": "al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000",
41
+ "wandb_project": "jaxgmg2_patt",
42
+ "eval_schedule": "0:1,250:2,500:5,2000:10",
43
+ "render_sixel": false,
44
+ "sixel_idx": 60,
45
+ "live_monitor": false,
46
+ "run_id": 0,
47
+ "seed_formula": null,
48
+ "deterministic": true,
49
+ "penalize_time": false,
50
+ "f_str_ckpt": null,
51
+ "duplication_factor": -1,
52
+ "smoke": false,
53
+ "ntfy": null,
54
+ "num_chains": 6,
55
+ "num_draws": 3000,
56
+ "num_steps_bw_draws": 1,
57
+ "on_policy": true,
58
+ "llc_nbeta": 3000,
59
+ "localization": 10,
60
+ "exact_solver_each_draw": false,
61
+ "llc_optimizer": "sgld",
62
+ "iw_clip_eps": null,
63
+ "rmsprop_burnin_steps": 20,
64
+ "llc_data_file": "llc_scan_open_reinforce.pkl",
65
+ "llc_checkpoint_index": null,
66
+ "llc_checkpoint_number": null,
67
+ "sink": null,
68
+ "repo_id": "davidquarel/jaxgmg_ckpt_zip",
69
+ "use_shuffled_checkpoints": false,
70
+ "force_re_download": false,
71
+ "off_distribution_data": false,
72
+ "evaluate_every_position": false,
73
+ "num_prev_actions": 1,
74
+ "eff_acc_steps": 4,
75
+ "chunk_size": 9600,
76
+ "env_steps_per_microbatch": 153600,
77
+ "ckpt_path": "jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000",
78
+ "env_steps_per_loop": 614400,
79
+ "total_loops": 12000,
80
+ "patt_mode": "mp-inv",
81
+ "patt_h": 0.0,
82
+ "patt_use_hmax": false,
83
+ "patt_t": 0,
84
+ "patt_cluster": "east",
85
+ "suscept_id": 2000,
86
+ "model_id": "al_1.0_g_0.98_id_19_seed_981019"
87
+ },
88
+ "setup": {
89
+ "start_time_utc": "2026-03-05T17:07:16.119445Z",
90
+ "seed": 42,
91
+ "device": "cuda",
92
+ "python_version": "3.11.11",
93
+ "torch_version": "2.10.0+cu128",
94
+ "jax_version": "0.6.2",
95
+ "hostname": "8bab973d7ae6",
96
+ "platform": "Linux-6.8.0-58-lowlatency-x86_64-with-glibc2.39",
97
+ "git_sha": null,
98
+ "git_branch": null,
99
+ "use_wandb": true
100
+ }
101
+ }
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/setup.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ Start: 2026-03-05T17:07:16.119445Z
2
+ Seed: 42
3
+ Device: cuda
4
+ Python: 3.11.11 | Torch: 2.10.0+cu128 | JAX: 0.6.2
5
+ Host: 8bab973d7ae6
6
+ Platform: Linux-6.8.0-58-lowlatency-x86_64-with-glibc2.39
7
+ Git: branch=None sha=None
8
+ use_wandb: True
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/state_counts.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f2e846ebe74d24c870871207d8d2f460d8355f6288e941990ee3766922f96e8
3
+ size 116288
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/train.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_175_sus_2000_seed_42/train.log ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/action_logprobs.pth.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85f4e47767f9f956f17d1498e8f1e9194b6b53fc14376d0cfc52d45b0da2a206
3
+ size 212852833
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/action_probs.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89020a8c6675a5734aaa5b598b4d73d9b6f0c287103b44fd62fbf2770018f7c2
3
+ size 148170086
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/checkpoints.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd94620d14e2c661a557d2a6eb4e28f55b49bb73fecd55914f37dce66c24a85c
3
+ size 1225714153
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/config.cfg ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ rl_action=train
2
+ model_type=impala
3
+ lr=5e-05
4
+ discount_rate=0.98
5
+ num_rollout_steps=64
6
+ grad_acc_per_chunk=4
7
+ num_rollout_chunks=1
8
+ cheese_loc=any
9
+ env_layout=open
10
+ alpha=1.0
11
+ env_size=13
12
+ num_levels=9600
13
+ compile=True
14
+ use_prev_action=False
15
+ weight_restrictions=None
16
+ weight_restrictions_invert=False
17
+ use_bf16=False
18
+ use_wandb=True
19
+ seed=42
20
+ mask_type=first_episode
21
+ ckpt_dir=jaxgmg2_3phase_optim_state_patt
22
+ vis_average_state=False
23
+ trim_episodes=False
24
+ num_total_env_steps=7372800000
25
+ eval_every=1
26
+ eff_horizon=None
27
+ optim=adam
28
+ env_rule=None
29
+ hf_user=davidquarel
30
+ hf_collection=None
31
+ use_hf=True
32
+ num_hf_uploads=1
33
+ use_log=True
34
+ log_optimizer_state=True
35
+ resume=jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019
36
+ resume_id=264
37
+ resume_optim=True
38
+ checkpoint=al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000
39
+ wandb_project=jaxgmg2_patt
40
+ eval_schedule=0:1,250:2,500:5,2000:10
41
+ render_sixel=False
42
+ sixel_idx=60
43
+ live_monitor=False
44
+ run_id=0
45
+ seed_formula=None
46
+ deterministic=True
47
+ penalize_time=False
48
+ f_str_ckpt=None
49
+ duplication_factor=-1
50
+ smoke=False
51
+ ntfy=None
52
+ num_chains=6
53
+ num_draws=3000
54
+ num_steps_bw_draws=1
55
+ on_policy=True
56
+ llc_nbeta=3000
57
+ localization=10
58
+ exact_solver_each_draw=False
59
+ llc_optimizer=sgld
60
+ iw_clip_eps=None
61
+ rmsprop_burnin_steps=20
62
+ llc_data_file=llc_scan_open_reinforce.pkl
63
+ llc_checkpoint_index=None
64
+ llc_checkpoint_number=None
65
+ sink=None
66
+ repo_id=davidquarel/jaxgmg_ckpt_zip
67
+ use_shuffled_checkpoints=False
68
+ force_re_download=False
69
+ off_distribution_data=False
70
+ evaluate_every_position=False
71
+ num_prev_actions=1
72
+ eff_acc_steps=4
73
+ chunk_size=9600
74
+ env_steps_per_microbatch=153600
75
+ ckpt_path=jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000
76
+ env_steps_per_loop=614400
77
+ total_loops=12000
78
+ patt_mode=mp-inv
79
+ patt_h=0.0
80
+ patt_use_hmax=False
81
+ patt_t=0
82
+ patt_cluster=east
83
+ suscept_id=2000
84
+ model_id=al_1.0_g_0.98_id_19_seed_981019
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/config.json ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha": 1.0,
3
+ "checkpoint": "al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000",
4
+ "cheese_loc": "any",
5
+ "chunk_size": 9600,
6
+ "ckpt_dir": "jaxgmg2_3phase_optim_state_patt",
7
+ "ckpt_path": "jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000",
8
+ "compile": true,
9
+ "deterministic": true,
10
+ "discount_rate": 0.98,
11
+ "duplication_factor": -1,
12
+ "eff_acc_steps": 4,
13
+ "eff_horizon": null,
14
+ "env_layout": "open",
15
+ "env_rule": null,
16
+ "env_size": 13,
17
+ "env_steps_per_loop": 614400,
18
+ "env_steps_per_microbatch": 153600,
19
+ "eval_every": 1,
20
+ "eval_schedule": "0:1,250:2,500:5,2000:10",
21
+ "evaluate_every_position": false,
22
+ "exact_solver_each_draw": false,
23
+ "f_str_ckpt": null,
24
+ "force_re_download": false,
25
+ "grad_acc_per_chunk": 4,
26
+ "hf_collection": null,
27
+ "hf_user": "davidquarel",
28
+ "iw_clip_eps": null,
29
+ "live_monitor": false,
30
+ "llc_checkpoint_index": null,
31
+ "llc_checkpoint_number": null,
32
+ "llc_data_file": "llc_scan_open_reinforce.pkl",
33
+ "llc_nbeta": 3000,
34
+ "llc_optimizer": "sgld",
35
+ "localization": 10,
36
+ "log_optimizer_state": true,
37
+ "lr": 5e-05,
38
+ "mask_type": "first_episode",
39
+ "model_id": "al_1.0_g_0.98_id_19_seed_981019",
40
+ "model_type": "impala",
41
+ "ntfy": null,
42
+ "num_chains": 6,
43
+ "num_draws": 3000,
44
+ "num_hf_uploads": 1,
45
+ "num_levels": 9600,
46
+ "num_prev_actions": 1,
47
+ "num_rollout_chunks": 1,
48
+ "num_rollout_steps": 64,
49
+ "num_steps_bw_draws": 1,
50
+ "num_total_env_steps": 7372800000,
51
+ "off_distribution_data": false,
52
+ "on_policy": true,
53
+ "optim": "adam",
54
+ "patt_cluster": "east",
55
+ "patt_h": 0.0,
56
+ "patt_mode": "mp-inv",
57
+ "patt_t": 0,
58
+ "patt_use_hmax": false,
59
+ "penalize_time": false,
60
+ "render_sixel": false,
61
+ "repo_id": "davidquarel/jaxgmg_ckpt_zip",
62
+ "resume": "jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019",
63
+ "resume_id": 264,
64
+ "resume_optim": true,
65
+ "rl_action": "train",
66
+ "rmsprop_burnin_steps": 20,
67
+ "run_id": 0,
68
+ "seed": 42,
69
+ "seed_formula": null,
70
+ "sink": null,
71
+ "sixel_idx": 60,
72
+ "smoke": false,
73
+ "suscept_id": 2000,
74
+ "total_loops": 12000,
75
+ "trim_episodes": false,
76
+ "use_bf16": false,
77
+ "use_hf": true,
78
+ "use_log": true,
79
+ "use_prev_action": false,
80
+ "use_shuffled_checkpoints": false,
81
+ "use_wandb": true,
82
+ "vis_average_state": false,
83
+ "wandb_project": "jaxgmg2_patt",
84
+ "weight_restrictions": null,
85
+ "weight_restrictions_invert": false
86
+ }
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/eval.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/eval.log ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/latest_train.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ts": "2026-03-05T19:58:40.844448Z",
3
+ "loop": 11999,
4
+ "env_steps": 7372799999,
5
+ "loss": 0.026006359606981277,
6
+ "avg_return": 0.8824062347412109,
7
+ "regret": 0.0001295174442930147,
8
+ "entropy": 0.0964682549238205,
9
+ "lr": 5e-05,
10
+ "discount_rate": 0.98,
11
+ "num_rollout_steps": 64
12
+ }
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/optimizer_state.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b56a526b46df0b250f490cc60fee829a2e03403697534340ee2841a487813945
3
+ size 2215812545
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/patterning.log ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ============================================================
2
+ Patterning config summary
3
+ ============================================================
4
+ patt_mode: mp-inv
5
+ patt_h: 0.0
6
+ patt_cluster: east
7
+ alpha: 1.0
8
+ model_id: al_1.0_g_0.98_id_19_seed_981019
9
+ resume: jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019
10
+ resume_id: 264
11
+ resume_optim: True
12
+ suscept_id: 2000
13
+ ckpt_path: jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000
14
+ smoke: False
15
+ ============================================================
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/setup.json ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config": {
3
+ "rl_action": "train",
4
+ "model_type": "impala",
5
+ "lr": 5e-05,
6
+ "discount_rate": 0.98,
7
+ "num_rollout_steps": 64,
8
+ "grad_acc_per_chunk": 4,
9
+ "num_rollout_chunks": 1,
10
+ "cheese_loc": "any",
11
+ "env_layout": "open",
12
+ "alpha": 1.0,
13
+ "env_size": 13,
14
+ "num_levels": 9600,
15
+ "compile": true,
16
+ "use_prev_action": false,
17
+ "weight_restrictions": null,
18
+ "weight_restrictions_invert": false,
19
+ "use_bf16": false,
20
+ "use_wandb": true,
21
+ "seed": 42,
22
+ "mask_type": "first_episode",
23
+ "ckpt_dir": "jaxgmg2_3phase_optim_state_patt",
24
+ "vis_average_state": false,
25
+ "trim_episodes": false,
26
+ "num_total_env_steps": 7372800000,
27
+ "eval_every": 1,
28
+ "eff_horizon": null,
29
+ "optim": "adam",
30
+ "env_rule": null,
31
+ "hf_user": "davidquarel",
32
+ "hf_collection": null,
33
+ "use_hf": true,
34
+ "num_hf_uploads": 1,
35
+ "use_log": true,
36
+ "log_optimizer_state": true,
37
+ "resume": "jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019",
38
+ "resume_id": 264,
39
+ "resume_optim": true,
40
+ "checkpoint": "al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000",
41
+ "wandb_project": "jaxgmg2_patt",
42
+ "eval_schedule": "0:1,250:2,500:5,2000:10",
43
+ "render_sixel": false,
44
+ "sixel_idx": 60,
45
+ "live_monitor": false,
46
+ "run_id": 0,
47
+ "seed_formula": null,
48
+ "deterministic": true,
49
+ "penalize_time": false,
50
+ "f_str_ckpt": null,
51
+ "duplication_factor": -1,
52
+ "smoke": false,
53
+ "ntfy": null,
54
+ "num_chains": 6,
55
+ "num_draws": 3000,
56
+ "num_steps_bw_draws": 1,
57
+ "on_policy": true,
58
+ "llc_nbeta": 3000,
59
+ "localization": 10,
60
+ "exact_solver_each_draw": false,
61
+ "llc_optimizer": "sgld",
62
+ "iw_clip_eps": null,
63
+ "rmsprop_burnin_steps": 20,
64
+ "llc_data_file": "llc_scan_open_reinforce.pkl",
65
+ "llc_checkpoint_index": null,
66
+ "llc_checkpoint_number": null,
67
+ "sink": null,
68
+ "repo_id": "davidquarel/jaxgmg_ckpt_zip",
69
+ "use_shuffled_checkpoints": false,
70
+ "force_re_download": false,
71
+ "off_distribution_data": false,
72
+ "evaluate_every_position": false,
73
+ "num_prev_actions": 1,
74
+ "eff_acc_steps": 4,
75
+ "chunk_size": 9600,
76
+ "env_steps_per_microbatch": 153600,
77
+ "ckpt_path": "jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000",
78
+ "env_steps_per_loop": 614400,
79
+ "total_loops": 12000,
80
+ "patt_mode": "mp-inv",
81
+ "patt_h": 0.0,
82
+ "patt_use_hmax": false,
83
+ "patt_t": 0,
84
+ "patt_cluster": "east",
85
+ "suscept_id": 2000,
86
+ "model_id": "al_1.0_g_0.98_id_19_seed_981019"
87
+ },
88
+ "setup": {
89
+ "start_time_utc": "2026-03-05T17:07:47.193146Z",
90
+ "seed": 42,
91
+ "device": "cuda",
92
+ "python_version": "3.11.11",
93
+ "torch_version": "2.10.0+cu128",
94
+ "jax_version": "0.6.2",
95
+ "hostname": "7ebec1ae3866",
96
+ "platform": "Linux-5.15.0-52-generic-x86_64-with-glibc2.39",
97
+ "git_sha": null,
98
+ "git_branch": null,
99
+ "use_wandb": true
100
+ }
101
+ }
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/setup.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ Start: 2026-03-05T17:07:47.193146Z
2
+ Seed: 42
3
+ Device: cuda
4
+ Python: 3.11.11 | Torch: 2.10.0+cu128 | JAX: 0.6.2
5
+ Host: 7ebec1ae3866
6
+ Platform: Linux-5.15.0-52-generic-x86_64-with-glibc2.39
7
+ Git: branch=None sha=None
8
+ use_wandb: True
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/state_counts.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f2e846ebe74d24c870871207d8d2f460d8355f6288e941990ee3766922f96e8
3
+ size 116288
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/train.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.00_ld-opt_1_ckpt_264_sus_2000_seed_42/train.log ADDED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42/action_logprobs.pth.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93d66960f540ee3617bafef55b6215e9c4e39fdbdb8457f233abe7c12deea26b
3
+ size 211439082
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42/action_probs.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da9fe7e12f217e653d1b063a6c3cdbbf0eaa46f01050d75e591031c4b52b6d45
3
+ size 151304733
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42/checkpoints.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e301d63e3587367d92e2e55cd8f49dca8278a94ded52cd8217ddd347a1e8bb8
3
+ size 1225647612
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42/config.cfg ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ rl_action=train
2
+ model_type=impala
3
+ lr=5e-05
4
+ discount_rate=0.98
5
+ num_rollout_steps=64
6
+ grad_acc_per_chunk=4
7
+ num_rollout_chunks=1
8
+ cheese_loc=any
9
+ env_layout=open
10
+ alpha=1.0
11
+ env_size=13
12
+ num_levels=9600
13
+ compile=True
14
+ use_prev_action=False
15
+ weight_restrictions=None
16
+ weight_restrictions_invert=False
17
+ use_bf16=False
18
+ use_wandb=True
19
+ seed=42
20
+ mask_type=first_episode
21
+ ckpt_dir=jaxgmg2_3phase_optim_state_patt
22
+ vis_average_state=False
23
+ trim_episodes=False
24
+ num_total_env_steps=7372800000
25
+ eval_every=1
26
+ eff_horizon=None
27
+ optim=adam
28
+ env_rule=None
29
+ hf_user=davidquarel
30
+ hf_collection=None
31
+ use_hf=True
32
+ num_hf_uploads=1
33
+ use_log=True
34
+ log_optimizer_state=True
35
+ resume=jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019
36
+ resume_id=175
37
+ resume_optim=True
38
+ checkpoint=al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42
39
+ wandb_project=jaxgmg2_patt
40
+ eval_schedule=0:1,250:2,500:5,2000:10
41
+ render_sixel=False
42
+ sixel_idx=60
43
+ live_monitor=False
44
+ run_id=0
45
+ seed_formula=None
46
+ deterministic=True
47
+ penalize_time=False
48
+ f_str_ckpt=None
49
+ duplication_factor=-1
50
+ smoke=False
51
+ ntfy=None
52
+ num_chains=6
53
+ num_draws=3000
54
+ num_steps_bw_draws=1
55
+ on_policy=True
56
+ llc_nbeta=3000
57
+ localization=10
58
+ exact_solver_each_draw=False
59
+ llc_optimizer=sgld
60
+ iw_clip_eps=None
61
+ rmsprop_burnin_steps=20
62
+ llc_data_file=llc_scan_open_reinforce.pkl
63
+ llc_checkpoint_index=None
64
+ llc_checkpoint_number=None
65
+ sink=None
66
+ repo_id=davidquarel/jaxgmg_ckpt_zip
67
+ use_shuffled_checkpoints=False
68
+ force_re_download=False
69
+ off_distribution_data=False
70
+ evaluate_every_position=False
71
+ num_prev_actions=1
72
+ eff_acc_steps=4
73
+ chunk_size=9600
74
+ env_steps_per_microbatch=153600
75
+ ckpt_path=jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42
76
+ env_steps_per_loop=614400
77
+ total_loops=12000
78
+ patt_mode=mp-inv
79
+ patt_h=0.0
80
+ patt_use_hmax=False
81
+ patt_t=0.05
82
+ suscept_id=2000
83
+ model_id=al_1.0_g_0.98_id_19_seed_981019
al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42/config.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha": 1.0,
3
+ "checkpoint": "al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42",
4
+ "cheese_loc": "any",
5
+ "chunk_size": 9600,
6
+ "ckpt_dir": "jaxgmg2_3phase_optim_state_patt",
7
+ "ckpt_path": "jaxgmg2_3phase_optim_state_patt/al_1.0_g_0.98_id_19_seed_981019/patt_mp-inv_t_0.05_ld-opt_1_ckpt_175_sus_2000_seed_42",
8
+ "compile": true,
9
+ "deterministic": true,
10
+ "discount_rate": 0.98,
11
+ "duplication_factor": -1,
12
+ "eff_acc_steps": 4,
13
+ "eff_horizon": null,
14
+ "env_layout": "open",
15
+ "env_rule": null,
16
+ "env_size": 13,
17
+ "env_steps_per_loop": 614400,
18
+ "env_steps_per_microbatch": 153600,
19
+ "eval_every": 1,
20
+ "eval_schedule": "0:1,250:2,500:5,2000:10",
21
+ "evaluate_every_position": false,
22
+ "exact_solver_each_draw": false,
23
+ "f_str_ckpt": null,
24
+ "force_re_download": false,
25
+ "grad_acc_per_chunk": 4,
26
+ "hf_collection": null,
27
+ "hf_user": "davidquarel",
28
+ "iw_clip_eps": null,
29
+ "live_monitor": false,
30
+ "llc_checkpoint_index": null,
31
+ "llc_checkpoint_number": null,
32
+ "llc_data_file": "llc_scan_open_reinforce.pkl",
33
+ "llc_nbeta": 3000,
34
+ "llc_optimizer": "sgld",
35
+ "localization": 10,
36
+ "log_optimizer_state": true,
37
+ "lr": 5e-05,
38
+ "mask_type": "first_episode",
39
+ "model_id": "al_1.0_g_0.98_id_19_seed_981019",
40
+ "model_type": "impala",
41
+ "ntfy": null,
42
+ "num_chains": 6,
43
+ "num_draws": 3000,
44
+ "num_hf_uploads": 1,
45
+ "num_levels": 9600,
46
+ "num_prev_actions": 1,
47
+ "num_rollout_chunks": 1,
48
+ "num_rollout_steps": 64,
49
+ "num_steps_bw_draws": 1,
50
+ "num_total_env_steps": 7372800000,
51
+ "off_distribution_data": false,
52
+ "on_policy": true,
53
+ "optim": "adam",
54
+ "patt_h": 0.0,
55
+ "patt_mode": "mp-inv",
56
+ "patt_t": 0.05,
57
+ "patt_use_hmax": false,
58
+ "penalize_time": false,
59
+ "render_sixel": false,
60
+ "repo_id": "davidquarel/jaxgmg_ckpt_zip",
61
+ "resume": "jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_19_seed_981019",
62
+ "resume_id": 175,
63
+ "resume_optim": true,
64
+ "rl_action": "train",
65
+ "rmsprop_burnin_steps": 20,
66
+ "run_id": 0,
67
+ "seed": 42,
68
+ "seed_formula": null,
69
+ "sink": null,
70
+ "sixel_idx": 60,
71
+ "smoke": false,
72
+ "suscept_id": 2000,
73
+ "total_loops": 12000,
74
+ "trim_episodes": false,
75
+ "use_bf16": false,
76
+ "use_hf": true,
77
+ "use_log": true,
78
+ "use_prev_action": false,
79
+ "use_shuffled_checkpoints": false,
80
+ "use_wandb": true,
81
+ "vis_average_state": false,
82
+ "wandb_project": "jaxgmg2_patt",
83
+ "weight_restrictions": null,
84
+ "weight_restrictions_invert": false
85
+ }