davidquarel commited on
Commit
b4535a7
·
verified ·
1 Parent(s): 4f2b9c0

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +4 -0
  2. adam_first_ep_g75/action_probs.zip +2 -2
  3. adam_first_ep_g75/checkpoints.zip +2 -2
  4. adam_first_ep_g75/eval.jsonl +0 -0
  5. adam_first_ep_g75/eval.log +0 -0
  6. adam_first_ep_g75/latest_eval.json +1 -1
  7. adam_first_ep_g75/latest_train.json +2 -2
  8. adam_first_ep_g75/policy_trace.mp4 +2 -2
  9. adam_first_ep_g75/setup.json +5 -5
  10. adam_first_ep_g75/setup.txt +5 -5
  11. adam_first_ep_g75/train.jsonl +0 -0
  12. adam_first_ep_g75/train.log +0 -0
  13. adam_first_ep_g8197/action_probs.zip +1 -1
  14. adam_first_ep_g8197/checkpoints.zip +1 -1
  15. adam_first_ep_g9513/action_probs.zip +3 -0
  16. adam_first_ep_g9513/checkpoints.zip +3 -0
  17. adam_first_ep_g9513/config.cfg +18 -0
  18. adam_first_ep_g9513/config.json +20 -0
  19. adam_first_ep_g9513/eval.jsonl +0 -0
  20. adam_first_ep_g9513/eval.log +0 -0
  21. adam_first_ep_g9513/latest_eval.json +9 -0
  22. adam_first_ep_g9513/latest_train.json +13 -0
  23. adam_first_ep_g9513/policy_trace.mp4 +3 -0
  24. adam_first_ep_g9513/setup.json +35 -0
  25. adam_first_ep_g9513/setup.txt +8 -0
  26. adam_first_ep_g9513/train.jsonl +0 -0
  27. adam_first_ep_g9513/train.log +0 -0
  28. adam_first_ep_g9868/action_probs.zip +3 -0
  29. adam_first_ep_g9868/checkpoints.zip +3 -0
  30. adam_first_ep_g9868/config.cfg +18 -0
  31. adam_first_ep_g9868/config.json +20 -0
  32. adam_first_ep_g9868/eval.jsonl +0 -0
  33. adam_first_ep_g9868/eval.log +0 -0
  34. adam_first_ep_g9868/latest_eval.json +9 -0
  35. adam_first_ep_g9868/latest_train.json +13 -0
  36. adam_first_ep_g9868/policy_trace.mp4 +3 -0
  37. adam_first_ep_g9868/setup.json +35 -0
  38. adam_first_ep_g9868/setup.txt +8 -0
  39. adam_first_ep_g9868/train.jsonl +0 -0
  40. adam_first_ep_g9868/train.log +0 -0
  41. adam_first_ep_g9964/action_probs.zip +3 -0
  42. adam_first_ep_g9964/checkpoints.zip +3 -0
  43. adam_first_ep_g9964/config.cfg +18 -0
  44. adam_first_ep_g9964/config.json +20 -0
  45. adam_first_ep_g9964/eval.jsonl +0 -0
  46. adam_first_ep_g9964/eval.log +0 -0
  47. adam_first_ep_g9964/latest_eval.json +9 -0
  48. adam_first_ep_g9964/latest_train.json +13 -0
  49. adam_first_ep_g9964/policy_trace.mp4 +3 -0
  50. adam_first_ep_g9964/setup.json +35 -0
.gitattributes CHANGED
@@ -57,3 +57,7 @@ adam_first_ep_g9649/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
57
  adam_first_ep_g9905/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
58
  adam_first_ep_g9974/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
59
  adam_first_ep_g9993/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
57
  adam_first_ep_g9905/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
58
  adam_first_ep_g9974/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
59
  adam_first_ep_g9993/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
60
+ adam_first_ep_g9513/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
61
+ adam_first_ep_g9868/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
62
+ adam_first_ep_g9964/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
63
+ adam_first_ep_g999/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
adam_first_ep_g75/action_probs.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a4dc05102a56e3012ca773a6802f3938ab7ec7ede4aa19605ed266f5bf5e3d8
3
- size 1499323
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b29a462137df46825beab15a49f00032a68fa45e893140d7937c2f60838711e2
3
+ size 1500852
adam_first_ep_g75/checkpoints.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:695ca13e9afc45800b5bd2069066b69ace77611ab0d42b30e7389460d9624e74
3
- size 1547615088
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2625e1a7d20e7ead54f1333e829eb081a779134a8ccf096859d195382808dbd9
3
+ size 1547775746
adam_first_ep_g75/eval.jsonl CHANGED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g75/eval.log CHANGED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g75/latest_eval.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "ts": "2025-09-22T22:28:03.652332Z",
3
  "loop": 32540,
4
  "env_steps": 4998144000,
5
  "exact_value_avg": 0.1519668698310852,
 
1
  {
2
+ "ts": "2025-09-22T14:27:13.675723Z",
3
  "loop": 32540,
4
  "env_steps": 4998144000,
5
  "exact_value_avg": 0.1519668698310852,
adam_first_ep_g75/latest_train.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
- "ts": "2025-09-22T22:28:08.290182Z",
3
  "loop": 32551,
4
  "env_steps": 4999987200,
5
  "loss": -0.0,
6
  "avg_return": 0.15196684002876282,
7
  "regret": 0.0,
8
- "entropy": 1.5960644361712184e-08,
9
  "lr": 5e-05,
10
  "discount_rate": 0.75,
11
  "duplication_factor": 20,
 
1
  {
2
+ "ts": "2025-09-22T14:27:18.241482Z",
3
  "loop": 32551,
4
  "env_steps": 4999987200,
5
  "loss": -0.0,
6
  "avg_return": 0.15196684002876282,
7
  "regret": 0.0,
8
+ "entropy": 1.3763517436871098e-08,
9
  "lr": 5e-05,
10
  "discount_rate": 0.75,
11
  "duplication_factor": 20,
adam_first_ep_g75/policy_trace.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:829a3316a1bf18d6c1faea06a30138d8810371cdfc1cbf720a6659cbf0a1e2b8
3
- size 256680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdc79281caae9c6fb2361684c81ebbe719376c052c5338d34f0cb95db9e65b6a
3
+ size 263845
adam_first_ep_g75/setup.json CHANGED
@@ -20,15 +20,15 @@
20
  "checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20"
21
  },
22
  "setup": {
23
- "start_time_utc": "2025-09-22T18:45:01.160505Z",
24
  "seed": 42,
25
  "device": "cuda",
26
  "python_version": "3.11.11",
27
- "torch_version": "2.10.0.dev20250921+cu126",
28
  "jax_version": "0.6.2",
29
- "hostname": "68d07fcf6382",
30
- "platform": "Linux-5.15.0-151-generic-x86_64-with-glibc2.35",
31
- "git_sha": "d957ce0d8d58615ff31dc985c5bc0720980f7b36",
32
  "git_branch": "rl/main",
33
  "use_wandb": false
34
  }
 
20
  "checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20"
21
  },
22
  "setup": {
23
+ "start_time_utc": "2025-09-22T10:50:06.914562Z",
24
  "seed": 42,
25
  "device": "cuda",
26
  "python_version": "3.11.11",
27
+ "torch_version": "2.7.0+cu126",
28
  "jax_version": "0.6.2",
29
+ "hostname": "cc99e999c817",
30
+ "platform": "Linux-5.15.0-88-generic-x86_64-with-glibc2.35",
31
+ "git_sha": "0cf8df44bc95b6408d52e80dc2ef4a758a405a91",
32
  "git_branch": "rl/main",
33
  "use_wandb": false
34
  }
adam_first_ep_g75/setup.txt CHANGED
@@ -1,8 +1,8 @@
1
- Start: 2025-09-22T18:45:01.160505Z
2
  Seed: 42
3
  Device: cuda
4
- Python: 3.11.11 | Torch: 2.10.0.dev20250921+cu126 | JAX: 0.6.2
5
- Host: 68d07fcf6382
6
- Platform: Linux-5.15.0-151-generic-x86_64-with-glibc2.35
7
- Git: branch=rl/main sha=d957ce0d8d58615ff31dc985c5bc0720980f7b36
8
  use_wandb: False
 
1
+ Start: 2025-09-22T10:50:06.914562Z
2
  Seed: 42
3
  Device: cuda
4
+ Python: 3.11.11 | Torch: 2.7.0+cu126 | JAX: 0.6.2
5
+ Host: cc99e999c817
6
+ Platform: Linux-5.15.0-88-generic-x86_64-with-glibc2.35
7
+ Git: branch=rl/main sha=0cf8df44bc95b6408d52e80dc2ef4a758a405a91
8
  use_wandb: False
adam_first_ep_g75/train.jsonl CHANGED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g75/train.log CHANGED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g8197/action_probs.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:700fa00d6129f1594833a9c38285321eca30061cd8ae3ac9f5c3500c2c333c15
3
  size 1517192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:618c7f4712c4d4c0a94d310726cc6f66b58c68d52ec2d69b10cdc901d7730e79
3
  size 1517192
adam_first_ep_g8197/checkpoints.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ccf2c74c4b824bd415835015b1f6d71d6abb6f40a9fbd1c9e74dab496af6e80d
3
  size 1547483646
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cdad3e38dd740e486a5ebc33cf39cd4f949146febb63e156db0039f0a79d4d7
3
  size 1547483646
adam_first_ep_g9513/action_probs.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aca3dedf6dcfe7a2a1207a0f6e7734b266739dd99d4d7a452b21200da96515a1
3
+ size 1734748
adam_first_ep_g9513/checkpoints.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b40fd13f6cf82f2c4267aafdd8a1f25c7b91b12c14311fccef489a75d5899b5
3
+ size 1547420280
adam_first_ep_g9513/config.cfg ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ num_rollout_steps=64
2
+ lr=5e-05
3
+ discount_rate=0.9513
4
+ eff_horizon=None
5
+ eval_every=10
6
+ duplication_factor=20
7
+ use_wandb=False
8
+ num_total_env_steps=5000000000
9
+ checkpoint=adam_first_ep_g9513
10
+ num_levels=None
11
+ render_sixel=False
12
+ seed=42
13
+ mask_type=first_episode
14
+ penalize_time=False
15
+ corner_size=1
16
+ optim=adam
17
+ live_monitor=True
18
+ checkpoint_schedule=0:1,250:2,500:5,1000:10,2000:20
adam_first_ep_g9513/config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "checkpoint": "adam_first_ep_g9513",
3
+ "checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20",
4
+ "corner_size": 1,
5
+ "discount_rate": 0.9513,
6
+ "duplication_factor": 20,
7
+ "eff_horizon": null,
8
+ "eval_every": 10,
9
+ "live_monitor": true,
10
+ "lr": 5e-05,
11
+ "mask_type": "first_episode",
12
+ "num_levels": null,
13
+ "num_rollout_steps": 64,
14
+ "num_total_env_steps": 5000000000,
15
+ "optim": "adam",
16
+ "penalize_time": false,
17
+ "render_sixel": false,
18
+ "seed": 42,
19
+ "use_wandb": false
20
+ }
adam_first_ep_g9513/eval.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g9513/eval.log ADDED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g9513/latest_eval.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ts": "2025-09-23T02:04:47.760339Z",
3
+ "loop": 32540,
4
+ "env_steps": 4998144000,
5
+ "exact_value_avg": 0.6508079767227173,
6
+ "regret": 5.960464477539063e-08,
7
+ "exact_optimal_return": 0.6508080363273621,
8
+ "action_probs_image_path": "jaxgmg_ckpt_pt/adam_first_ep_g9513/action_probs/img_32540.png"
9
+ }
adam_first_ep_g9513/latest_train.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ts": "2025-09-23T02:04:52.287214Z",
3
+ "loop": 32551,
4
+ "env_steps": 4999987200,
5
+ "loss": 6.763982582924655e-07,
6
+ "avg_return": 0.6508080363273621,
7
+ "regret": 5.960464477539063e-08,
8
+ "entropy": 4.164845449849963e-05,
9
+ "lr": 5e-05,
10
+ "discount_rate": 0.9513,
11
+ "duplication_factor": 20,
12
+ "num_rollout_steps": 64
13
+ }
adam_first_ep_g9513/policy_trace.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0f3c7dceb6b3bb7e64dc2c47727d8cd2da3bb563cab3fa1ea5b58189d6f0eb5
3
+ size 323534
adam_first_ep_g9513/setup.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config": {
3
+ "num_rollout_steps": 64,
4
+ "lr": 5e-05,
5
+ "discount_rate": 0.9513,
6
+ "eff_horizon": null,
7
+ "eval_every": 10,
8
+ "duplication_factor": 20,
9
+ "use_wandb": false,
10
+ "num_total_env_steps": 5000000000,
11
+ "checkpoint": "adam_first_ep_g9513",
12
+ "num_levels": null,
13
+ "render_sixel": false,
14
+ "seed": 42,
15
+ "mask_type": "first_episode",
16
+ "penalize_time": false,
17
+ "corner_size": 1,
18
+ "optim": "adam",
19
+ "live_monitor": true,
20
+ "checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20"
21
+ },
22
+ "setup": {
23
+ "start_time_utc": "2025-09-22T22:27:03.078571Z",
24
+ "seed": 42,
25
+ "device": "cuda",
26
+ "python_version": "3.11.11",
27
+ "torch_version": "2.7.0+cu126",
28
+ "jax_version": "0.6.2",
29
+ "hostname": "cc99e999c817",
30
+ "platform": "Linux-5.15.0-88-generic-x86_64-with-glibc2.35",
31
+ "git_sha": "0cf8df44bc95b6408d52e80dc2ef4a758a405a91",
32
+ "git_branch": "rl/main",
33
+ "use_wandb": false
34
+ }
35
+ }
adam_first_ep_g9513/setup.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ Start: 2025-09-22T22:27:03.078571Z
2
+ Seed: 42
3
+ Device: cuda
4
+ Python: 3.11.11 | Torch: 2.7.0+cu126 | JAX: 0.6.2
5
+ Host: cc99e999c817
6
+ Platform: Linux-5.15.0-88-generic-x86_64-with-glibc2.35
7
+ Git: branch=rl/main sha=0cf8df44bc95b6408d52e80dc2ef4a758a405a91
8
+ use_wandb: False
adam_first_ep_g9513/train.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g9513/train.log ADDED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g9868/action_probs.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92322d73f0ed3e29149b6154bd8c4c6c5ba896e52f2b57f853f8cc6f3632a2e7
3
+ size 1574159
adam_first_ep_g9868/checkpoints.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3ae51df9cf7dc49e223e0407396579dbd68ee4842493721d7d552a4aa244a88
3
+ size 1547657682
adam_first_ep_g9868/config.cfg ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ num_rollout_steps=64
2
+ lr=5e-05
3
+ discount_rate=0.9868
4
+ eff_horizon=None
5
+ eval_every=10
6
+ duplication_factor=20
7
+ use_wandb=False
8
+ num_total_env_steps=5000000000
9
+ checkpoint=adam_first_ep_g9868
10
+ num_levels=None
11
+ render_sixel=False
12
+ seed=42
13
+ mask_type=first_episode
14
+ penalize_time=False
15
+ corner_size=1
16
+ optim=adam
17
+ live_monitor=True
18
+ checkpoint_schedule=0:1,250:2,500:5,1000:10,2000:20
adam_first_ep_g9868/config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "checkpoint": "adam_first_ep_g9868",
3
+ "checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20",
4
+ "corner_size": 1,
5
+ "discount_rate": 0.9868,
6
+ "duplication_factor": 20,
7
+ "eff_horizon": null,
8
+ "eval_every": 10,
9
+ "live_monitor": true,
10
+ "lr": 5e-05,
11
+ "mask_type": "first_episode",
12
+ "num_levels": null,
13
+ "num_rollout_steps": 64,
14
+ "num_total_env_steps": 5000000000,
15
+ "optim": "adam",
16
+ "penalize_time": false,
17
+ "render_sixel": false,
18
+ "seed": 42,
19
+ "use_wandb": false
20
+ }
adam_first_ep_g9868/eval.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g9868/eval.log ADDED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g9868/latest_eval.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ts": "2025-09-23T05:46:34.424210Z",
3
+ "loop": 32540,
4
+ "env_steps": 4998144000,
5
+ "exact_value_avg": 0.8878134489059448,
6
+ "regret": 0.0,
7
+ "exact_optimal_return": 0.8878134489059448,
8
+ "action_probs_image_path": "jaxgmg_ckpt_pt/adam_first_ep_g9868/action_probs/img_32540.png"
9
+ }
adam_first_ep_g9868/latest_train.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ts": "2025-09-23T05:46:38.964333Z",
3
+ "loop": 32551,
4
+ "env_steps": 4999987200,
5
+ "loss": 1.096579563264477e-10,
6
+ "avg_return": 0.8878134489059448,
7
+ "regret": 0.0,
8
+ "entropy": 3.708085216658219e-08,
9
+ "lr": 5e-05,
10
+ "discount_rate": 0.9868,
11
+ "duplication_factor": 20,
12
+ "num_rollout_steps": 64
13
+ }
adam_first_ep_g9868/policy_trace.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:460ee0e5281b293de1ed209432b452e128c50ba862988de42593b8e0bd45a6db
3
+ size 301478
adam_first_ep_g9868/setup.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config": {
3
+ "num_rollout_steps": 64,
4
+ "lr": 5e-05,
5
+ "discount_rate": 0.9868,
6
+ "eff_horizon": null,
7
+ "eval_every": 10,
8
+ "duplication_factor": 20,
9
+ "use_wandb": false,
10
+ "num_total_env_steps": 5000000000,
11
+ "checkpoint": "adam_first_ep_g9868",
12
+ "num_levels": null,
13
+ "render_sixel": false,
14
+ "seed": 42,
15
+ "mask_type": "first_episode",
16
+ "penalize_time": false,
17
+ "corner_size": 1,
18
+ "optim": "adam",
19
+ "live_monitor": true,
20
+ "checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20"
21
+ },
22
+ "setup": {
23
+ "start_time_utc": "2025-09-23T02:09:04.013196Z",
24
+ "seed": 42,
25
+ "device": "cuda",
26
+ "python_version": "3.11.11",
27
+ "torch_version": "2.7.0+cu126",
28
+ "jax_version": "0.6.2",
29
+ "hostname": "cc99e999c817",
30
+ "platform": "Linux-5.15.0-88-generic-x86_64-with-glibc2.35",
31
+ "git_sha": "0cf8df44bc95b6408d52e80dc2ef4a758a405a91",
32
+ "git_branch": "rl/main",
33
+ "use_wandb": false
34
+ }
35
+ }
adam_first_ep_g9868/setup.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ Start: 2025-09-23T02:09:04.013196Z
2
+ Seed: 42
3
+ Device: cuda
4
+ Python: 3.11.11 | Torch: 2.7.0+cu126 | JAX: 0.6.2
5
+ Host: cc99e999c817
6
+ Platform: Linux-5.15.0-88-generic-x86_64-with-glibc2.35
7
+ Git: branch=rl/main sha=0cf8df44bc95b6408d52e80dc2ef4a758a405a91
8
+ use_wandb: False
adam_first_ep_g9868/train.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g9868/train.log ADDED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g9964/action_probs.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1d011009d2e8c6a49ebc070b4e1b1bd928adfe94b2b80882c4ba911dc99ba11
3
+ size 1989878
adam_first_ep_g9964/checkpoints.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6296ec57625aa728e4b6ab43124511be0de2e005d66232943c09c526071e4d44
3
+ size 1547268470
adam_first_ep_g9964/config.cfg ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ num_rollout_steps=64
2
+ lr=5e-05
3
+ discount_rate=0.9964
4
+ eff_horizon=None
5
+ eval_every=10
6
+ duplication_factor=20
7
+ use_wandb=False
8
+ num_total_env_steps=5000000000
9
+ checkpoint=adam_first_ep_g9964
10
+ num_levels=None
11
+ render_sixel=False
12
+ seed=42
13
+ mask_type=first_episode
14
+ penalize_time=False
15
+ corner_size=1
16
+ optim=adam
17
+ live_monitor=True
18
+ checkpoint_schedule=0:1,250:2,500:5,1000:10,2000:20
adam_first_ep_g9964/config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "checkpoint": "adam_first_ep_g9964",
3
+ "checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20",
4
+ "corner_size": 1,
5
+ "discount_rate": 0.9964,
6
+ "duplication_factor": 20,
7
+ "eff_horizon": null,
8
+ "eval_every": 10,
9
+ "live_monitor": true,
10
+ "lr": 5e-05,
11
+ "mask_type": "first_episode",
12
+ "num_levels": null,
13
+ "num_rollout_steps": 64,
14
+ "num_total_env_steps": 5000000000,
15
+ "optim": "adam",
16
+ "penalize_time": false,
17
+ "render_sixel": false,
18
+ "seed": 42,
19
+ "use_wandb": false
20
+ }
adam_first_ep_g9964/eval.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g9964/eval.log ADDED
The diff for this file is too large to render. See raw diff
 
adam_first_ep_g9964/latest_eval.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ts": "2025-09-23T09:28:44.224525Z",
3
+ "loop": 32540,
4
+ "env_steps": 4998144000,
5
+ "exact_value_avg": 0.9678743481636047,
6
+ "regret": 1.9073486328125e-05,
7
+ "exact_optimal_return": 0.9678934216499329,
8
+ "action_probs_image_path": "jaxgmg_ckpt_pt/adam_first_ep_g9964/action_probs/img_32540.png"
9
+ }
adam_first_ep_g9964/latest_train.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ts": "2025-09-23T09:28:48.788429Z",
3
+ "loop": 32551,
4
+ "env_steps": 4999987200,
5
+ "loss": 0.0012626618845388293,
6
+ "avg_return": 0.967880368232727,
7
+ "regret": 1.9073486328125e-05,
8
+ "entropy": 0.008353522047400475,
9
+ "lr": 5e-05,
10
+ "discount_rate": 0.9964,
11
+ "duplication_factor": 20,
12
+ "num_rollout_steps": 64
13
+ }
adam_first_ep_g9964/policy_trace.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8beb4b71b991fb0fe383fae857903794bca5b868081b918e468f7bc32ce4f4e
3
+ size 402139
adam_first_ep_g9964/setup.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config": {
3
+ "num_rollout_steps": 64,
4
+ "lr": 5e-05,
5
+ "discount_rate": 0.9964,
6
+ "eff_horizon": null,
7
+ "eval_every": 10,
8
+ "duplication_factor": 20,
9
+ "use_wandb": false,
10
+ "num_total_env_steps": 5000000000,
11
+ "checkpoint": "adam_first_ep_g9964",
12
+ "num_levels": null,
13
+ "render_sixel": false,
14
+ "seed": 42,
15
+ "mask_type": "first_episode",
16
+ "penalize_time": false,
17
+ "corner_size": 1,
18
+ "optim": "adam",
19
+ "live_monitor": true,
20
+ "checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20"
21
+ },
22
+ "setup": {
23
+ "start_time_utc": "2025-09-23T05:50:58.197276Z",
24
+ "seed": 42,
25
+ "device": "cuda",
26
+ "python_version": "3.11.11",
27
+ "torch_version": "2.7.0+cu126",
28
+ "jax_version": "0.6.2",
29
+ "hostname": "cc99e999c817",
30
+ "platform": "Linux-5.15.0-88-generic-x86_64-with-glibc2.35",
31
+ "git_sha": "0cf8df44bc95b6408d52e80dc2ef4a758a405a91",
32
+ "git_branch": "rl/main",
33
+ "use_wandb": false
34
+ }
35
+ }