Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +4 -0
- adam_first_ep_g75/action_probs.zip +2 -2
- adam_first_ep_g75/checkpoints.zip +2 -2
- adam_first_ep_g75/eval.jsonl +0 -0
- adam_first_ep_g75/eval.log +0 -0
- adam_first_ep_g75/latest_eval.json +1 -1
- adam_first_ep_g75/latest_train.json +2 -2
- adam_first_ep_g75/policy_trace.mp4 +2 -2
- adam_first_ep_g75/setup.json +5 -5
- adam_first_ep_g75/setup.txt +5 -5
- adam_first_ep_g75/train.jsonl +0 -0
- adam_first_ep_g75/train.log +0 -0
- adam_first_ep_g8197/action_probs.zip +1 -1
- adam_first_ep_g8197/checkpoints.zip +1 -1
- adam_first_ep_g9513/action_probs.zip +3 -0
- adam_first_ep_g9513/checkpoints.zip +3 -0
- adam_first_ep_g9513/config.cfg +18 -0
- adam_first_ep_g9513/config.json +20 -0
- adam_first_ep_g9513/eval.jsonl +0 -0
- adam_first_ep_g9513/eval.log +0 -0
- adam_first_ep_g9513/latest_eval.json +9 -0
- adam_first_ep_g9513/latest_train.json +13 -0
- adam_first_ep_g9513/policy_trace.mp4 +3 -0
- adam_first_ep_g9513/setup.json +35 -0
- adam_first_ep_g9513/setup.txt +8 -0
- adam_first_ep_g9513/train.jsonl +0 -0
- adam_first_ep_g9513/train.log +0 -0
- adam_first_ep_g9868/action_probs.zip +3 -0
- adam_first_ep_g9868/checkpoints.zip +3 -0
- adam_first_ep_g9868/config.cfg +18 -0
- adam_first_ep_g9868/config.json +20 -0
- adam_first_ep_g9868/eval.jsonl +0 -0
- adam_first_ep_g9868/eval.log +0 -0
- adam_first_ep_g9868/latest_eval.json +9 -0
- adam_first_ep_g9868/latest_train.json +13 -0
- adam_first_ep_g9868/policy_trace.mp4 +3 -0
- adam_first_ep_g9868/setup.json +35 -0
- adam_first_ep_g9868/setup.txt +8 -0
- adam_first_ep_g9868/train.jsonl +0 -0
- adam_first_ep_g9868/train.log +0 -0
- adam_first_ep_g9964/action_probs.zip +3 -0
- adam_first_ep_g9964/checkpoints.zip +3 -0
- adam_first_ep_g9964/config.cfg +18 -0
- adam_first_ep_g9964/config.json +20 -0
- adam_first_ep_g9964/eval.jsonl +0 -0
- adam_first_ep_g9964/eval.log +0 -0
- adam_first_ep_g9964/latest_eval.json +9 -0
- adam_first_ep_g9964/latest_train.json +13 -0
- adam_first_ep_g9964/policy_trace.mp4 +3 -0
- adam_first_ep_g9964/setup.json +35 -0
.gitattributes
CHANGED
|
@@ -57,3 +57,7 @@ adam_first_ep_g9649/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
|
|
| 57 |
adam_first_ep_g9905/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 58 |
adam_first_ep_g9974/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 59 |
adam_first_ep_g9993/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 57 |
adam_first_ep_g9905/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 58 |
adam_first_ep_g9974/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 59 |
adam_first_ep_g9993/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
adam_first_ep_g9513/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
adam_first_ep_g9868/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
adam_first_ep_g9964/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
adam_first_ep_g999/policy_trace.mp4 filter=lfs diff=lfs merge=lfs -text
|
adam_first_ep_g75/action_probs.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b29a462137df46825beab15a49f00032a68fa45e893140d7937c2f60838711e2
|
| 3 |
+
size 1500852
|
adam_first_ep_g75/checkpoints.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2625e1a7d20e7ead54f1333e829eb081a779134a8ccf096859d195382808dbd9
|
| 3 |
+
size 1547775746
|
adam_first_ep_g75/eval.jsonl
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g75/eval.log
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g75/latest_eval.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"ts": "2025-09-
|
| 3 |
"loop": 32540,
|
| 4 |
"env_steps": 4998144000,
|
| 5 |
"exact_value_avg": 0.1519668698310852,
|
|
|
|
| 1 |
{
|
| 2 |
+
"ts": "2025-09-22T14:27:13.675723Z",
|
| 3 |
"loop": 32540,
|
| 4 |
"env_steps": 4998144000,
|
| 5 |
"exact_value_avg": 0.1519668698310852,
|
adam_first_ep_g75/latest_train.json
CHANGED
|
@@ -1,11 +1,11 @@
|
|
| 1 |
{
|
| 2 |
-
"ts": "2025-09-
|
| 3 |
"loop": 32551,
|
| 4 |
"env_steps": 4999987200,
|
| 5 |
"loss": -0.0,
|
| 6 |
"avg_return": 0.15196684002876282,
|
| 7 |
"regret": 0.0,
|
| 8 |
-
"entropy": 1.
|
| 9 |
"lr": 5e-05,
|
| 10 |
"discount_rate": 0.75,
|
| 11 |
"duplication_factor": 20,
|
|
|
|
| 1 |
{
|
| 2 |
+
"ts": "2025-09-22T14:27:18.241482Z",
|
| 3 |
"loop": 32551,
|
| 4 |
"env_steps": 4999987200,
|
| 5 |
"loss": -0.0,
|
| 6 |
"avg_return": 0.15196684002876282,
|
| 7 |
"regret": 0.0,
|
| 8 |
+
"entropy": 1.3763517436871098e-08,
|
| 9 |
"lr": 5e-05,
|
| 10 |
"discount_rate": 0.75,
|
| 11 |
"duplication_factor": 20,
|
adam_first_ep_g75/policy_trace.mp4
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cdc79281caae9c6fb2361684c81ebbe719376c052c5338d34f0cb95db9e65b6a
|
| 3 |
+
size 263845
|
adam_first_ep_g75/setup.json
CHANGED
|
@@ -20,15 +20,15 @@
|
|
| 20 |
"checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20"
|
| 21 |
},
|
| 22 |
"setup": {
|
| 23 |
-
"start_time_utc": "2025-09-
|
| 24 |
"seed": 42,
|
| 25 |
"device": "cuda",
|
| 26 |
"python_version": "3.11.11",
|
| 27 |
-
"torch_version": "2.
|
| 28 |
"jax_version": "0.6.2",
|
| 29 |
-
"hostname": "
|
| 30 |
-
"platform": "Linux-5.15.0-
|
| 31 |
-
"git_sha": "
|
| 32 |
"git_branch": "rl/main",
|
| 33 |
"use_wandb": false
|
| 34 |
}
|
|
|
|
| 20 |
"checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20"
|
| 21 |
},
|
| 22 |
"setup": {
|
| 23 |
+
"start_time_utc": "2025-09-22T10:50:06.914562Z",
|
| 24 |
"seed": 42,
|
| 25 |
"device": "cuda",
|
| 26 |
"python_version": "3.11.11",
|
| 27 |
+
"torch_version": "2.7.0+cu126",
|
| 28 |
"jax_version": "0.6.2",
|
| 29 |
+
"hostname": "cc99e999c817",
|
| 30 |
+
"platform": "Linux-5.15.0-88-generic-x86_64-with-glibc2.35",
|
| 31 |
+
"git_sha": "0cf8df44bc95b6408d52e80dc2ef4a758a405a91",
|
| 32 |
"git_branch": "rl/main",
|
| 33 |
"use_wandb": false
|
| 34 |
}
|
adam_first_ep_g75/setup.txt
CHANGED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
-
Start: 2025-09-
|
| 2 |
Seed: 42
|
| 3 |
Device: cuda
|
| 4 |
-
Python: 3.11.11 | Torch: 2.
|
| 5 |
-
Host:
|
| 6 |
-
Platform: Linux-5.15.0-
|
| 7 |
-
Git: branch=rl/main sha=
|
| 8 |
use_wandb: False
|
|
|
|
| 1 |
+
Start: 2025-09-22T10:50:06.914562Z
|
| 2 |
Seed: 42
|
| 3 |
Device: cuda
|
| 4 |
+
Python: 3.11.11 | Torch: 2.7.0+cu126 | JAX: 0.6.2
|
| 5 |
+
Host: cc99e999c817
|
| 6 |
+
Platform: Linux-5.15.0-88-generic-x86_64-with-glibc2.35
|
| 7 |
+
Git: branch=rl/main sha=0cf8df44bc95b6408d52e80dc2ef4a758a405a91
|
| 8 |
use_wandb: False
|
adam_first_ep_g75/train.jsonl
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g75/train.log
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g8197/action_probs.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1517192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:618c7f4712c4d4c0a94d310726cc6f66b58c68d52ec2d69b10cdc901d7730e79
|
| 3 |
size 1517192
|
adam_first_ep_g8197/checkpoints.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1547483646
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8cdad3e38dd740e486a5ebc33cf39cd4f949146febb63e156db0039f0a79d4d7
|
| 3 |
size 1547483646
|
adam_first_ep_g9513/action_probs.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aca3dedf6dcfe7a2a1207a0f6e7734b266739dd99d4d7a452b21200da96515a1
|
| 3 |
+
size 1734748
|
adam_first_ep_g9513/checkpoints.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b40fd13f6cf82f2c4267aafdd8a1f25c7b91b12c14311fccef489a75d5899b5
|
| 3 |
+
size 1547420280
|
adam_first_ep_g9513/config.cfg
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
num_rollout_steps=64
|
| 2 |
+
lr=5e-05
|
| 3 |
+
discount_rate=0.9513
|
| 4 |
+
eff_horizon=None
|
| 5 |
+
eval_every=10
|
| 6 |
+
duplication_factor=20
|
| 7 |
+
use_wandb=False
|
| 8 |
+
num_total_env_steps=5000000000
|
| 9 |
+
checkpoint=adam_first_ep_g9513
|
| 10 |
+
num_levels=None
|
| 11 |
+
render_sixel=False
|
| 12 |
+
seed=42
|
| 13 |
+
mask_type=first_episode
|
| 14 |
+
penalize_time=False
|
| 15 |
+
corner_size=1
|
| 16 |
+
optim=adam
|
| 17 |
+
live_monitor=True
|
| 18 |
+
checkpoint_schedule=0:1,250:2,500:5,1000:10,2000:20
|
adam_first_ep_g9513/config.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"checkpoint": "adam_first_ep_g9513",
|
| 3 |
+
"checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20",
|
| 4 |
+
"corner_size": 1,
|
| 5 |
+
"discount_rate": 0.9513,
|
| 6 |
+
"duplication_factor": 20,
|
| 7 |
+
"eff_horizon": null,
|
| 8 |
+
"eval_every": 10,
|
| 9 |
+
"live_monitor": true,
|
| 10 |
+
"lr": 5e-05,
|
| 11 |
+
"mask_type": "first_episode",
|
| 12 |
+
"num_levels": null,
|
| 13 |
+
"num_rollout_steps": 64,
|
| 14 |
+
"num_total_env_steps": 5000000000,
|
| 15 |
+
"optim": "adam",
|
| 16 |
+
"penalize_time": false,
|
| 17 |
+
"render_sixel": false,
|
| 18 |
+
"seed": 42,
|
| 19 |
+
"use_wandb": false
|
| 20 |
+
}
|
adam_first_ep_g9513/eval.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g9513/eval.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g9513/latest_eval.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ts": "2025-09-23T02:04:47.760339Z",
|
| 3 |
+
"loop": 32540,
|
| 4 |
+
"env_steps": 4998144000,
|
| 5 |
+
"exact_value_avg": 0.6508079767227173,
|
| 6 |
+
"regret": 5.960464477539063e-08,
|
| 7 |
+
"exact_optimal_return": 0.6508080363273621,
|
| 8 |
+
"action_probs_image_path": "jaxgmg_ckpt_pt/adam_first_ep_g9513/action_probs/img_32540.png"
|
| 9 |
+
}
|
adam_first_ep_g9513/latest_train.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ts": "2025-09-23T02:04:52.287214Z",
|
| 3 |
+
"loop": 32551,
|
| 4 |
+
"env_steps": 4999987200,
|
| 5 |
+
"loss": 6.763982582924655e-07,
|
| 6 |
+
"avg_return": 0.6508080363273621,
|
| 7 |
+
"regret": 5.960464477539063e-08,
|
| 8 |
+
"entropy": 4.164845449849963e-05,
|
| 9 |
+
"lr": 5e-05,
|
| 10 |
+
"discount_rate": 0.9513,
|
| 11 |
+
"duplication_factor": 20,
|
| 12 |
+
"num_rollout_steps": 64
|
| 13 |
+
}
|
adam_first_ep_g9513/policy_trace.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0f3c7dceb6b3bb7e64dc2c47727d8cd2da3bb563cab3fa1ea5b58189d6f0eb5
|
| 3 |
+
size 323534
|
adam_first_ep_g9513/setup.json
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"config": {
|
| 3 |
+
"num_rollout_steps": 64,
|
| 4 |
+
"lr": 5e-05,
|
| 5 |
+
"discount_rate": 0.9513,
|
| 6 |
+
"eff_horizon": null,
|
| 7 |
+
"eval_every": 10,
|
| 8 |
+
"duplication_factor": 20,
|
| 9 |
+
"use_wandb": false,
|
| 10 |
+
"num_total_env_steps": 5000000000,
|
| 11 |
+
"checkpoint": "adam_first_ep_g9513",
|
| 12 |
+
"num_levels": null,
|
| 13 |
+
"render_sixel": false,
|
| 14 |
+
"seed": 42,
|
| 15 |
+
"mask_type": "first_episode",
|
| 16 |
+
"penalize_time": false,
|
| 17 |
+
"corner_size": 1,
|
| 18 |
+
"optim": "adam",
|
| 19 |
+
"live_monitor": true,
|
| 20 |
+
"checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20"
|
| 21 |
+
},
|
| 22 |
+
"setup": {
|
| 23 |
+
"start_time_utc": "2025-09-22T22:27:03.078571Z",
|
| 24 |
+
"seed": 42,
|
| 25 |
+
"device": "cuda",
|
| 26 |
+
"python_version": "3.11.11",
|
| 27 |
+
"torch_version": "2.7.0+cu126",
|
| 28 |
+
"jax_version": "0.6.2",
|
| 29 |
+
"hostname": "cc99e999c817",
|
| 30 |
+
"platform": "Linux-5.15.0-88-generic-x86_64-with-glibc2.35",
|
| 31 |
+
"git_sha": "0cf8df44bc95b6408d52e80dc2ef4a758a405a91",
|
| 32 |
+
"git_branch": "rl/main",
|
| 33 |
+
"use_wandb": false
|
| 34 |
+
}
|
| 35 |
+
}
|
adam_first_ep_g9513/setup.txt
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Start: 2025-09-22T22:27:03.078571Z
|
| 2 |
+
Seed: 42
|
| 3 |
+
Device: cuda
|
| 4 |
+
Python: 3.11.11 | Torch: 2.7.0+cu126 | JAX: 0.6.2
|
| 5 |
+
Host: cc99e999c817
|
| 6 |
+
Platform: Linux-5.15.0-88-generic-x86_64-with-glibc2.35
|
| 7 |
+
Git: branch=rl/main sha=0cf8df44bc95b6408d52e80dc2ef4a758a405a91
|
| 8 |
+
use_wandb: False
|
adam_first_ep_g9513/train.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g9513/train.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g9868/action_probs.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92322d73f0ed3e29149b6154bd8c4c6c5ba896e52f2b57f853f8cc6f3632a2e7
|
| 3 |
+
size 1574159
|
adam_first_ep_g9868/checkpoints.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c3ae51df9cf7dc49e223e0407396579dbd68ee4842493721d7d552a4aa244a88
|
| 3 |
+
size 1547657682
|
adam_first_ep_g9868/config.cfg
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
num_rollout_steps=64
|
| 2 |
+
lr=5e-05
|
| 3 |
+
discount_rate=0.9868
|
| 4 |
+
eff_horizon=None
|
| 5 |
+
eval_every=10
|
| 6 |
+
duplication_factor=20
|
| 7 |
+
use_wandb=False
|
| 8 |
+
num_total_env_steps=5000000000
|
| 9 |
+
checkpoint=adam_first_ep_g9868
|
| 10 |
+
num_levels=None
|
| 11 |
+
render_sixel=False
|
| 12 |
+
seed=42
|
| 13 |
+
mask_type=first_episode
|
| 14 |
+
penalize_time=False
|
| 15 |
+
corner_size=1
|
| 16 |
+
optim=adam
|
| 17 |
+
live_monitor=True
|
| 18 |
+
checkpoint_schedule=0:1,250:2,500:5,1000:10,2000:20
|
adam_first_ep_g9868/config.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"checkpoint": "adam_first_ep_g9868",
|
| 3 |
+
"checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20",
|
| 4 |
+
"corner_size": 1,
|
| 5 |
+
"discount_rate": 0.9868,
|
| 6 |
+
"duplication_factor": 20,
|
| 7 |
+
"eff_horizon": null,
|
| 8 |
+
"eval_every": 10,
|
| 9 |
+
"live_monitor": true,
|
| 10 |
+
"lr": 5e-05,
|
| 11 |
+
"mask_type": "first_episode",
|
| 12 |
+
"num_levels": null,
|
| 13 |
+
"num_rollout_steps": 64,
|
| 14 |
+
"num_total_env_steps": 5000000000,
|
| 15 |
+
"optim": "adam",
|
| 16 |
+
"penalize_time": false,
|
| 17 |
+
"render_sixel": false,
|
| 18 |
+
"seed": 42,
|
| 19 |
+
"use_wandb": false
|
| 20 |
+
}
|
adam_first_ep_g9868/eval.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g9868/eval.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g9868/latest_eval.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ts": "2025-09-23T05:46:34.424210Z",
|
| 3 |
+
"loop": 32540,
|
| 4 |
+
"env_steps": 4998144000,
|
| 5 |
+
"exact_value_avg": 0.8878134489059448,
|
| 6 |
+
"regret": 0.0,
|
| 7 |
+
"exact_optimal_return": 0.8878134489059448,
|
| 8 |
+
"action_probs_image_path": "jaxgmg_ckpt_pt/adam_first_ep_g9868/action_probs/img_32540.png"
|
| 9 |
+
}
|
adam_first_ep_g9868/latest_train.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ts": "2025-09-23T05:46:38.964333Z",
|
| 3 |
+
"loop": 32551,
|
| 4 |
+
"env_steps": 4999987200,
|
| 5 |
+
"loss": 1.096579563264477e-10,
|
| 6 |
+
"avg_return": 0.8878134489059448,
|
| 7 |
+
"regret": 0.0,
|
| 8 |
+
"entropy": 3.708085216658219e-08,
|
| 9 |
+
"lr": 5e-05,
|
| 10 |
+
"discount_rate": 0.9868,
|
| 11 |
+
"duplication_factor": 20,
|
| 12 |
+
"num_rollout_steps": 64
|
| 13 |
+
}
|
adam_first_ep_g9868/policy_trace.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:460ee0e5281b293de1ed209432b452e128c50ba862988de42593b8e0bd45a6db
|
| 3 |
+
size 301478
|
adam_first_ep_g9868/setup.json
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"config": {
|
| 3 |
+
"num_rollout_steps": 64,
|
| 4 |
+
"lr": 5e-05,
|
| 5 |
+
"discount_rate": 0.9868,
|
| 6 |
+
"eff_horizon": null,
|
| 7 |
+
"eval_every": 10,
|
| 8 |
+
"duplication_factor": 20,
|
| 9 |
+
"use_wandb": false,
|
| 10 |
+
"num_total_env_steps": 5000000000,
|
| 11 |
+
"checkpoint": "adam_first_ep_g9868",
|
| 12 |
+
"num_levels": null,
|
| 13 |
+
"render_sixel": false,
|
| 14 |
+
"seed": 42,
|
| 15 |
+
"mask_type": "first_episode",
|
| 16 |
+
"penalize_time": false,
|
| 17 |
+
"corner_size": 1,
|
| 18 |
+
"optim": "adam",
|
| 19 |
+
"live_monitor": true,
|
| 20 |
+
"checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20"
|
| 21 |
+
},
|
| 22 |
+
"setup": {
|
| 23 |
+
"start_time_utc": "2025-09-23T02:09:04.013196Z",
|
| 24 |
+
"seed": 42,
|
| 25 |
+
"device": "cuda",
|
| 26 |
+
"python_version": "3.11.11",
|
| 27 |
+
"torch_version": "2.7.0+cu126",
|
| 28 |
+
"jax_version": "0.6.2",
|
| 29 |
+
"hostname": "cc99e999c817",
|
| 30 |
+
"platform": "Linux-5.15.0-88-generic-x86_64-with-glibc2.35",
|
| 31 |
+
"git_sha": "0cf8df44bc95b6408d52e80dc2ef4a758a405a91",
|
| 32 |
+
"git_branch": "rl/main",
|
| 33 |
+
"use_wandb": false
|
| 34 |
+
}
|
| 35 |
+
}
|
adam_first_ep_g9868/setup.txt
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Start: 2025-09-23T02:09:04.013196Z
|
| 2 |
+
Seed: 42
|
| 3 |
+
Device: cuda
|
| 4 |
+
Python: 3.11.11 | Torch: 2.7.0+cu126 | JAX: 0.6.2
|
| 5 |
+
Host: cc99e999c817
|
| 6 |
+
Platform: Linux-5.15.0-88-generic-x86_64-with-glibc2.35
|
| 7 |
+
Git: branch=rl/main sha=0cf8df44bc95b6408d52e80dc2ef4a758a405a91
|
| 8 |
+
use_wandb: False
|
adam_first_ep_g9868/train.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g9868/train.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g9964/action_probs.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1d011009d2e8c6a49ebc070b4e1b1bd928adfe94b2b80882c4ba911dc99ba11
|
| 3 |
+
size 1989878
|
adam_first_ep_g9964/checkpoints.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6296ec57625aa728e4b6ab43124511be0de2e005d66232943c09c526071e4d44
|
| 3 |
+
size 1547268470
|
adam_first_ep_g9964/config.cfg
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
num_rollout_steps=64
|
| 2 |
+
lr=5e-05
|
| 3 |
+
discount_rate=0.9964
|
| 4 |
+
eff_horizon=None
|
| 5 |
+
eval_every=10
|
| 6 |
+
duplication_factor=20
|
| 7 |
+
use_wandb=False
|
| 8 |
+
num_total_env_steps=5000000000
|
| 9 |
+
checkpoint=adam_first_ep_g9964
|
| 10 |
+
num_levels=None
|
| 11 |
+
render_sixel=False
|
| 12 |
+
seed=42
|
| 13 |
+
mask_type=first_episode
|
| 14 |
+
penalize_time=False
|
| 15 |
+
corner_size=1
|
| 16 |
+
optim=adam
|
| 17 |
+
live_monitor=True
|
| 18 |
+
checkpoint_schedule=0:1,250:2,500:5,1000:10,2000:20
|
adam_first_ep_g9964/config.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"checkpoint": "adam_first_ep_g9964",
|
| 3 |
+
"checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20",
|
| 4 |
+
"corner_size": 1,
|
| 5 |
+
"discount_rate": 0.9964,
|
| 6 |
+
"duplication_factor": 20,
|
| 7 |
+
"eff_horizon": null,
|
| 8 |
+
"eval_every": 10,
|
| 9 |
+
"live_monitor": true,
|
| 10 |
+
"lr": 5e-05,
|
| 11 |
+
"mask_type": "first_episode",
|
| 12 |
+
"num_levels": null,
|
| 13 |
+
"num_rollout_steps": 64,
|
| 14 |
+
"num_total_env_steps": 5000000000,
|
| 15 |
+
"optim": "adam",
|
| 16 |
+
"penalize_time": false,
|
| 17 |
+
"render_sixel": false,
|
| 18 |
+
"seed": 42,
|
| 19 |
+
"use_wandb": false
|
| 20 |
+
}
|
adam_first_ep_g9964/eval.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g9964/eval.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
adam_first_ep_g9964/latest_eval.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ts": "2025-09-23T09:28:44.224525Z",
|
| 3 |
+
"loop": 32540,
|
| 4 |
+
"env_steps": 4998144000,
|
| 5 |
+
"exact_value_avg": 0.9678743481636047,
|
| 6 |
+
"regret": 1.9073486328125e-05,
|
| 7 |
+
"exact_optimal_return": 0.9678934216499329,
|
| 8 |
+
"action_probs_image_path": "jaxgmg_ckpt_pt/adam_first_ep_g9964/action_probs/img_32540.png"
|
| 9 |
+
}
|
adam_first_ep_g9964/latest_train.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ts": "2025-09-23T09:28:48.788429Z",
|
| 3 |
+
"loop": 32551,
|
| 4 |
+
"env_steps": 4999987200,
|
| 5 |
+
"loss": 0.0012626618845388293,
|
| 6 |
+
"avg_return": 0.967880368232727,
|
| 7 |
+
"regret": 1.9073486328125e-05,
|
| 8 |
+
"entropy": 0.008353522047400475,
|
| 9 |
+
"lr": 5e-05,
|
| 10 |
+
"discount_rate": 0.9964,
|
| 11 |
+
"duplication_factor": 20,
|
| 12 |
+
"num_rollout_steps": 64
|
| 13 |
+
}
|
adam_first_ep_g9964/policy_trace.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8beb4b71b991fb0fe383fae857903794bca5b868081b918e468f7bc32ce4f4e
|
| 3 |
+
size 402139
|
adam_first_ep_g9964/setup.json
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"config": {
|
| 3 |
+
"num_rollout_steps": 64,
|
| 4 |
+
"lr": 5e-05,
|
| 5 |
+
"discount_rate": 0.9964,
|
| 6 |
+
"eff_horizon": null,
|
| 7 |
+
"eval_every": 10,
|
| 8 |
+
"duplication_factor": 20,
|
| 9 |
+
"use_wandb": false,
|
| 10 |
+
"num_total_env_steps": 5000000000,
|
| 11 |
+
"checkpoint": "adam_first_ep_g9964",
|
| 12 |
+
"num_levels": null,
|
| 13 |
+
"render_sixel": false,
|
| 14 |
+
"seed": 42,
|
| 15 |
+
"mask_type": "first_episode",
|
| 16 |
+
"penalize_time": false,
|
| 17 |
+
"corner_size": 1,
|
| 18 |
+
"optim": "adam",
|
| 19 |
+
"live_monitor": true,
|
| 20 |
+
"checkpoint_schedule": "0:1,250:2,500:5,1000:10,2000:20"
|
| 21 |
+
},
|
| 22 |
+
"setup": {
|
| 23 |
+
"start_time_utc": "2025-09-23T05:50:58.197276Z",
|
| 24 |
+
"seed": 42,
|
| 25 |
+
"device": "cuda",
|
| 26 |
+
"python_version": "3.11.11",
|
| 27 |
+
"torch_version": "2.7.0+cu126",
|
| 28 |
+
"jax_version": "0.6.2",
|
| 29 |
+
"hostname": "cc99e999c817",
|
| 30 |
+
"platform": "Linux-5.15.0-88-generic-x86_64-with-glibc2.35",
|
| 31 |
+
"git_sha": "0cf8df44bc95b6408d52e80dc2ef4a758a405a91",
|
| 32 |
+
"git_branch": "rl/main",
|
| 33 |
+
"use_wandb": false
|
| 34 |
+
}
|
| 35 |
+
}
|