davidquarel committed on
Commit
f47d4fc
·
verified ·
1 Parent(s): c842500

Delete folder al_1.0_g_0.98_id_26_seed_981026 with huggingface_hub

Browse files
al_1.0_g_0.98_id_26_seed_981026/action_logprobs.pth.gz DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:008d8627a75df610fab9fcc19c1eff149ab3e56f0dcb9aa99460c24527f777b1
3
- size 254670524
 
 
 
 
al_1.0_g_0.98_id_26_seed_981026/action_probs.tar.gz DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:abf07a704faeae0954e6915701b4911befa0fb74e645157ada6b0718b78c52d8
3
- size 168081776
 
 
 
 
al_1.0_g_0.98_id_26_seed_981026/checkpoints.tar.gz DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:4836b15b17644912a1e63e3d5f6657ebb835eb4da22c3f3decb825f16ab0ade1
3
- size 1538936040
 
 
 
 
al_1.0_g_0.98_id_26_seed_981026/config.cfg DELETED
@@ -1,69 +0,0 @@
1
- rl_action=train
2
- num_rollout_steps=64
3
- lr=5e-05
4
- discount_rate=0.98
5
- eff_horizon=None
6
- eval_every=1
7
- use_wandb=True
8
- use_hf=True
9
- use_log=True
10
- log_optimizer_state=True
11
- num_total_env_steps=10000000000
12
- checkpoint=al_1.0_g_0.98_id_26_seed_981026
13
- render_sixel=False
14
- sixel_idx=60
15
- seed=981026
16
- run_id=26
17
- seed_formula={int(discount_rate*100):02d}{int(alpha*10):02d}{run_id:02d}
18
- mask_type=first_episode
19
- penalize_time=False
20
- optim=adam
21
- live_monitor=False
22
- use_bf16=False
23
- deterministic=True
24
- eval_schedule=0:1,250:2,500:5,2000:10
25
- grad_acc_per_chunk=5
26
- num_rollout_chunks=1
27
- cheese_loc=any
28
- env_rule=None
29
- env_layout=open
30
- alpha=1.0
31
- env_size=13
32
- num_levels=9600
33
- f_str_ckpt=al_{alpha}_g_{discount_rate}_id_{run_id}_seed_{seed}
34
- wandb_project=jaxgmg2_3phase_optim_state
35
- ckpt_dir=jaxgmg2_3phase_optim_state
36
- duplication_factor=-1
37
- smoke=False
38
- compile=True
39
- num_chains=6
40
- num_draws=3000
41
- num_steps_bw_draws=1
42
- on_policy=True
43
- llc_nbeta=3000
44
- localization=10
45
- exact_solver_each_draw=False
46
- llc_optimizer=sgld
47
- iw_clip_eps=None
48
- rmsprop_burnin_steps=20
49
- llc_data_file=llc_scan_open_reinforce.pkl
50
- llc_checkpoint_index=None
51
- llc_checkpoint_number=None
52
- sink=None
53
- repo_id=davidquarel/jaxgmg_ckpt_zip
54
- use_shuffled_checkpoints=False
55
- force_re_download=False
56
- off_distribution_data=False
57
- weight_restrictions=None
58
- weight_restrictions_invert=False
59
- evaluate_every_position=False
60
- num_prev_actions=1
61
- ntfy=david_jaxgmg
62
- vis_average_state=False
63
- use_prev_action=False
64
- ckpt_path=jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_26_seed_981026
65
- env_steps_per_loop=614400
66
- total_loops=16276
67
- eff_acc_steps=5
68
- env_steps_per_microbatch=122880
69
- chunk_size=9600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
al_1.0_g_0.98_id_26_seed_981026/config.json DELETED
@@ -1,71 +0,0 @@
1
- {
2
- "alpha": 1.0,
3
- "checkpoint": "al_1.0_g_0.98_id_26_seed_981026",
4
- "cheese_loc": "any",
5
- "chunk_size": 9600,
6
- "ckpt_dir": "jaxgmg2_3phase_optim_state",
7
- "ckpt_path": "jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_26_seed_981026",
8
- "compile": true,
9
- "deterministic": true,
10
- "discount_rate": 0.98,
11
- "duplication_factor": -1,
12
- "eff_acc_steps": 5,
13
- "eff_horizon": null,
14
- "env_layout": "open",
15
- "env_rule": null,
16
- "env_size": 13,
17
- "env_steps_per_loop": 614400,
18
- "env_steps_per_microbatch": 122880,
19
- "eval_every": 1,
20
- "eval_schedule": "0:1,250:2,500:5,2000:10",
21
- "evaluate_every_position": false,
22
- "exact_solver_each_draw": false,
23
- "f_str_ckpt": "al_{alpha}_g_{discount_rate}_id_{run_id}_seed_{seed}",
24
- "force_re_download": false,
25
- "grad_acc_per_chunk": 5,
26
- "iw_clip_eps": null,
27
- "live_monitor": false,
28
- "llc_checkpoint_index": null,
29
- "llc_checkpoint_number": null,
30
- "llc_data_file": "llc_scan_open_reinforce.pkl",
31
- "llc_nbeta": 3000,
32
- "llc_optimizer": "sgld",
33
- "localization": 10,
34
- "log_optimizer_state": true,
35
- "lr": 5e-05,
36
- "mask_type": "first_episode",
37
- "ntfy": "david_jaxgmg",
38
- "num_chains": 6,
39
- "num_draws": 3000,
40
- "num_levels": 9600,
41
- "num_prev_actions": 1,
42
- "num_rollout_chunks": 1,
43
- "num_rollout_steps": 64,
44
- "num_steps_bw_draws": 1,
45
- "num_total_env_steps": 10000000000,
46
- "off_distribution_data": false,
47
- "on_policy": true,
48
- "optim": "adam",
49
- "penalize_time": false,
50
- "render_sixel": false,
51
- "repo_id": "davidquarel/jaxgmg_ckpt_zip",
52
- "rl_action": "train",
53
- "rmsprop_burnin_steps": 20,
54
- "run_id": 26,
55
- "seed": 981026,
56
- "seed_formula": "{int(discount_rate*100):02d}{int(alpha*10):02d}{run_id:02d}",
57
- "sink": null,
58
- "sixel_idx": 60,
59
- "smoke": false,
60
- "total_loops": 16276,
61
- "use_bf16": false,
62
- "use_hf": true,
63
- "use_log": true,
64
- "use_prev_action": false,
65
- "use_shuffled_checkpoints": false,
66
- "use_wandb": true,
67
- "vis_average_state": false,
68
- "wandb_project": "jaxgmg2_3phase_optim_state",
69
- "weight_restrictions": null,
70
- "weight_restrictions_invert": false
71
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
al_1.0_g_0.98_id_26_seed_981026/eval.jsonl DELETED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_26_seed_981026/eval.log DELETED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_26_seed_981026/latest_train.json DELETED
@@ -1,12 +0,0 @@
1
- {
2
- "ts": "2026-02-11T01:55:25.062078Z",
3
- "loop": 16275,
4
- "env_steps": 9999979917,
5
- "loss": 0.01797681301832199,
6
- "avg_return": 0.8826010227203369,
7
- "regret": 5.442580004455522e-05,
8
- "entropy": 0.08681736141443253,
9
- "lr": 5e-05,
10
- "discount_rate": 0.98,
11
- "num_rollout_steps": 64
12
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
al_1.0_g_0.98_id_26_seed_981026/optimizer_state.tar.gz DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:59366206997987b4969ca55126ec72b7963253a2c70fe067a6188f6732a8db2d
3
- size 2780043060
 
 
 
 
al_1.0_g_0.98_id_26_seed_981026/setup.json DELETED
@@ -1,86 +0,0 @@
1
- {
2
- "config": {
3
- "rl_action": "train",
4
- "num_rollout_steps": 64,
5
- "lr": 5e-05,
6
- "discount_rate": 0.98,
7
- "eff_horizon": null,
8
- "eval_every": 1,
9
- "use_wandb": true,
10
- "use_hf": true,
11
- "use_log": true,
12
- "log_optimizer_state": true,
13
- "num_total_env_steps": 10000000000,
14
- "checkpoint": "al_1.0_g_0.98_id_26_seed_981026",
15
- "render_sixel": false,
16
- "sixel_idx": 60,
17
- "seed": 981026,
18
- "run_id": 26,
19
- "seed_formula": "{int(discount_rate*100):02d}{int(alpha*10):02d}{run_id:02d}",
20
- "mask_type": "first_episode",
21
- "penalize_time": false,
22
- "optim": "adam",
23
- "live_monitor": false,
24
- "use_bf16": false,
25
- "deterministic": true,
26
- "eval_schedule": "0:1,250:2,500:5,2000:10",
27
- "grad_acc_per_chunk": 5,
28
- "num_rollout_chunks": 1,
29
- "cheese_loc": "any",
30
- "env_rule": null,
31
- "env_layout": "open",
32
- "alpha": 1.0,
33
- "env_size": 13,
34
- "num_levels": 9600,
35
- "f_str_ckpt": "al_{alpha}_g_{discount_rate}_id_{run_id}_seed_{seed}",
36
- "wandb_project": "jaxgmg2_3phase_optim_state",
37
- "ckpt_dir": "jaxgmg2_3phase_optim_state",
38
- "duplication_factor": -1,
39
- "smoke": false,
40
- "compile": true,
41
- "num_chains": 6,
42
- "num_draws": 3000,
43
- "num_steps_bw_draws": 1,
44
- "on_policy": true,
45
- "llc_nbeta": 3000,
46
- "localization": 10,
47
- "exact_solver_each_draw": false,
48
- "llc_optimizer": "sgld",
49
- "iw_clip_eps": null,
50
- "rmsprop_burnin_steps": 20,
51
- "llc_data_file": "llc_scan_open_reinforce.pkl",
52
- "llc_checkpoint_index": null,
53
- "llc_checkpoint_number": null,
54
- "sink": null,
55
- "repo_id": "davidquarel/jaxgmg_ckpt_zip",
56
- "use_shuffled_checkpoints": false,
57
- "force_re_download": false,
58
- "off_distribution_data": false,
59
- "weight_restrictions": null,
60
- "weight_restrictions_invert": false,
61
- "evaluate_every_position": false,
62
- "num_prev_actions": 1,
63
- "ntfy": "david_jaxgmg",
64
- "vis_average_state": false,
65
- "use_prev_action": false,
66
- "ckpt_path": "jaxgmg2_3phase_optim_state/al_1.0_g_0.98_id_26_seed_981026",
67
- "env_steps_per_loop": 614400,
68
- "total_loops": 16276,
69
- "eff_acc_steps": 5,
70
- "env_steps_per_microbatch": 122880,
71
- "chunk_size": 9600
72
- },
73
- "setup": {
74
- "start_time_utc": "2026-02-10T21:55:56.256399Z",
75
- "seed": 981026,
76
- "device": "cuda",
77
- "python_version": "3.11.11",
78
- "torch_version": "2.10.0+cu128",
79
- "jax_version": "0.6.2",
80
- "hostname": "4ff4d48ec3b4",
81
- "platform": "Linux-5.15.0-156-generic-x86_64-with-glibc2.35",
82
- "git_sha": null,
83
- "git_branch": null,
84
- "use_wandb": true
85
- }
86
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
al_1.0_g_0.98_id_26_seed_981026/setup.txt DELETED
@@ -1,8 +0,0 @@
1
- Start: 2026-02-10T21:55:56.256399Z
2
- Seed: 981026
3
- Device: cuda
4
- Python: 3.11.11 | Torch: 2.10.0+cu128 | JAX: 0.6.2
5
- Host: 4ff4d48ec3b4
6
- Platform: Linux-5.15.0-156-generic-x86_64-with-glibc2.35
7
- Git: branch=None sha=None
8
- use_wandb: True
 
 
 
 
 
 
 
 
 
al_1.0_g_0.98_id_26_seed_981026/train.jsonl DELETED
The diff for this file is too large to render. See raw diff
 
al_1.0_g_0.98_id_26_seed_981026/train.log DELETED
The diff for this file is too large to render. See raw diff