davidquarel commited on
Commit
ef13532
·
verified ·
1 Parent(s): eb1f92b

Upload folder using huggingface_hub

Browse files
al_0.47_g_0.99_seed_106_pa_1/action_logprobs.pth.gz CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9069e34e1868ecd34aa62c095151fa5e3d0a632619a4c30ed539e46858016f88
3
- size 63325170
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19d307f0ef60cbfa0ea935882004892e8413b88112b75177d44b43547e58b926
3
+ size 324318394
al_0.47_g_0.99_seed_106_pa_1/action_probs.tar.gz CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c98a9d744be6c9677a8ed3d3a97522428f3272191a885b099c981e1726b93cf4
3
- size 29047848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be80be8fe2dd8aa2ef07f751fad74e9be0957459cf9df68c60fe2de413004344
3
+ size 35336044
al_0.47_g_0.99_seed_106_pa_1/checkpoints.tar.gz CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c087f3a877ca05e55cace401455d52e4c1f0389e2f016359b869fae4397fe71
3
- size 644711178
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b734c0a9ffbbca92a81a5824ed2b7f4ba9a48ccc0aadd10f9cb8e231ec652332
3
+ size 648775730
al_0.47_g_0.99_seed_106_pa_1/config.cfg CHANGED
@@ -53,6 +53,6 @@ off_distribution_data=False
53
  weight_restrictions=None
54
  weight_restrictions_invert=False
55
  evaluate_every_position=False
56
- use_prev_action=False
57
  num_prev_actions=1
58
  ntfy=david_jaxgmg
 
53
  weight_restrictions=None
54
  weight_restrictions_invert=False
55
  evaluate_every_position=False
56
+ use_prev_action=True
57
  num_prev_actions=1
58
  ntfy=david_jaxgmg
al_0.47_g_0.99_seed_106_pa_1/config.json CHANGED
@@ -51,7 +51,7 @@
51
  "use_bf16": false,
52
  "use_hf": true,
53
  "use_log": true,
54
- "use_prev_action": false,
55
  "use_shuffled_checkpoints": false,
56
  "use_wandb": true,
57
  "wandb_project": "jaxgmg2_3phase_seed",
 
51
  "use_bf16": false,
52
  "use_hf": true,
53
  "use_log": true,
54
+ "use_prev_action": true,
55
  "use_shuffled_checkpoints": false,
56
  "use_wandb": true,
57
  "wandb_project": "jaxgmg2_3phase_seed",
al_0.47_g_0.99_seed_106_pa_1/eval.jsonl CHANGED
The diff for this file is too large to render. See raw diff
 
al_0.47_g_0.99_seed_106_pa_1/eval.log CHANGED
The diff for this file is too large to render. See raw diff
 
al_0.47_g_0.99_seed_106_pa_1/latest_train.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
- "ts": "2026-01-26T19:34:20.975856Z",
3
  "loop": 8137,
4
  "env_steps": 4999987199,
5
- "loss": 0.019173111766576767,
6
- "avg_return": 0.9238110780715942,
7
- "regret": 0.0019405159400776029,
8
- "entropy": 0.11560589075088501,
9
  "lr": 5e-05,
10
  "discount_rate": 0.99,
11
  "num_rollout_steps": 64
 
1
  {
2
+ "ts": "2026-01-26T19:50:34.534160Z",
3
  "loop": 8137,
4
  "env_steps": 4999987199,
5
+ "loss": 0.02855975739657879,
6
+ "avg_return": 0.9214302897453308,
7
+ "regret": 0.0033544208854436874,
8
+ "entropy": 0.14067891240119934,
9
  "lr": 5e-05,
10
  "discount_rate": 0.99,
11
  "num_rollout_steps": 64
al_0.47_g_0.99_seed_106_pa_1/setup.json CHANGED
@@ -55,19 +55,19 @@
55
  "weight_restrictions": null,
56
  "weight_restrictions_invert": false,
57
  "evaluate_every_position": false,
58
- "use_prev_action": false,
59
  "num_prev_actions": 1,
60
  "ntfy": "david_jaxgmg"
61
  },
62
  "setup": {
63
- "start_time_utc": "2026-01-26T17:40:27.316049Z",
64
  "seed": 106,
65
  "device": "cuda",
66
  "python_version": "3.11.11",
67
  "torch_version": "2.10.0+cu128",
68
  "jax_version": "0.6.2",
69
- "hostname": "627114e368a8",
70
- "platform": "Linux-6.8.0-90-generic-x86_64-with-glibc2.35",
71
  "git_sha": null,
72
  "git_branch": null,
73
  "use_wandb": true
 
55
  "weight_restrictions": null,
56
  "weight_restrictions_invert": false,
57
  "evaluate_every_position": false,
58
+ "use_prev_action": true,
59
  "num_prev_actions": 1,
60
  "ntfy": "david_jaxgmg"
61
  },
62
  "setup": {
63
+ "start_time_utc": "2026-01-26T17:56:29.817897Z",
64
  "seed": 106,
65
  "device": "cuda",
66
  "python_version": "3.11.11",
67
  "torch_version": "2.10.0+cu128",
68
  "jax_version": "0.6.2",
69
+ "hostname": "8cd943fb5175",
70
+ "platform": "Linux-6.8.0-87-generic-x86_64-with-glibc2.35",
71
  "git_sha": null,
72
  "git_branch": null,
73
  "use_wandb": true
al_0.47_g_0.99_seed_106_pa_1/setup.txt CHANGED
@@ -1,8 +1,8 @@
1
- Start: 2026-01-26T17:40:27.316049Z
2
  Seed: 106
3
  Device: cuda
4
  Python: 3.11.11 | Torch: 2.10.0+cu128 | JAX: 0.6.2
5
- Host: 627114e368a8
6
- Platform: Linux-6.8.0-90-generic-x86_64-with-glibc2.35
7
  Git: branch=None sha=None
8
  use_wandb: True
 
1
+ Start: 2026-01-26T17:56:29.817897Z
2
  Seed: 106
3
  Device: cuda
4
  Python: 3.11.11 | Torch: 2.10.0+cu128 | JAX: 0.6.2
5
+ Host: 8cd943fb5175
6
+ Platform: Linux-6.8.0-87-generic-x86_64-with-glibc2.35
7
  Git: branch=None sha=None
8
  use_wandb: True
al_0.47_g_0.99_seed_106_pa_1/train.jsonl CHANGED
The diff for this file is too large to render. See raw diff
 
al_0.47_g_0.99_seed_106_pa_1/train.log CHANGED
The diff for this file is too large to render. See raw diff