tizzymouse committed on
Commit
4e056e4
·
verified ·
1 Parent(s): ce2b52c

Upload policy weights, train config and readme

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. train_config.json +5 -5
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:546c534d7dd63e3f0f381b61719a1aa7a27700bc9c9e4f8c0659ef57f873a7d0
3
  size 33810140
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e71da8750f56e836fcb6fa95086255173adbc540370baabf82a7d4acbe43759
3
  size 33810140
train_config.json CHANGED
@@ -141,7 +141,7 @@
141
  "VISUAL": "MEAN_STD"
142
  }
143
  },
144
- "output_dir": "outputs/train/2025-10-23/13-56-12_hil-serl2-reward-classifier",
145
  "job_name": "hil-serl2-reward-classifier",
146
  "resume": false,
147
  "seed": 2,
@@ -171,13 +171,13 @@
171
  "use_async_envs": false
172
  },
173
  "wandb": {
174
- "enable": false,
175
  "disable_artifact": false,
176
  "project": "hil-serl2-reward-classifier",
177
  "entity": null,
178
- "notes": null,
179
- "run_id": null,
180
- "mode": null
181
  },
182
  "checkpoint_path": null
183
  }
 
141
  "VISUAL": "MEAN_STD"
142
  }
143
  },
144
+ "output_dir": "outputs/train/2025-10-23/14-40-04_hil-serl2-reward-classifier",
145
  "job_name": "hil-serl2-reward-classifier",
146
  "resume": false,
147
  "seed": 2,
 
171
  "use_async_envs": false
172
  },
173
  "wandb": {
174
+ "enable": true,
175
  "disable_artifact": false,
176
  "project": "hil-serl2-reward-classifier",
177
  "entity": null,
178
+ "notes": "Reward classifier training (hil-serl2)",
179
+ "run_id": "ounj4wu6",
180
+ "mode": "online"
181
  },
182
  "checkpoint_path": null
183
  }