thewisp committed on
Commit
fa35ab8
·
verified ·
1 Parent(s): 17a656c

Upload policy weights, train config and readme

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. train_config.json +1 -1
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5f9ec76d2d307d99f70226b59c7cc8980fc5fe71a7f5764c221f920ff2a48f0
3
  size 29083940
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7a6e456bda184efc769a41bbf4a9f33cc63ef34bbb224408dd4dd05f5769278
3
  size 29083940
train_config.json CHANGED
@@ -125,7 +125,7 @@
125
  "VISUAL": "MEAN_STD"
126
  }
127
  },
128
- "output_dir": "outputs/train/2025-10-19/22-50-21_reward-classifier",
129
  "job_name": "reward-classifier",
130
  "resume": false,
131
  "seed": 2,
 
125
  "VISUAL": "MEAN_STD"
126
  }
127
  },
128
+ "output_dir": "outputs/train/2025-11-02/08-55-25_reward-classifier",
129
  "job_name": "reward-classifier",
130
  "resume": false,
131
  "seed": 2,