Upload policy weights, train config and readme
Browse files- model.safetensors +1 -1
- train_config.json +1 -1
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 29083940
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7a6e456bda184efc769a41bbf4a9f33cc63ef34bbb224408dd4dd05f5769278
|
| 3 |
size 29083940
|
train_config.json
CHANGED
|
@@ -125,7 +125,7 @@
|
|
| 125 |
"VISUAL": "MEAN_STD"
|
| 126 |
}
|
| 127 |
},
|
| 128 |
-
"output_dir": "outputs/train/2025-
|
| 129 |
"job_name": "reward-classifier",
|
| 130 |
"resume": false,
|
| 131 |
"seed": 2,
|
|
|
|
| 125 |
"VISUAL": "MEAN_STD"
|
| 126 |
}
|
| 127 |
},
|
| 128 |
+
"output_dir": "outputs/train/2025-11-02/08-55-25_reward-classifier",
|
| 129 |
"job_name": "reward-classifier",
|
| 130 |
"resume": false,
|
| 131 |
"seed": 2,
|