Upload train_grpo.py with huggingface_hub
Browse files
- train_grpo.py +1 -1
train_grpo.py
CHANGED
|
@@ -270,7 +270,7 @@ def main():
|
|
| 270 |
trainer = GRPOTrainer(
|
| 271 |
model=model,
|
| 272 |
processing_class=tokenizer,
|
| 273 |
-
|
| 274 |
train_dataset=dataset,
|
| 275 |
reward_funcs=reward_fn,
|
| 276 |
)
|
|
|
|
| 270 |
trainer = GRPOTrainer(
|
| 271 |
model=model,
|
| 272 |
processing_class=tokenizer,
|
| 273 |
+
args=config,
|
| 274 |
train_dataset=dataset,
|
| 275 |
reward_funcs=reward_fn,
|
| 276 |
)
|