Spaces:
Runtime error
Runtime error
Update grpo_train.py
Browse files
- grpo_train.py +1 -1
grpo_train.py
CHANGED
|
@@ -344,7 +344,7 @@ trainer = GRPOTrainer(
|
|
| 344 |
logging_steps=5,
|
| 345 |
warmup_ratio=0.1,
|
| 346 |
bf16=True,
|
| 347 |
-
fp16=
|
| 348 |
report_to="none",
|
| 349 |
),
|
| 350 |
train_dataset=dataset,
|
|
|
|
| 344 |
logging_steps=5,
|
| 345 |
warmup_ratio=0.1,
|
| 346 |
bf16=True,
|
| 347 |
+
fp16=False,
|
| 348 |
report_to="none",
|
| 349 |
),
|
| 350 |
train_dataset=dataset,
|