Spaces:
Sleeping
Sleeping
Update README.md
Browse files
README.md
CHANGED
|
@@ -197,8 +197,8 @@ docker run -p 7860:7860 exec-assist
|
|
| 197 |
```python
|
| 198 |
GRPOConfig(
|
| 199 |
learning_rate=1e-6, # critical, 5e-6 caused collapse
|
| 200 |
-
per_device_train_batch_size=
|
| 201 |
-
gradient_accumulation_steps=
|
| 202 |
num_generations=8, # diversity within group
|
| 203 |
num_train_epochs=3,
|
| 204 |
beta=0.1, # KL penalty, prevents mode collapse
|
|
|
|
| 197 |
```python
|
| 198 |
GRPOConfig(
|
| 199 |
learning_rate=1e-6, # critical, 5e-6 caused collapse
|
| 200 |
+
per_device_train_batch_size=1,
|
| 201 |
+
gradient_accumulation_steps=8,
|
| 202 |
num_generations=8, # diversity within group
|
| 203 |
num_train_epochs=3,
|
| 204 |
beta=0.1, # KL penalty, prevents mode collapse
|