DevanshuDon committed on
Commit
63cf282
·
verified ·
1 Parent(s): 084bf21

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +2 -2
README.md CHANGED
@@ -197,8 +197,8 @@ docker run -p 7860:7860 exec-assist
197
  ```python
198
  GRPOConfig(
199
  learning_rate=1e-6, # critical, 5e-6 caused collapse
200
- per_device_train_batch_size=2,
201
- gradient_accumulation_steps=4,
202
  num_generations=8, # diversity within group
203
  num_train_epochs=3,
204
  beta=0.1, # KL penalty, prevents mode collapse
 
197
  ```python
198
  GRPOConfig(
199
  learning_rate=1e-6, # critical, 5e-6 caused collapse
200
+ per_device_train_batch_size=1,
201
+ gradient_accumulation_steps=8,
202
  num_generations=8, # diversity within group
203
  num_train_epochs=3,
204
  beta=0.1, # KL penalty, prevents mode collapse