tobil committed on
Commit
37174c2
·
verified ·
1 Parent(s): c27b1da

Upload train_grpo.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. train_grpo.py +1 -1
train_grpo.py CHANGED
@@ -270,7 +270,7 @@ def main():
270
  trainer = GRPOTrainer(
271
  model=model,
272
  processing_class=tokenizer,
273
- config=config,
274
  train_dataset=dataset,
275
  reward_funcs=reward_fn,
276
  )
 
270
  trainer = GRPOTrainer(
271
  model=model,
272
  processing_class=tokenizer,
273
+ args=config,
274
  train_dataset=dataset,
275
  reward_funcs=reward_fn,
276
  )