miyuki2026 committed on
Commit
d251d39
·
1 Parent(s): 61148f6
examples/tutorials/dpo/ultrafeedback-dpo/step_2_train_dpo_model_single_gpu.py CHANGED
@@ -169,7 +169,7 @@ def main():
169
  warmup_steps=100,
170
  lr_scheduler_type="cosine",
171
  fp16=False,
172
- gradient_checkpointing=False, # 如果内存紧张,可以设为 True
173
  optim="adamw_torch",
174
  report_to="none",
175
  max_length=1024 if debug_mode else 2048, # prompt + chosen 的最大长度
 
169
  warmup_steps=100,
170
  lr_scheduler_type="cosine",
171
  fp16=False,
172
+ gradient_checkpointing=True, # 如果内存紧张,可以设为 True
173
  optim="adamw_torch",
174
  report_to="none",
175
  max_length=1024 if debug_mode else 2048, # prompt + chosen 的最大长度