miyuki2026 committed on
Commit
61148f6
·
1 Parent(s): 51c46da
examples/tutorials/dpo/ultrafeedback-dpo/step_2_train_dpo_model_single_gpu.py CHANGED
@@ -168,7 +168,7 @@ def main():
168
  learning_rate=2e-5,
169
  warmup_steps=100,
170
  lr_scheduler_type="cosine",
171
- fp16=True if torch.cuda.is_available() else False,
172
  gradient_checkpointing=False, # 如果内存紧张,可以设为 True
173
  optim="adamw_torch",
174
  report_to="none",
 
168
  learning_rate=2e-5,
169
  warmup_steps=100,
170
  lr_scheduler_type="cosine",
171
+ fp16=False,
172
  gradient_checkpointing=False, # 如果内存紧张,可以设为 True
173
  optim="adamw_torch",
174
  report_to="none",