Hajime MATSUMOTO committed on
Commit
702c22f
·
1 Parent(s): ce5bcf8

Reduce batch size to avoid OOM on L40S 48GB

Browse files
Files changed (1) hide show
  1. train.py +4 -4
train.py CHANGED
@@ -234,10 +234,10 @@ training_args = TrainingArguments(
234
  num_train_epochs=2,
235
  max_steps=-1, # -1 = エポックベース
236
 
237
- # バッチサイズ (L40S 48GBなら大きく取れる)
238
- per_device_train_batch_size=8,
239
- per_device_eval_batch_size=8,
240
- gradient_accumulation_steps=4, # 有効バッチサイズ: 8*4=32
241
 
242
  # 学習率
243
  learning_rate=1e-4,
 
234
  num_train_epochs=2,
235
  max_steps=-1, # -1 = エポックベース
236
 
237
+ # バッチサイズ (L40S 48GB + 7B QLoRA)
238
+ per_device_train_batch_size=2,
239
+ per_device_eval_batch_size=2,
240
+ gradient_accumulation_steps=16, # 有効バッチサイズ: 2*16=32
241
 
242
  # 学習率
243
  learning_rate=1e-4,