cpt core 4
Browse files
scripts/cpt_core_model_4.py
CHANGED
|
@@ -88,8 +88,10 @@ trainer = UnslothTrainer(
|
|
| 88 |
args = UnslothTrainingArguments(
|
| 89 |
# per_device_train_batch_size=16,
|
| 90 |
# gradient_accumulation_steps=64,
|
| 91 |
-
per_device_train_batch_size=16,
|
| 92 |
-
gradient_accumulation_steps=16,
|
|
|
|
|
|
|
| 93 |
|
| 94 |
warmup_ratio=0,
|
| 95 |
num_train_epochs=1,
|
|
|
|
| 88 |
args = UnslothTrainingArguments(
|
| 89 |
# per_device_train_batch_size=16,
|
| 90 |
# gradient_accumulation_steps=64,
|
| 91 |
+
# per_device_train_batch_size=16,
|
| 92 |
+
# gradient_accumulation_steps=16,
|
| 93 |
+
per_device_train_batch_size=2,
|
| 94 |
+
gradient_accumulation_steps=8,
|
| 95 |
|
| 96 |
warmup_ratio=0,
|
| 97 |
num_train_epochs=1,
|