Update app.py: set per_device_train_batch_size and gradient_accumulation_steps to 6; remove max_steps=313
Browse files
app.py
CHANGED
|
@@ -110,14 +110,13 @@ trainer = SFTTrainer(
|
|
| 110 |
dataset_num_proc=2,
|
| 111 |
packing=False,
|
| 112 |
args=TrainingArguments(
|
| 113 |
-
per_device_train_batch_size=
|
| 114 |
-
gradient_accumulation_steps=
|
| 115 |
learning_rate=2e-4,
|
| 116 |
fp16=not is_bfloat16_supported(),
|
| 117 |
bf16=is_bfloat16_supported(),
|
| 118 |
warmup_steps=5,
|
| 119 |
logging_steps=10,
|
| 120 |
-
max_steps=313,
|
| 121 |
optim="adamw_8bit",
|
| 122 |
weight_decay=0.01,
|
| 123 |
lr_scheduler_type="linear",
|
|
|
|
| 110 |
dataset_num_proc=2,
|
| 111 |
packing=False,
|
| 112 |
args=TrainingArguments(
|
| 113 |
+
per_device_train_batch_size=6,
|
| 114 |
+
gradient_accumulation_steps=6,
|
| 115 |
learning_rate=2e-4,
|
| 116 |
fp16=not is_bfloat16_supported(),
|
| 117 |
bf16=is_bfloat16_supported(),
|
| 118 |
warmup_steps=5,
|
| 119 |
logging_steps=10,
|
|
|
|
| 120 |
optim="adamw_8bit",
|
| 121 |
weight_decay=0.01,
|
| 122 |
lr_scheduler_type="linear",
|