Upload train_infrastructure_model.py with huggingface_hub
Browse files
train_infrastructure_model.py
CHANGED
|
@@ -112,6 +112,7 @@ training_args = SFTConfig(
  112      per_device_eval_batch_size=4,
  113      gradient_accumulation_steps=4,
  114      gradient_checkpointing=True,
  115
  116      # Optimization
  117      learning_rate=2e-4,
@@ -145,6 +146,8 @@ training_args = SFTConfig(
  145
  146      # Misc
  147      seed=42,
  148  )
  149
  150  # Initialize trainer
@@ -155,9 +158,6 @@ trainer = SFTTrainer(
  155      eval_dataset=eval_dataset,
  156      peft_config=peft_config,
  157      args=training_args,
- 158      max_seq_length=2048,
- 159      dataset_text_field="text",
- 160      packing=False,
  161  )
  162
  163  # Train
  112      per_device_eval_batch_size=4,
  113      gradient_accumulation_steps=4,
  114      gradient_checkpointing=True,
+ 115      max_seq_length=2048,
  116
  117      # Optimization
  118      learning_rate=2e-4,
  146
  147      # Misc
  148      seed=42,
+ 149      dataset_text_field="text",
+ 150      packing=False,
  151  )
  152
  153  # Initialize trainer
  158      eval_dataset=eval_dataset,
  159      peft_config=peft_config,
  160      args=training_args,
  161  )
  162
  163  # Train