Spaces:
Sleeping
Sleeping
Commit ·
92cd747
1
Parent(s): b4eb298
update
Browse files
examples/tutorials/by_deepspeed/step_2_train_model.py
CHANGED
|
@@ -129,7 +129,7 @@ def main():
|
|
| 129 |
train_dataset=train_dataset,
|
| 130 |
eval_dataset=None, # Can set up evaluation!
|
| 131 |
args=SFTConfig(
|
| 132 |
-
output_dir=(temp_directory / "Qwen3-8B-sft-deepspeed"),
|
| 133 |
dataset_text_field="formated_text",
|
| 134 |
deepspeed="./ds_config/deepspeed_stage_3_config.json", # 添加deepspeed配置文件
|
| 135 |
per_device_train_batch_size=2,
|
|
|
|
| 129 |
train_dataset=train_dataset,
|
| 130 |
eval_dataset=None, # Can set up evaluation!
|
| 131 |
args=SFTConfig(
|
| 132 |
+
output_dir=(temp_directory / "trainer_output/Qwen3-8B-sft-deepspeed"), # 请替换为你想要的路径
|
| 133 |
dataset_text_field="formated_text",
|
| 134 |
deepspeed="./ds_config/deepspeed_stage_3_config.json", # 添加deepspeed配置文件
|
| 135 |
per_device_train_batch_size=2,
|