Spaces: Sleeping
Fix SFTConfig: move max_seq_length + dataset_text_field to SFTTrainer (trl API change)
Browse files
- train_sft.ipynb +10 -5
train_sft.ipynb
CHANGED
|
@@ -2,8 +2,13 @@
|
|
| 2 |
"nbformat": 4,
|
| 3 |
"nbformat_minor": 0,
|
| 4 |
"metadata": {
|
| 5 |
-
"kernelspec": {
|
| 6 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 7 |
"accelerator": "GPU"
|
| 8 |
},
|
| 9 |
"cells": [
|
|
@@ -325,8 +330,6 @@
|
|
| 325 |
" eval_steps=50,\n",
|
| 326 |
" save_strategy='no',\n",
|
| 327 |
" report_to='none',\n",
|
| 328 |
-
" max_seq_length=512,\n",
|
| 329 |
-
" dataset_text_field='text',\n",
|
| 330 |
" dataloader_pin_memory=False,\n",
|
| 331 |
" ddp_find_unused_parameters=False,\n",
|
| 332 |
")\n",
|
|
@@ -338,6 +341,8 @@
|
|
| 338 |
" eval_dataset=val_ds,\n",
|
| 339 |
" peft_config=peft_config,\n",
|
| 340 |
" processing_class=tokenizer,\n",
|
|
|
|
|
|
|
| 341 |
")\n",
|
| 342 |
"\n",
|
| 343 |
"print(f'SFTTrainer ready | train={len(train_ds)} val={len(val_ds)}')\n",
|
|
@@ -415,4 +420,4 @@
|
|
| 415 |
]
|
| 416 |
}
|
| 417 |
]
|
| 418 |
-
}
|
|
|
|
| 2 |
"nbformat": 4,
|
| 3 |
"nbformat_minor": 0,
|
| 4 |
"metadata": {
|
| 5 |
+
"kernelspec": {
|
| 6 |
+
"display_name": "Python 3",
|
| 7 |
+
"name": "python3"
|
| 8 |
+
},
|
| 9 |
+
"language_info": {
|
| 10 |
+
"name": "python"
|
| 11 |
+
},
|
| 12 |
"accelerator": "GPU"
|
| 13 |
},
|
| 14 |
"cells": [
|
|
|
|
| 330 |
" eval_steps=50,\n",
|
| 331 |
" save_strategy='no',\n",
|
| 332 |
" report_to='none',\n",
|
|
|
|
|
|
|
| 333 |
" dataloader_pin_memory=False,\n",
|
| 334 |
" ddp_find_unused_parameters=False,\n",
|
| 335 |
")\n",
|
|
|
|
| 341 |
" eval_dataset=val_ds,\n",
|
| 342 |
" peft_config=peft_config,\n",
|
| 343 |
" processing_class=tokenizer,\n",
|
| 344 |
+
" max_seq_length=512,\n",
|
| 345 |
+
" dataset_text_field='text',\n",
|
| 346 |
")\n",
|
| 347 |
"\n",
|
| 348 |
"print(f'SFTTrainer ready | train={len(train_ds)} val={len(val_ds)}')\n",
|
|
|
|
| 420 |
]
|
| 421 |
}
|
| 422 |
]
|
| 423 |
+
}
|