AlgoCore committed on
Commit
2e81e98
·
1 Parent(s): cf0d796

Fix SFTConfig: move max_seq_length + dataset_text_field to SFTTrainer (trl API change)

Browse files
Files changed (1) hide show
  1. train_sft.ipynb +10 -5
train_sft.ipynb CHANGED
@@ -2,8 +2,13 @@
2
  "nbformat": 4,
3
  "nbformat_minor": 0,
4
  "metadata": {
5
- "kernelspec": {"display_name": "Python 3", "name": "python3"},
6
- "language_info": {"name": "python"},
 
 
 
 
 
7
  "accelerator": "GPU"
8
  },
9
  "cells": [
@@ -325,8 +330,6 @@
325
  " eval_steps=50,\n",
326
  " save_strategy='no',\n",
327
  " report_to='none',\n",
328
- " max_seq_length=512,\n",
329
- " dataset_text_field='text',\n",
330
  " dataloader_pin_memory=False,\n",
331
  " ddp_find_unused_parameters=False,\n",
332
  ")\n",
@@ -338,6 +341,8 @@
338
  " eval_dataset=val_ds,\n",
339
  " peft_config=peft_config,\n",
340
  " processing_class=tokenizer,\n",
 
 
341
  ")\n",
342
  "\n",
343
  "print(f'SFTTrainer ready | train={len(train_ds)} val={len(val_ds)}')\n",
@@ -415,4 +420,4 @@
415
  ]
416
  }
417
  ]
418
- }
 
2
  "nbformat": 4,
3
  "nbformat_minor": 0,
4
  "metadata": {
5
+ "kernelspec": {
6
+ "display_name": "Python 3",
7
+ "name": "python3"
8
+ },
9
+ "language_info": {
10
+ "name": "python"
11
+ },
12
  "accelerator": "GPU"
13
  },
14
  "cells": [
 
330
  " eval_steps=50,\n",
331
  " save_strategy='no',\n",
332
  " report_to='none',\n",
 
 
333
  " dataloader_pin_memory=False,\n",
334
  " ddp_find_unused_parameters=False,\n",
335
  ")\n",
 
341
  " eval_dataset=val_ds,\n",
342
  " peft_config=peft_config,\n",
343
  " processing_class=tokenizer,\n",
344
+ " max_seq_length=512,\n",
345
+ " dataset_text_field='text',\n",
346
  ")\n",
347
  "\n",
348
  "print(f'SFTTrainer ready | train={len(train_ds)} val={len(val_ds)}')\n",
 
420
  ]
421
  }
422
  ]
423
+ }