jljiu committed on
Commit
0e718d9
·
verified ·
1 Parent(s): 73aa68f

Create train_model.py

Browse files
Files changed (1) hide show
  1. train_model.py +31 -0
train_model.py ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
"""Fine-tune a pretrained sequence-classification model on a saved dataset.

The script loads the model and tokenizer named by ``model_name``, tokenizes
the dataset stored at ``models/processed_dataset``, and trains on its
``"train"`` split with the Hugging Face ``Trainer``. Checkpoints are written
under ``models/finetuned_model``.
"""

from transformers import AutoModelForSequenceClassification, AutoTokenizer
from transformers import TrainingArguments, Trainer
import datasets


# Hub repository ids cannot contain spaces; use the hyphenated id so that
# ``from_pretrained`` can resolve the checkpoint.
model_name = "CohereForAI/c4ai-command-r-plus-08-2024"
model = AutoModelForSequenceClassification.from_pretrained(model_name)
tokenizer = AutoTokenizer.from_pretrained(model_name)


def preprocess_function(examples):
    """Tokenize the ``"text"`` field of a batch of examples.

    Args:
        examples: A batch from ``dataset.map(..., batched=True)``; only its
            ``"text"`` entry is read here.

    Returns:
        Whatever the module-level ``tokenizer`` returns for that text, with
        padding to ``"max_length"`` and truncation enabled.
    """
    # NOTE(review): no explicit ``max_length`` is passed, so the padded
    # length depends on the tokenizer's own configuration -- confirm it is
    # a sensible size for this model before training.
    return tokenizer(examples["text"], padding="max_length", truncation=True)


# The dataset must already exist on disk (saved with ``save_to_disk``) and
# expose a "train" split with a "text" column.
# NOTE(review): presumably it also carries a label column for the
# classification loss -- verify against the preprocessing step.
dataset = datasets.load_from_disk('models/processed_dataset')
tokenized_dataset = dataset.map(preprocess_function, batched=True)

training_args = TrainingArguments(
    output_dir="models/finetuned_model",
    num_train_epochs=3,
    per_device_train_batch_size=8,
    save_steps=1000,  # write a checkpoint every 1000 optimizer steps
    save_total_limit=2  # keep only the two most recent checkpoints
)

trainer = Trainer(
    model=model,
    args=training_args,
    train_dataset=tokenized_dataset["train"]
)
trainer.train()