DetectiveShadow commited on
Commit
bdf2090
·
verified ·
1 Parent(s): 2488672

This is the model trainer

Files changed (1) hide show
  1. train_model.py +42 -0
train_model.py ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from datasets import load_dataset
2
+ from transformers import T5Tokenizer, T5ForConditionalGeneration, Trainer, TrainingArguments
3
+
4
+ # Load your dataset
5
+ dataset = load_dataset("json", data_files="dataset.jsonl")["train"]
6
+
7
+ # Load tokenizer and model
8
+ model_name = "t5-small"
9
+ tokenizer = T5Tokenizer.from_pretrained(model_name)
10
+ model = T5ForConditionalGeneration.from_pretrained(model_name)
11
+
12
+ # Preprocessing
13
+ def tokenize(example):
14
+ input_enc = tokenizer(example["input"], truncation=True, padding="max_length", max_length=64)
15
+ target_enc = tokenizer(example["output"], truncation=True, padding="max_length", max_length=64)
16
+ input_enc["labels"] = target_enc["input_ids"]
17
+ return input_enc
18
+
19
+ tokenized_data = dataset.map(tokenize)
20
+
21
+ # Training arguments
22
+ training_args = TrainingArguments(
23
+ output_dir="./trivia-genie-t5",
24
+ per_device_train_batch_size=8,
25
+ num_train_epochs=3,
26
+ logging_steps=10,
27
+ save_total_limit=2,
28
+ save_strategy="epoch"
29
+ )
30
+
31
+ trainer = Trainer(
32
+ model=model,
33
+ args=training_args,
34
+ train_dataset=tokenized_data,
35
+ )
36
+
37
+ # Train
38
+ trainer.train()
39
+
40
+ # Optional: Push to Hugging Face Hub
41
+ # model.push_to_hub("your-username/trivia-genie-t5")
42
+ # tokenizer.push_to_hub("your-username/trivia-genie-t5")