CreatedNull committed on
Commit
3a021d4
·
verified ·
1 Parent(s): 78b4398

Delete train_custommade.py

Browse files
Files changed (1) hide show
  1. train_custommade.py +0 -35
train_custommade.py DELETED
@@ -1,35 +0,0 @@
1
- import json
2
- import torch.nn as nn
3
- import torch
4
- from model import MiniGPT
5
- from dataset import DataLoader,ChatDataset,SimpleTokenizr
6
- from tqdm import tqdm
7
-
8
- with open("./customchatbot-v1/data/merged_data.jsonl", "r", encoding="utf-8") as f:
9
- texts = [json.loads(line)["text"] for line in f if line.strip()]
10
-
11
- tokenizer = SimpleTokenizr()
12
- tokenizer.train(texts)
13
-
14
- model = MiniGPT(vocab_size=100)
15
-
16
- criterion = nn.CrossEntropyLoss()
17
- optimizer = torch.optim.Adam(model.parameters(),lr=0.001)
18
- device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
19
- model.to(device)
20
-
21
- dataset = ChatDataset("./customchatbot-v1/data/merged_data.jsonl", tokenizer)
22
- dataloader = DataLoader(dataset, batch_size=100, shuffle=True)
23
-
24
- def Train(epochs):
25
- for epoch in range(epochs):
26
- model.train()
27
- loop = tqdm(enumerate(dataloader),total=len(dataloader),desc="Training")
28
- tloss = 0
29
- for i,l in loop:
30
- optimizer.zero_grad()
31
- outputs = model(i)
32
- loss = criterion(outputs,l)
33
- loss.backward()
34
-
35
- Train(epochs=1)