rishikasrinivas committed on
Commit
5661ef4
·
verified ·
1 Parent(s): 5cb8df3

Create model.py

Browse files
Files changed (1) hide show
  1. model.py +34 -0
model.py ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+
3
+ from transformers import BertForSequenceClassification, BertTokenizer, DataCollatorForTokenClassification
4
+ import numpy as np
5
+ device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")
6
+
7
class BERT():
    """Bundle a pre-trained BERT sequence classifier with its tokenizer.

    Attributes are populated in ``__init__``:
        num_classes: width of the classification head.
        device: ``cuda`` when available, otherwise ``cpu``.
        model: ``BertForSequenceClassification`` placed on ``device``.
        tokenizer: ``BertTokenizer`` for ``bert-base-uncased``.
        data_collator: collator built from the tokenizer.
    """

    def __init__(self, num_classes=13):
        """Load ``bert-base-uncased`` with a ``num_classes``-way output head.

        Args:
            num_classes: Number of output labels. Defaults to 13, the value
                that was previously hard-coded.
        """
        self.num_classes = num_classes
        self.device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")

        # Load pre-trained model and tokenizer.
        # Passing ``num_labels`` lets the library build the classification
        # head at the requested width AND record it in the model config, so
        # the built-in loss agrees with the logits. The head is created before
        # ``.to(...)``, so it lands on the same device as the encoder (the
        # previous code attached a fresh CPU-resident Linear layer after the
        # model had already been moved).
        self.model = BertForSequenceClassification.from_pretrained(
            "bert-base-uncased",
            num_labels=self.num_classes,
        ).to(self.device)
        self.tokenizer = BertTokenizer.from_pretrained("bert-base-uncased")

        # NOTE(review): this collator targets token-level labels while the
        # model is a sequence classifier -- confirm it is the intended one
        # (DataCollatorWithPadding may be what callers need).
        self.data_collator = DataCollatorForTokenClassification(self.tokenizer)

    def getModel(self):
        """Return the wrapped classification model."""
        return self.model

    def get_tokenizer(self):
        """Return the tokenizer paired with the model."""
        return self.tokenizer

    def tokenize(self, txt):
        """Tokenize ``txt`` and return the encoding as PyTorch tensors.

        The tokenizer is called with ``return_tensors='pt'``; the result is
        returned as-is and is not moved to ``self.device``.
        """
        return self.tokenizer(txt, return_tensors='pt')
31
+
32
+
33
+
34
+