File size: 4,336 Bytes
4e188a6 5bf6359 4e188a6 5bf6359 4e188a6 5bf6359 4e188a6 5bf6359 4e188a6 5bf6359 4e188a6 5bf6359 4e188a6 5bf6359 4e188a6 5bf6359 4e188a6 5bf6359 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 |
import torch
import torch.nn as nn
import math
#from transformers import AutoModelForCausalLM, AutoTokenizer
class LSTM(nn.Module):
def _init_(self, input_size, lstm_layer_sizes,linear_layer_size, output_size):
super(LSTM, self)._init_()
self.input_size = input_size
self.linear_layer_size = linear_layer_size
self.lstm_layer_1 = nn.LSTM(input_size, lstm_layer_sizes[0], batch_first=True)
self.lstm_layer_2 = nn.LSTM(lstm_layer_sizes[0], lstm_layer_sizes[1], batch_first=True)
self.lstm_layer_3 = nn.LSTM(lstm_layer_sizes[1], lstm_layer_sizes[2], batch_first=True)
self.fc = Linear(lstm_layer_sizes[2], self.linear_layer_size,output_size)
self.apply(self.initialize_weights)
def forward(self, x):
out, (hn_1, cn_1) = self.lstm_layer_1(x)
out, (hn_2, cn_2) = self.lstm_layer_2(out)
out, (hn_3, cn_3) = self.lstm_layer_3(out)
out = hn_3[-1]
out = self.fc(out)
return out
def initialize_weights(self, layer):
if isinstance(layer, nn.Linear):
nn.init.xavier_uniform_(layer.weight)
nn.init.zeros_(layer.bias)
elif isinstance(layer, nn.LSTM):
for name, param in layer.named_parameters():
if 'weight' in name:
nn.init.xavier_uniform_(param.data)
elif 'bias' in name:
nn.init.zeros_(param.data)
class Linear(nn.Module):
def _init_(self,input_size,hidden_sizes,output_size):
super(Linear,self)._init_()
self.relu =nn.ReLU()
self.sigmoid =nn.Sigmoid()
self.tanh = nn.Tanh()
self.input = nn.Linear(input_size,hidden_sizes[0])
self.fc = nn.Linear(hidden_sizes[0],hidden_sizes[1])
self.output = nn.Linear(hidden_sizes[1],output_size)
self.apply(self.initialize_weights)
def forward(self,x):
out = self.relu(self.input(x))
out = self.relu(self.fc(out))
out = self.relu(self.output(out))
return out
def initialize_weights(self, layer):
if isinstance(layer, nn.Linear):
nn.init.xavier_uniform_(layer.weight)
nn.init.zeros_(layer.bias)
class LUCLSTM(nn.Module):
def _init_(self, input_size, lstm_layer_sizes, output_size):
super(LUCLSTM, self)._init_()
self.input_size = input_size
self.lstm_layer_1 = nn.LSTM(input_size, lstm_layer_sizes[0], batch_first=True)
self.lstm_layer_2 = nn.LSTM(lstm_layer_sizes[0], lstm_layer_sizes[1], batch_first=True)
self.lstm_layer_3 = nn.LSTM(lstm_layer_sizes[1], lstm_layer_sizes[2], batch_first=True)
self.fc = nn.Linear(lstm_layer_sizes[2],64)
self.fc2 = nn.Linear(64,output_size)
self.tanh = nn.Tanh()
self.relu =nn.ReLU()
self.apply(self.initialize_weights)
def forward(self, x):
out, (hn_1, cn_1) = self.lstm_layer_1(x)
out, (hn_2, cn_2) = self.lstm_layer_2(out)
out, (hn_3, cn_3) = self.lstm_layer_3(out)
out = hn_3[-1]
out = self.tanh(self.fc(out))
out = self.fc2(out)
return out
def initialize_weights(self, layer):
if isinstance(layer, nn.Linear):
nn.init.xavier_uniform_(layer.weight)
nn.init.zeros_(layer.bias)
elif isinstance(layer, nn.LSTM):
for name, param in layer.named_parameters():
if 'weight' in name:
nn.init.xavier_uniform_(param.data)
elif 'bias' in name:
nn.init.zeros_(param.data)
class PositionalEncoding(nn.Module):
def _init_(self, dim, max_len=300):
super(PositionalEncoding, self)._init_()
pe = torch.zeros(max_len, dim)
position = torch.arange(0, max_len, dtype=torch.float).unsqueeze(1)
div_term = torch.exp(torch.arange(0, dim, 2).float() * (-math.log(10000.0) / dim))
pe[:, 0::2] = torch.sin(position * div_term)
pe[:, 1::2] = torch.cos(position * div_term)
pe = pe.unsqueeze(0).transpose(0, 1)
self.register_buffer('pe', pe)
def forward(self, x):
return x + self.pe[:x.size(0), :]
class Transformer(nn.Module):
def _init_(self):
super(Transformer,self)._init_() |