pgps-demo / model /module /attention.py
asdfasdfdsafdsa's picture
Initial upload of PGPS demo with all dependencies
383bfb8 verified
import torch
import torch.nn as nn
class Score(nn.Module):
def __init__(self, input_size, hidden_size):
super(Score, self).__init__()
self.attn = nn.Linear(hidden_size + input_size, hidden_size)
self.score = nn.Linear(hidden_size, 1, bias=False)
def forward(self, hidden, candi_embeddings, candi_mask=None):
'''
Arguments:
hidden: B x 1 x 2H
candi_embeddings: B x candi_size x H
candi_mask: B x candi_size
Return:
score: B x candi_size
'''
hidden = hidden.repeat(1, candi_embeddings.size(1), 1) # B x candi_size x H
# For each position of encoder outputs
energy_in = torch.cat((hidden, candi_embeddings), 2) # B x candi_size x 3H
score = self.score(torch.tanh(self.attn(energy_in))).squeeze(-1) # B x candi_size
if candi_mask is not None:
score = score.masked_fill_(~candi_mask, -1e12)
return score
class Attn(nn.Module):
def __init__(self, input_size, hidden_size):
super(Attn, self).__init__()
self.attn = nn.Linear(hidden_size + input_size, hidden_size)
self.score = nn.Linear(hidden_size, 1, bias=False)
def forward(self, hidden, encoder_outputs, seq_mask=None):
'''
Arguments:
hidden: B x 1 x H (q)
encoder_outputs: B x S x H
seq_mask: B x S
Return:
attn_energies: B x S
'''
hidden = hidden.repeat(1, encoder_outputs.size(1), 1) # B x S x H
energy_in = torch.cat((hidden, encoder_outputs), 2) # B x S x 2H
score_feature = torch.tanh(self.attn(energy_in)) # B x S x H
attn_energies = self.score(score_feature).squeeze(-1) # B x S
if seq_mask is not None:
attn_energies = attn_energies.masked_fill_(~seq_mask, -1e12)
attn_energies = nn.functional.softmax(attn_energies, dim=1) # B x S
return attn_energies
class Score_Multi(nn.Module):
def __init__(self, input_size, hidden_size):
super(Score_Multi, self).__init__()
self.attn = nn.Linear(hidden_size + input_size, hidden_size)
self.score = nn.Linear(hidden_size, 1, bias=False)
def forward(self, hidden, candi_embeddings, candi_mask=None):
'''
Arguments:
hidden: B x S x H
candi_embeddings: B x candi_size x H
candi_mask: B x candi_size
Return:
score: B x S x candi_size
'''
hidden = hidden.unsqueeze(2).repeat(1, 1, candi_embeddings.size(1), 1) # B x S x candi_size x H
candi_embeddings = candi_embeddings.unsqueeze(1).repeat(1, hidden.size(1), 1, 1) # B x S x candi_size x H
candi_mask = candi_mask.unsqueeze(1).repeat(1, hidden.size(1), 1) # B x S x candi_size
energy_in = torch.cat((hidden, candi_embeddings), -1) # B x S x candi_size x 2H
score = self.score(torch.tanh(self.attn(energy_in))).squeeze(-1) # B x S x candi_size
if candi_mask is not None:
score = score.masked_fill_(~candi_mask, -1e12)
return score