| | |
| | |
| | |
| | |
| | |
| |
|
| | import torch.nn as nn |
| | import torch |
| |
|
| | num_parallel = 2 |
| |
|
| |
|
| | class TokenExchange(nn.Module): |
| | def __init__(self): |
| | super(TokenExchange, self).__init__() |
| |
|
| | def forward(self, x, mask, mask_threshold): |
| | |
| | x0, x1 = torch.zeros_like(x[0]), torch.zeros_like(x[1]) |
| | x0[mask[0] >= mask_threshold] = x[0][mask[0] >= mask_threshold] |
| | x0[mask[0] < mask_threshold] = x[1][mask[0] < mask_threshold] |
| | x1[mask[1] >= mask_threshold] = x[1][mask[1] >= mask_threshold] |
| | x1[mask[1] < mask_threshold] = x[0][mask[1] < mask_threshold] |
| | return [x0, x1] |
| |
|
| |
|
| | class ModuleParallel(nn.Module): |
| | def __init__(self, module): |
| | super(ModuleParallel, self).__init__() |
| | self.module = module |
| |
|
| | def forward(self, x_parallel): |
| | return [self.module(x) for x in x_parallel] |
| |
|
| |
|
| | class LayerNormParallel(nn.Module): |
| | def __init__(self, num_features): |
| | super(LayerNormParallel, self).__init__() |
| | for i in range(num_parallel): |
| | setattr(self, 'ln_' + str(i), nn.LayerNorm(num_features, eps=1e-6)) |
| |
|
| | def forward(self, x_parallel): |
| | return [getattr(self, 'ln_' + str(i))(x) for i, x in enumerate(x_parallel)] |