| """ |
| Feature Fusion for Varible-Length Data Processing |
| AFF/iAFF is referred and modified from https://github.com/YimianDai/open-aff/blob/master/aff_pytorch/aff_net/fusion.py |
| According to the paper: Yimian Dai et al, Attentional Feature Fusion, IEEE Winter Conference on Applications of Computer Vision, WACV 2021 |
| """ |
|
|
| import torch |
| import torch.nn as nn |
|
|
|
|
| class DAF(nn.Module): |
| """ |
| 直接相加 DirectAddFuse |
| """ |
|
|
| def __init__(self): |
| super(DAF, self).__init__() |
|
|
| def forward(self, x, residual): |
| return x + residual |
|
|
|
|
| class iAFF(nn.Module): |
| """ |
| 多特征融合 iAFF |
| """ |
|
|
| def __init__(self, channels=64, r=4, type="2D"): |
| super(iAFF, self).__init__() |
| inter_channels = int(channels // r) |
|
|
| if type == "1D": |
| |
| self.local_att = nn.Sequential( |
| nn.Conv1d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv1d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(channels), |
| ) |
|
|
| |
| self.global_att = nn.Sequential( |
| nn.AdaptiveAvgPool1d(1), |
| nn.Conv1d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv1d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(channels), |
| ) |
|
|
| |
| self.local_att2 = nn.Sequential( |
| nn.Conv1d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv1d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(channels), |
| ) |
| |
| self.global_att2 = nn.Sequential( |
| nn.AdaptiveAvgPool1d(1), |
| nn.Conv1d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv1d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(channels), |
| ) |
| elif type == "2D": |
| |
| self.local_att = nn.Sequential( |
| nn.Conv2d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv2d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(channels), |
| ) |
|
|
| |
| self.global_att = nn.Sequential( |
| nn.AdaptiveAvgPool2d(1), |
| nn.Conv2d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv2d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(channels), |
| ) |
|
|
| |
| self.local_att2 = nn.Sequential( |
| nn.Conv2d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv2d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(channels), |
| ) |
| |
| self.global_att2 = nn.Sequential( |
| nn.AdaptiveAvgPool2d(1), |
| nn.Conv2d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv2d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(channels), |
| ) |
| else: |
| raise f"the type is not supported" |
|
|
| self.sigmoid = nn.Sigmoid() |
|
|
| def forward(self, x, residual): |
| flag = False |
| xa = x + residual |
| if xa.size(0) == 1: |
| xa = torch.cat([xa, xa], dim=0) |
| flag = True |
| xl = self.local_att(xa) |
| xg = self.global_att(xa) |
| xlg = xl + xg |
| wei = self.sigmoid(xlg) |
| xi = x * wei + residual * (1 - wei) |
|
|
| xl2 = self.local_att2(xi) |
| xg2 = self.global_att(xi) |
| xlg2 = xl2 + xg2 |
| wei2 = self.sigmoid(xlg2) |
| xo = x * wei2 + residual * (1 - wei2) |
| if flag: |
| xo = xo[0].unsqueeze(0) |
| return xo |
|
|
|
|
| class AFF(nn.Module): |
| """ |
| 多特征融合 AFF |
| """ |
|
|
| def __init__(self, channels=64, r=4, type="2D"): |
| super(AFF, self).__init__() |
| inter_channels = int(channels // r) |
|
|
| if type == "1D": |
| self.local_att = nn.Sequential( |
| nn.Conv1d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv1d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(channels), |
| ) |
| self.global_att = nn.Sequential( |
| nn.AdaptiveAvgPool1d(1), |
| nn.Conv1d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv1d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm1d(channels), |
| ) |
| elif type == "2D": |
| self.local_att = nn.Sequential( |
| nn.Conv2d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv2d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(channels), |
| ) |
| self.global_att = nn.Sequential( |
| nn.AdaptiveAvgPool2d(1), |
| nn.Conv2d(channels, inter_channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(inter_channels), |
| nn.ReLU(inplace=True), |
| nn.Conv2d(inter_channels, channels, kernel_size=1, stride=1, padding=0), |
| nn.BatchNorm2d(channels), |
| ) |
| else: |
| raise f"the type is not supported." |
|
|
| self.sigmoid = nn.Sigmoid() |
|
|
| def forward(self, x, residual): |
| flag = False |
| xa = x + residual |
| if xa.size(0) == 1: |
| xa = torch.cat([xa, xa], dim=0) |
| flag = True |
| xl = self.local_att(xa) |
| xg = self.global_att(xa) |
| xlg = xl + xg |
| wei = self.sigmoid(xlg) |
| xo = 2 * x * wei + 2 * residual * (1 - wei) |
| if flag: |
| xo = xo[0].unsqueeze(0) |
| return xo |
|
|