Spaces:
Running
on
Zero
Running
on
Zero
import torch | |
import torch.nn as nn | |
import torch.nn.functional as F | |
from engine.BiRefNet.config import Config | |
from engine.BiRefNet.models.modules.deform_conv import DeformableConv2d | |
config = Config() | |
class _ASPPModule(nn.Module): | |
def __init__(self, in_channels, planes, kernel_size, padding, dilation): | |
super(_ASPPModule, self).__init__() | |
self.atrous_conv = nn.Conv2d( | |
in_channels, | |
planes, | |
kernel_size=kernel_size, | |
stride=1, | |
padding=padding, | |
dilation=dilation, | |
bias=False, | |
) | |
self.bn = nn.BatchNorm2d(planes) if config.batch_size > 1 else nn.Identity() | |
self.relu = nn.ReLU(inplace=True) | |
def forward(self, x): | |
x = self.atrous_conv(x) | |
x = self.bn(x) | |
return self.relu(x) | |
class ASPP(nn.Module): | |
def __init__(self, in_channels=64, out_channels=None, output_stride=16): | |
super(ASPP, self).__init__() | |
self.down_scale = 1 | |
if out_channels is None: | |
out_channels = in_channels | |
self.in_channelster = 256 // self.down_scale | |
if output_stride == 16: | |
dilations = [1, 6, 12, 18] | |
elif output_stride == 8: | |
dilations = [1, 12, 24, 36] | |
else: | |
raise NotImplementedError | |
self.aspp1 = _ASPPModule( | |
in_channels, self.in_channelster, 1, padding=0, dilation=dilations[0] | |
) | |
self.aspp2 = _ASPPModule( | |
in_channels, | |
self.in_channelster, | |
3, | |
padding=dilations[1], | |
dilation=dilations[1], | |
) | |
self.aspp3 = _ASPPModule( | |
in_channels, | |
self.in_channelster, | |
3, | |
padding=dilations[2], | |
dilation=dilations[2], | |
) | |
self.aspp4 = _ASPPModule( | |
in_channels, | |
self.in_channelster, | |
3, | |
padding=dilations[3], | |
dilation=dilations[3], | |
) | |
self.global_avg_pool = nn.Sequential( | |
nn.AdaptiveAvgPool2d((1, 1)), | |
nn.Conv2d(in_channels, self.in_channelster, 1, stride=1, bias=False), | |
( | |
nn.BatchNorm2d(self.in_channelster) | |
if config.batch_size > 1 | |
else nn.Identity() | |
), | |
nn.ReLU(inplace=True), | |
) | |
self.conv1 = nn.Conv2d(self.in_channelster * 5, out_channels, 1, bias=False) | |
self.bn1 = ( | |
nn.BatchNorm2d(out_channels) if config.batch_size > 1 else nn.Identity() | |
) | |
self.relu = nn.ReLU(inplace=True) | |
self.dropout = nn.Dropout(0.5) | |
def forward(self, x): | |
x1 = self.aspp1(x) | |
x2 = self.aspp2(x) | |
x3 = self.aspp3(x) | |
x4 = self.aspp4(x) | |
x5 = self.global_avg_pool(x) | |
x5 = F.interpolate(x5, size=x1.size()[2:], mode="bilinear", align_corners=True) | |
x = torch.cat((x1, x2, x3, x4, x5), dim=1) | |
x = self.conv1(x) | |
x = self.bn1(x) | |
x = self.relu(x) | |
return self.dropout(x) | |
##################### Deformable | |
class _ASPPModuleDeformable(nn.Module): | |
def __init__(self, in_channels, planes, kernel_size, padding): | |
super(_ASPPModuleDeformable, self).__init__() | |
self.atrous_conv = DeformableConv2d( | |
in_channels, | |
planes, | |
kernel_size=kernel_size, | |
stride=1, | |
padding=padding, | |
bias=False, | |
) | |
self.bn = nn.BatchNorm2d(planes) if config.batch_size > 1 else nn.Identity() | |
self.relu = nn.ReLU(inplace=True) | |
def forward(self, x): | |
x = self.atrous_conv(x) | |
x = self.bn(x) | |
return self.relu(x) | |
class ASPPDeformable(nn.Module): | |
def __init__(self, in_channels, out_channels=None, parallel_block_sizes=[1, 3, 7]): | |
super(ASPPDeformable, self).__init__() | |
self.down_scale = 1 | |
if out_channels is None: | |
out_channels = in_channels | |
self.in_channelster = 256 // self.down_scale | |
self.aspp1 = _ASPPModuleDeformable( | |
in_channels, self.in_channelster, 1, padding=0 | |
) | |
self.aspp_deforms = nn.ModuleList( | |
[ | |
_ASPPModuleDeformable( | |
in_channels, | |
self.in_channelster, | |
conv_size, | |
padding=int(conv_size // 2), | |
) | |
for conv_size in parallel_block_sizes | |
] | |
) | |
self.global_avg_pool = nn.Sequential( | |
nn.AdaptiveAvgPool2d((1, 1)), | |
nn.Conv2d(in_channels, self.in_channelster, 1, stride=1, bias=False), | |
( | |
nn.BatchNorm2d(self.in_channelster) | |
if config.batch_size > 1 | |
else nn.Identity() | |
), | |
nn.ReLU(inplace=True), | |
) | |
self.conv1 = nn.Conv2d( | |
self.in_channelster * (2 + len(self.aspp_deforms)), | |
out_channels, | |
1, | |
bias=False, | |
) | |
self.bn1 = ( | |
nn.BatchNorm2d(out_channels) if config.batch_size > 1 else nn.Identity() | |
) | |
self.relu = nn.ReLU(inplace=True) | |
self.dropout = nn.Dropout(0.5) | |
def forward(self, x): | |
x1 = self.aspp1(x) | |
x_aspp_deforms = [aspp_deform(x) for aspp_deform in self.aspp_deforms] | |
x5 = self.global_avg_pool(x) | |
x5 = F.interpolate(x5, size=x1.size()[2:], mode="bilinear", align_corners=True) | |
x = torch.cat((x1, *x_aspp_deforms, x5), dim=1) | |
x = self.conv1(x) | |
x = self.bn1(x) | |
x = self.relu(x) | |
return self.dropout(x) | |