import torch
import torch.nn as nn
use_cuda = torch.cuda.is_available()
class dw_conv(nn.Module):
# Depthwise convolution, currently slow to train in PyTorch
def __init__(self, in_dim, out_dim, stride):
super(dw_conv, self).__init__()
self.dw_conv_k3 = nn.Conv2d(
in_dim, out_dim, kernel_size=3, stride=stride, groups=in_dim, bias=False)
self.bn = nn.BatchNorm2d(out_dim)
self.relu = nn.ReLU(inplace=True)
def forward(self, x):
x = self.dw_conv_k3(x)
x = self.bn(x)
x = self.relu(x)
return x
class point_conv(nn.Module):
# Pointwise 1 x 1 convolution
def __init__(self, in_dim, out_dim):
super(point_conv, self).__init__()
self.p_conv_k1 = nn.Conv2d(in_dim, out_dim, kernel_size=1, bias=False)
self.bn = nn.BatchNorm2d(out_dim)
self.relu = nn.ReLU(inplace=True)
def forward(self, x):
x = self.p_conv_k1(x)
x = self.bn(x)
x = self.relu(x)
return x
class MobileNets(nn.Module):
def __init__(self, num_classes, large_img):
super(MobileNets, self).__init__()
self.num_classes = num_classes
if large_img:
self.features = nn.Sequential(
nn.Conv2d(3, 32, kernel_size=3, stride=2),
nn.ReLU(inplace=True),
dw_conv(32, 32, 1),
point_conv(32, 64),
dw_conv(64, 64, 2),
point_conv(64, 128),
dw_conv(128, 128, 1),
point_conv(128, 128),
dw_conv(128, 128, 2),
point_conv(128, 256),
dw_conv(256, 256, 1),
point_conv(256, 256),
dw_conv(256, 256, 2),
point_conv(256, 512),
dw_conv(512, 512, 1),
point_conv(512, 512),
dw_conv(512, 512, 1),
point_conv(512, 512),
dw_conv(512, 512, 1),
point_conv(512, 512),
dw_conv(512, 512, 1),
point_conv(512, 512),
dw_conv(512, 512, 1),
point_conv(512, 512),
dw_conv(512, 512, 2),
point_conv(512, 1024),
dw_conv(1024, 1024, 2),
point_conv(1024, 1024),
nn.AvgPool2d(7),
)
else:
self.features = nn.Sequential(
nn.Conv2d(3, 32, kernel_size=3, stride=1),
nn.ReLU(inplace=True),
dw_conv(32, 32, 1),
point_conv(32, 64),
dw_conv(64, 64, 1),
point_conv(64, 128),
dw_conv(128, 128, 1),
point_conv(128, 128),
dw_conv(128, 128, 1),
point_conv(128, 256),
dw_conv(256, 256, 1),
point_conv(256, 256),
dw_conv(256, 256, 1),
point_conv(256, 512),
dw_conv(512, 512, 1),
point_conv(512, 512),
dw_conv(512, 512, 1),
point_conv(512, 512),
dw_conv(512, 512, 1),
point_conv(512, 512),
dw_conv(512, 512, 1),
point_conv(512, 512),
dw_conv(512, 512, 1),
point_conv(512, 512),
dw_conv(512, 512, 1),
point_conv(512, 1024),
dw_conv(1024, 1024, 1),
point_conv(1024, 1024),
nn.AvgPool2d(4),
)
self.fc = nn.Linear(1024, self.num_classes)
def forward(self, x):
x = self.features(x)
x = x.view(-1, 1024)
x = self.fc(x)
return x
def mobilenet(num_classes, large_img, **kwargs):
model = MobileNets(num_classes, large_img, **kwargs)
if use_cuda:
model = model.cuda()
return model
MobileNetV1 = mobilenet(12, False)
print(MobileNetV1)
MobileNets(
(features): Sequential(
(0): Conv2d(3, 32, kernel_size=(3, 3), stride=(1, 1))
(1): ReLU(inplace=True)
(2): dw_conv(
(dw_conv_k3): Conv2d(32, 32, kernel_size=(3, 3), stride=(1, 1), groups=32, bias=False)
(bn): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(3): point_conv(
(p_conv_k1): Conv2d(32, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(4): dw_conv(
(dw_conv_k3): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), groups=64, bias=False)
(bn): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(5): point_conv(
(p_conv_k1): Conv2d(64, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(6): dw_conv(
(dw_conv_k3): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), groups=128, bias=False)
(bn): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(7): point_conv(
(p_conv_k1): Conv2d(128, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(8): dw_conv(
(dw_conv_k3): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), groups=128, bias=False)
(bn): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(9): point_conv(
(p_conv_k1): Conv2d(128, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(10): dw_conv(
(dw_conv_k3): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), groups=256, bias=False)
(bn): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(11): point_conv(
(p_conv_k1): Conv2d(256, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(12): dw_conv(
(dw_conv_k3): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), groups=256, bias=False)
(bn): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(13): point_conv(
(p_conv_k1): Conv2d(256, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(14): dw_conv(
(dw_conv_k3): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), groups=512, bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(15): point_conv(
(p_conv_k1): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(16): dw_conv(
(dw_conv_k3): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), groups=512, bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(17): point_conv(
(p_conv_k1): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(18): dw_conv(
(dw_conv_k3): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), groups=512, bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(19): point_conv(
(p_conv_k1): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(20): dw_conv(
(dw_conv_k3): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), groups=512, bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(21): point_conv(
(p_conv_k1): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(22): dw_conv(
(dw_conv_k3): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), groups=512, bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(23): point_conv(
(p_conv_k1): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(24): dw_conv(
(dw_conv_k3): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), groups=512, bias=False)
(bn): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(25): point_conv(
(p_conv_k1): Conv2d(512, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(26): dw_conv(
(dw_conv_k3): Conv2d(1024, 1024, kernel_size=(3, 3), stride=(1, 1), groups=1024, bias=False)
(bn): BatchNorm2d(1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(27): point_conv(
(p_conv_k1): Conv2d(1024, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)
(bn): BatchNorm2d(1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
(relu): ReLU(inplace=True)
)
(28): AvgPool2d(kernel_size=4, stride=4, padding=0)
)
(fc): Linear(in_features=1024, out_features=12, bias=True)
)