The code is attached below:
import torch.nn as nn
import torch
class AlexNet(nn.Module):
    def __init__(self, num_classes=1000, init_weights=True):
        super(AlexNet, self).__init__()
        self.features = nn.Sequential(
            nn.Conv2d(3, 48, kernel_size=11, stride=4, padding=2),  # input[3, 224, 224]  output[48, 55, 55]
            nn.ReLU(inplace=True),
            nn.MaxPool2d(kernel_size=3, stride=2),                  # output[48, 27, 27]
            nn.Conv2d(48, 128, kernel_size=5, padding=2),           # output[128, 27, 27]
            nn.ReLU(inplace=True),
            nn.MaxPool2d(kernel_size=3, stride=2),                  # output[128, 13, 13]
            nn.Conv2d(128, 192, kernel_size=3, padding=1),          # output[192, 13, 13]
            nn.ReLU(inplace=True),
            nn.Conv2d(192, 192, kernel_size=3, padding=1),          # output[192, 13, 13]
            nn.ReLU(inplace=True),
            nn.Conv2d(192, 128, kernel_size=3, padding=1),          # output[128, 13, 13]
            nn.ReLU(inplace=True),
            nn.MaxPool2d(kernel_size=3, stride=2),                  # output[128, 6, 6]
        )
        self.classifier = nn.Sequential(
            nn.Dropout(p=0.5),
            nn.Linear(128 * 6 * 6, 2048),
            nn.ReLU(inplace=True),
            nn.Dropout(p=0.5),
            nn.Linear(2048, 2048),
            nn.ReLU(inplace=True),
            nn.Linear(2048, num_classes),
        )
        if init_weights:
            self._initialize_weights()
    def forward(self, x):
        x = self.features(x)
        # flatten starting from dim 1, i.e. from the channel dim, because PyTorch tensors are ordered [batch, channel, height, width]
        x = torch.flatten(x, start_dim=1)
        x = self.classifier(x)
        return x
    def _initialize_weights(self):
        for m in self.modules():  # self.modules() is inherited from nn.Module and iterates over every module in the network
            if isinstance(m, nn.Conv2d):  # check whether the module m visited by self.modules() is an nn.Conv2d
                # if so, initialize the conv weights m.weight with the kaiming_normal_ initialization method
                nn.init.kaiming_normal_(m.weight, mode='fan_out', nonlinearity='relu')
                if m.bias is not None:  # if the bias is not None
                    nn.init.constant_(m.bias, 0)  # initialize it to 0
            elif isinstance(m, nn.Linear):  # if m is a fully connected layer
                # initialize with normal_ (normal distribution), with mean 0 and standard deviation 0.01
                nn.init.normal_(m.weight, 0, 0.01)
                nn.init.constant_(m.bias, 0)  # initialize the bias to 0
# import torch
# input1=torch.rand([32,3,224,224])
# model=AlexNet()
# print(model)
# output=model(input1)
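For reference, the feature-map sizes noted in the comments all follow the standard convolution/pooling size formula out = (in - kernel + 2*padding) / stride + 1, rounded down. The small sketch below is not part of the original code; the helper name out_size is just an illustrative choice, but it reproduces the 224 -> 55 -> 27 -> 13 -> 6 trace of the features stack:

# Minimal sketch: recompute the spatial sizes listed in the comments above.
def out_size(in_size, kernel, stride=1, padding=0):
    return (in_size - kernel + 2 * padding) // stride + 1

s = 224
s = out_size(s, 11, stride=4, padding=2)  # conv1 -> 55
s = out_size(s, 3, stride=2)              # maxpool1 -> 27
s = out_size(s, 5, padding=2)             # conv2 -> 27
s = out_size(s, 3, stride=2)              # maxpool2 -> 13
s = out_size(s, 3, padding=1)             # conv3 -> 13
s = out_size(s, 3, padding=1)             # conv4 -> 13
s = out_size(s, 3, padding=1)             # conv5 -> 13
s = out_size(s, 3, stride=2)              # maxpool3 -> 6
print(s)  # 6, matching the 128 * 6 * 6 input size of the first Linear layer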
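The commented-out lines above are a quick smoke test. A slightly extended version (an illustrative sketch, not from the original post; it assumes it is appended to the same file so the AlexNet class is in scope) also prints the output shape to confirm the forward pass:

if __name__ == '__main__':
    model = AlexNet(num_classes=1000)
    input1 = torch.rand([32, 3, 224, 224])  # a dummy batch of 32 RGB images, 224x224
    output = model(input1)
    print(output.shape)  # expected: torch.Size([32, 1000])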