ResNet从原理到实现--Bottleneck堆叠

最新推荐文章于 2023-12-05 03:00:00 发布

Gallant Hu

最新推荐文章于 2023-12-05 03:00:00 发布

阅读量1.4k

点赞数

分类专栏：计算机视觉

本文链接：https://blog.csdn.net/weixin_42108090/article/details/109283751

版权

计算机视觉专栏收录该内容

43 篇文章 1 订阅

订阅专栏

在这里插入图片描述

import math


class Bottleneck(M.Module):
    """Three-convolution residual block (1x1 -> 3x3 -> 1x1) with a shortcut.

    The block emits ``channels * expansion`` feature maps. The shortcut is a
    plain identity when the input already has that many channels and the
    block does not stride; otherwise it is a strided 1x1 convolution followed
    by a normalization layer so both branches can be added.

    Args:
        in_channels: number of channels of the incoming tensor.
        channels: base channel count; the output has ``channels * expansion``.
        stride: stride of the 3x3 convolution (and of the projection shortcut).
        groups: number of groups of the 3x3 convolution.
        base_width: width per group; the inner width is
            ``int(channels * (base_width / 64.0)) * groups``.
        dilation: dilation of the 3x3 convolution; also used as its padding.
        norm: callable building a normalization layer from a channel count.
    """

    # Ratio between the block's output channels and ``channels``.
    expansion = 4

    def __init__(
        self,
        in_channels,
        channels,
        stride=1,
        groups=1,
        base_width=64,
        dilation=1,
        norm=M.BatchNorm2d,
    ):
        super().__init__()
        out_channels = channels * self.expansion
        width = int(channels * (base_width / 64.0)) * groups

        # 1x1 convolution: change the channel count to the inner width.
        self.conv1 = M.Conv2d(in_channels, width, 1, 1, bias=False)
        self.bn1 = norm(width)
        # 3x3 convolution: the only place where stride/groups/dilation apply.
        self.conv2 = M.Conv2d(
            width,
            width,
            3,
            stride,
            padding=dilation,
            groups=groups,
            dilation=dilation,
            bias=False,
        )
        self.bn2 = norm(width)
        # 1x1 convolution: expand to the block's output channel count.
        self.conv3 = M.Conv2d(width, out_channels, 1, 1, bias=False)
        self.bn3 = norm(out_channels)

        # Shortcut branch: identity when shapes already agree, otherwise a
        # strided 1x1 projection so that ``x += identity`` is well defined.
        self.downsample = (
            M.Identity()
            if in_channels == out_channels and stride == 1
            else M.Sequential(
                M.Conv2d(in_channels, out_channels, 1, stride, bias=False),
                norm(out_channels),
            )
        )

    def forward(self, x):
        """Apply the residual branch, add the shortcut, and return ReLU of the sum."""
        identity = x

        x = self.conv1(x)
        x = self.bn1(x)
        x = F.relu(x)

        x = self.conv2(x)
        x = self.bn2(x)
        x = F.relu(x)

        x = self.conv3(x)
        x = self.bn3(x)

        identity = self.downsample(identity)

        x += identity
        x = F.relu(x)

        return x

class ResNet(M.Module):
    """ResNet backbone: a convolutional stem, four residual stages, and a linear head.

    Args:
        block: residual block class. It must expose an ``expansion`` attribute
            and accept ``(in_channels, channels, stride, groups=, base_width=,
            dilation=, norm=)``.
        layers: indexable with four entries; ``layers[i]`` is the number of
            blocks stacked in stage ``i + 1``.
        num_classes: output size of the final linear layer.
        zero_init_residual: when true, zero the scale of the last
            normalization layer of every residual block.
        groups: forwarded to every block as ``groups``.
        width_per_group: forwarded to every block as ``base_width``.
        replace_stride_with_dilation: ``None`` or three booleans, one each for
            stages 2-4; a true entry makes that stage use dilation instead of
            stride.
        norm: callable building a normalization layer from a channel count.

    Raises:
        ValueError: if ``replace_stride_with_dilation`` does not have exactly
            three elements.
    """

    def __init__(
        self,
        block,
        layers,
        num_classes=1000,
        zero_init_residual=False,
        groups=1,
        width_per_group=64,
        replace_stride_with_dilation=None,
        norm=M.BatchNorm2d,
    ):
        super().__init__()
        # Running state consumed and updated by _make_layer.
        self.in_channels = 64
        self.dilation = 1

        if replace_stride_with_dilation is None:
            # Each element indicates whether the stride-2 step of the
            # corresponding stage is replaced with a dilated convolution.
            replace_stride_with_dilation = [False, False, False]
        if len(replace_stride_with_dilation) != 3:
            raise ValueError(
                "replace_stride_with_dilation should be None "
                "or a 3-element tuple, got {}".format(replace_stride_with_dilation)
            )
        self.groups = groups
        self.base_width = width_per_group

        # Stem: 7x7 stride-2 convolution, normalization, 3x3 stride-2 max-pool.
        self.conv1 = M.Conv2d(
            3, self.in_channels, kernel_size=7, stride=2, padding=3, bias=False
        )
        self.bn1 = norm(self.in_channels)
        self.maxpool = M.MaxPool2d(kernel_size=3, stride=2, padding=1)

        # Four residual stages; stages 2-4 stride (or dilate) by 2.
        self.layer1 = self._make_layer(block, 64, layers[0], norm=norm)
        self.layer2 = self._make_layer(
            block,
            128,
            layers[1],
            stride=2,
            dilate=replace_stride_with_dilation[0],
            norm=norm,
        )
        self.layer3 = self._make_layer(
            block,
            256,
            layers[2],
            stride=2,
            dilate=replace_stride_with_dilation[1],
            norm=norm,
        )
        self.layer4 = self._make_layer(
            block,
            512,
            layers[3],
            stride=2,
            dilate=replace_stride_with_dilation[2],
            norm=norm,
        )
        self.fc = M.Linear(512 * block.expansion, num_classes)

        # Parameter initialization, chosen per module type.
        for m in self.modules():
            if isinstance(m, M.Conv2d):
                M.init.msra_normal_(m.weight, mode="fan_out", nonlinearity="relu")
                if m.bias is not None:
                    fan_in, _ = M.init.calculate_fan_in_and_fan_out(m.weight)
                    bound = 1 / math.sqrt(fan_in)
                    M.init.uniform_(m.bias, -bound, bound)
            elif isinstance(m, M.BatchNorm2d):
                M.init.ones_(m.weight)
                M.init.zeros_(m.bias)
            elif isinstance(m, M.Linear):
                M.init.msra_uniform_(m.weight, a=math.sqrt(5))
                if m.bias is not None:
                    fan_in, _ = M.init.calculate_fan_in_and_fan_out(m.weight)
                    bound = 1 / math.sqrt(fan_in)
                    M.init.uniform_(m.bias, -bound, bound)

        # Zero-initialize the last BN in each residual branch, so that the
        # residual branch starts with zeros and each residual block behaves
        # like an identity. Reportedly improves the model by 0.2%~0.3%.
        if zero_init_residual:
            # BasicBlock may not be defined next to this class; resolve it
            # lazily so Bottleneck-only usage does not raise NameError.
            basic_block = globals().get("BasicBlock")
            for m in self.modules():
                if isinstance(m, Bottleneck):
                    M.init.zeros_(m.bn3.weight)
                elif basic_block is not None and isinstance(m, basic_block):
                    M.init.zeros_(m.bn2.weight)

    def _make_layer(
        self, block, channels, blocks, stride=1, dilate=False, norm=M.BatchNorm2d
    ):
        """Build one stage of ``blocks`` stacked residual blocks.

        Only the first block receives ``stride``; the remaining blocks use the
        block's default stride. When ``dilate`` is true the stride is folded
        into ``self.dilation`` instead and the stage runs with stride 1.
        Updates ``self.in_channels`` (and possibly ``self.dilation``) so the
        next stage starts from the right state.

        Returns:
            An ``M.Sequential`` wrapping the stage's blocks.
        """
        previous_dilation = self.dilation
        if dilate:
            self.dilation *= stride
            stride = 1

        # The first block adapts channels/resolution and still uses the
        # dilation that was in effect before this stage.
        stage = [
            block(
                self.in_channels,
                channels,
                stride,
                groups=self.groups,
                base_width=self.base_width,
                dilation=previous_dilation,
                norm=norm,
            )
        ]
        self.in_channels = channels * block.expansion
        for _ in range(1, blocks):
            stage.append(
                block(
                    self.in_channels,
                    channels,
                    groups=self.groups,
                    base_width=self.base_width,
                    dilation=self.dilation,
                    norm=norm,
                )
            )
        return M.Sequential(*stage)

    def extract_features(self, x):
        """Run the backbone and return the output of the stem and of every stage.

        Returns:
            A dict with keys ``"stem"``, ``"res2"``, ``"res3"``, ``"res4"`` and
            ``"res5"`` mapping to the corresponding intermediate outputs.
        """
        outputs = {}
        x = self.conv1(x)
        x = self.bn1(x)
        x = F.relu(x)
        x = self.maxpool(x)
        outputs["stem"] = x

        x = self.layer1(x)
        outputs["res2"] = x
        x = self.layer2(x)
        outputs["res3"] = x
        x = self.layer3(x)
        outputs["res4"] = x
        x = self.layer4(x)
        outputs["res5"] = x
        return outputs

    def forward(self, x):
        """Classify ``x``: pool the ``res5`` features, flatten, apply ``fc``.

        NOTE(review): the fixed pooling window of 7 together with the
        ``512 * block.expansion`` input size of ``fc`` presumably expects a
        7x7 ``res5`` map (e.g. 224x224 inputs without dilation) - confirm
        before feeding other resolutions.
        """
        x = self.extract_features(x)["res5"]

        x = F.avg_pool2d(x, 7)
        x = F.flatten(x, 1)
        x = self.fc(x)

        return x

            def resnet50(**kwargs):
                return ResNet(Bottleneck,[3,4,6,3],**kwargs)
            model=resnet50()

            x=normal(size=(2,3,800,800))
            feature_dict=model.extract_features(x)

            for k,v in feature_dict.items():
                print("{}:{}".format(k,v.shape))

Gallant Hu

关注

0
点赞
踩
2

收藏

觉得还不错? 一键收藏
打赏
1
评论
ResNet从原理到实现--Bottleneck堆叠

import math import megengine.functional as F import megengine.hub as hub import megengine.module as M from megengine.random import normal class Bottleneck(M.Module): expansion=4 def __init__( self, in_channels, channels, ...
复制链接

扫一扫