resnet代码分析

1.先导入使用的包，并声明可用的网络和预训练好的模型

import torch.nn as nn

import torch.utils.model_zoo as model_zoo

# Public names exported by this module.

__all__ = ['ResNet', 'resnet18', 'resnet34', 'resnet50', 'resnet101',

           'resnet152']

# Download URLs of the pretrained weights, keyed by model name.

model_urls = {

    'resnet18': 'https://download.pytorch.org/models/resnet18-5c106cde.pth',

    'resnet34': 'https://download.pytorch.org/models/resnet34-333f7ec4.pth',

    'resnet50': 'https://download.pytorch.org/models/resnet50-19c8e357.pth',

    'resnet101': 'https://download.pytorch.org/models/resnet101-5d3b4d8f.pth',

    'resnet152': 'https://download.pytorch.org/models/resnet152-b121ed2d.pth',

}

2.定义要使用到的1*1和3*3的卷积层

# 3x3 2-D convolution: padding=1, stride defaults to 1 (callers may override it),
# dilation and groups are left at the nn.Conv2d defaults, bias=False.
def conv3x3(in_planes, out_planes, stride=1):
    """3x3 convolution with padding.

    Args:
        in_planes (int): Number of input channels.
        out_planes (int): Number of output channels.
        stride (int): Stride of the convolution. Defaults to 1.

    Returns:
        nn.Conv2d: A 3x3 convolution with ``padding=1`` and no bias term.
    """
    # The bias is disabled because every use of this helper in this file is
    # followed by BatchNorm2d, whose shift parameter makes a bias redundant.
    return nn.Conv2d(in_planes, out_planes, kernel_size=3, stride=stride,
                     padding=1, bias=False)

# 1x1 2-D convolution: no padding, stride defaults to 1 (callers may override it),
# dilation and groups are left at the nn.Conv2d defaults, bias=False.
def conv1x1(in_planes, out_planes, stride=1):
    """1x1 convolution.

    Args:
        in_planes (int): Number of input channels.
        out_planes (int): Number of output channels.
        stride (int): Stride of the convolution. Defaults to 1.

    Returns:
        nn.Conv2d: A 1x1 convolution with no bias term.
    """
    # The bias is disabled because every use of this helper in this file is
    # followed by BatchNorm2d, whose shift parameter makes a bias redundant.
    return nn.Conv2d(in_planes, out_planes, kernel_size=1, stride=stride, bias=False)

注意：这里bias设置为False,原因是：

下面使用了Batch Normalization，而其对隐藏层 $Z^{[l]}=W^{[l]}A^{[l-1]}+b^{[l]}$ 有去均值的操作，所以这里的常数项 $b^{[l]}$ 可以消去

因为Batch Normalization有一个操作 $\tilde z^{(i)}=\gamma\cdot z^{(i)}_{norm}+\beta$ ，所以上面 $b^{[l]}$ 的数值效果是能由 $\beta$ 所替代的

因此我们在使用Batch Norm的时候，可以忽略各隐藏层的常数项 $b^{[l]}$ 。

这样在使用梯度下降算法时，只用对 $W^{[l]}$ ， $\beta^{[l]}$ 和 $\gamma^{[l]}$ 进行迭代更新

3.实现两层的残差块

比如：

# Two-layer residual block, used by resnet18/34.
class BasicBlock(nn.Module):
    """Residual block built from two 3x3 convolutions.

    Computes ``relu(F(x) + shortcut(x))`` where ``F`` is
    conv3x3 -> BN -> ReLU -> conv3x3 -> BN and ``shortcut`` is either the
    identity or the ``downsample`` module.

    Args:
        inplanes (int): Number of input channels.
        planes (int): Number of channels produced by both convolutions.
        stride (int): Stride of the first convolution. Defaults to 1.
        downsample (nn.Module or None): Module applied to the input before the
            addition. Needed when the main branch changes the channel count or
            the spatial size, so that the two tensors can be added.
    """

    # Output channels of the block are ``planes * expansion``.
    expansion = 1

    def __init__(self, inplanes, planes, stride=1, downsample=None):
        super(BasicBlock, self).__init__()
        self.conv1 = conv3x3(inplanes, planes, stride)
        self.bn1 = nn.BatchNorm2d(planes)
        self.relu = nn.ReLU(inplace=True)
        self.conv2 = conv3x3(planes, planes)
        self.bn2 = nn.BatchNorm2d(planes)
        self.downsample = downsample
        self.stride = stride

    def forward(self, x):
        """Apply the residual block to ``x`` and return the activated sum."""
        identity = x

        out = self.conv1(x)
        out = self.bn1(out)
        out = self.relu(out)

        out = self.conv2(out)
        out = self.bn2(out)

        # When the shortcut and the main branch differ in shape, project the
        # input (1x1 convolution in this file) so the addition is possible.
        if self.downsample is not None:
            identity = self.downsample(x)

        # H(x) = F(x) + x, or H(x) = F(x) + W x when a projection is used.
        out += identity
        out = self.relu(out)

        return out

4.实现3层的残差块

如图：

# Three-layer residual block, used by resnet50/101/152.
class Bottleneck(nn.Module):
    """Bottleneck residual block: 1x1 -> 3x3 -> 1x1 convolutions.

    The first 1x1 convolution maps ``inplanes`` to ``planes`` channels, the 3x3
    convolution works at ``planes`` channels (and carries the stride), and the
    last 1x1 convolution expands to ``planes * expansion`` channels. The result
    is added to the shortcut and passed through ReLU.

    Args:
        inplanes (int): Number of input channels.
        planes (int): Channel width of the inner 3x3 convolution.
        stride (int): Stride of the 3x3 convolution. Defaults to 1.
        downsample (nn.Module or None): Module applied to the input before the
            addition. Needed when the main branch changes the channel count or
            the spatial size, so that the two tensors can be added.
    """

    # Output channels of the block are ``planes * expansion``.
    expansion = 4

    def __init__(self, inplanes, planes, stride=1, downsample=None):
        super(Bottleneck, self).__init__()
        self.conv1 = conv1x1(inplanes, planes)
        self.bn1 = nn.BatchNorm2d(planes)
        self.conv2 = conv3x3(planes, planes, stride)
        self.bn2 = nn.BatchNorm2d(planes)
        self.conv3 = conv1x1(planes, planes * self.expansion)
        self.bn3 = nn.BatchNorm2d(planes * self.expansion)
        self.relu = nn.ReLU(inplace=True)
        self.downsample = downsample
        self.stride = stride

    def forward(self, x):
        """Apply the bottleneck block to ``x`` and return the activated sum."""
        identity = x

        out = self.conv1(x)
        out = self.bn1(out)
        out = self.relu(out)

        out = self.conv2(out)
        out = self.bn2(out)
        out = self.relu(out)

        out = self.conv3(out)
        out = self.bn3(out)

        # When the shortcut and the main branch differ in shape, project the
        # input (1x1 convolution in this file) so the addition is possible.
        if self.downsample is not None:
            identity = self.downsample(x)

        # H(x) = F(x) + x, or H(x) = F(x) + W x when a projection is used.
        out += identity
        out = self.relu(out)

        return out

5.整个网络实现

class ResNet(nn.Module):
    """ResNet feature extractor with a linear classification head.

    Layout: 7x7 stem convolution + BatchNorm + ReLU, max-pooling, four stages of
    residual blocks, adaptive average pooling and one fully connected layer.

    Args:
        block: Residual block class (``BasicBlock`` or ``Bottleneck``). It must
            expose an ``expansion`` class attribute and accept
            ``(inplanes, planes, stride, downsample)``.
        layers: Sequence of four ints giving the number of residual blocks in
            each of the four stages.
        num_classes (int): Output size of the final linear layer.
            Defaults to 1000.
        zero_init_residual (bool): If True, set the weight (gamma) of the last
            BatchNorm of every residual block to zero so that each block starts
            out as an identity mapping.
    """

    def __init__(self, block, layers, num_classes=1000, zero_init_residual=False):
        super(ResNet, self).__init__()
        # Channel count fed into the next stage; updated by _make_layer.
        self.inplanes = 64
        # Stem: 64 kernels of size 7x7, stride 2, padding 3. Turns the
        # 3-channel RGB input into a 64-channel feature map.
        self.conv1 = nn.Conv2d(3, 64, kernel_size=7, stride=2, padding=3,
                               bias=False)
        self.bn1 = nn.BatchNorm2d(64)
        self.relu = nn.ReLU(inplace=True)
        # Max-pooling after the stem.
        self.maxpool = nn.MaxPool2d(kernel_size=3, stride=2, padding=1)
        # The four residual stages; every stage after the first uses stride 2.
        self.layer1 = self._make_layer(block, 64, layers[0])
        self.layer2 = self._make_layer(block, 128, layers[1], stride=2)
        self.layer3 = self._make_layer(block, 256, layers[2], stride=2)
        self.layer4 = self._make_layer(block, 512, layers[3], stride=2)
        # Adaptive average pooling down to a 1x1 map per channel.
        self.avgpool = nn.AdaptiveAvgPool2d((1, 1))
        # Fully connected classification layer.
        self.fc = nn.Linear(512 * block.expansion, num_classes)

        for m in self.modules():
            if isinstance(m, nn.Conv2d):
                # Kaiming normal initialisation; mode='fan_out' is the variant
                # intended to preserve magnitudes in the backward pass.
                nn.init.kaiming_normal_(m.weight, mode='fan_out', nonlinearity='relu')
            elif isinstance(m, nn.BatchNorm2d):
                # gamma (weight) starts at 1, beta (bias) starts at 0.
                nn.init.constant_(m.weight, 1)
                nn.init.constant_(m.bias, 0)

        # Zero-initialize the last BN in each residual branch, so that the
        # residual branch starts with zeros and each residual block behaves
        # like an identity.
        # This improves the model by 0.2~0.3% according to https://arxiv.org/abs/1706.02677
        if zero_init_residual:
            for m in self.modules():
                if isinstance(m, Bottleneck):
                    # The last BN of a Bottleneck is bn3.
                    nn.init.constant_(m.bn3.weight, 0)
                elif isinstance(m, BasicBlock):
                    # The last BN of a BasicBlock is bn2.
                    nn.init.constant_(m.bn2.weight, 0)

    def _make_layer(self, block, planes, blocks, stride=1):
        """Build one stage made of ``blocks`` residual blocks.

        Args:
            block: Residual block class (two-layer or three-layer).
            planes (int): Base channel width of the stage; the stage outputs
                ``planes * block.expansion`` channels.
            blocks (int): Number of residual blocks in the stage.
            stride (int): Stride of the first block. Defaults to 1.

        Returns:
            nn.Sequential: The stage. ``self.inplanes`` is updated to the
            stage's output channel count as a side effect.
        """
        downsample = None
        # The shortcut of the first block needs a 1x1 projection whenever the
        # stage changes the spatial size (stride != 1) or the channel count,
        # otherwise input and output could not be added.
        if stride != 1 or self.inplanes != planes * block.expansion:
            downsample = nn.Sequential(
                conv1x1(self.inplanes, planes * block.expansion, stride),
                nn.BatchNorm2d(planes * block.expansion),
            )

        layers = []
        # Only the first block of a stage receives the stride and projection.
        layers.append(block(self.inplanes, planes, stride, downsample))
        self.inplanes = planes * block.expansion
        # Remaining blocks keep the shape: default stride, no projection.
        for _ in range(1, blocks):
            layers.append(block(self.inplanes, planes))

        return nn.Sequential(*layers)

    def forward(self, x):
        """Run the network on ``x`` and return the output of the linear layer."""
        x = self.conv1(x)
        x = self.bn1(x)
        x = self.relu(x)
        x = self.maxpool(x)

        x = self.layer1(x)
        x = self.layer2(x)
        x = self.layer3(x)
        x = self.layer4(x)

        x = self.avgpool(x)
        # Flatten everything except the leading (batch) dimension.
        x = x.view(x.size(0), -1)
        x = self.fc(x)

        return x

6.不同层次网络实现

# 18-layer ResNet
def resnet18(pretrained=False, **kwargs):
    """Constructs a ResNet-18 model.

    Args:
        pretrained (bool): If True, returns a model pre-trained on ImageNet
        **kwargs: Forwarded to the ``ResNet`` constructor.

    Returns:
        ResNet: The constructed model.
    """
    model = ResNet(BasicBlock, [2, 2, 2, 2], **kwargs)
    # Optionally start from the published weights instead of a fresh
    # initialisation, e.g. to continue training from them.
    if pretrained:
        model.load_state_dict(model_zoo.load_url(model_urls['resnet18']))
    return model

# 34-layer ResNet
def resnet34(pretrained=False, **kwargs):
    """Constructs a ResNet-34 model.

    Args:
        pretrained (bool): If True, returns a model pre-trained on ImageNet
        **kwargs: Forwarded to the ``ResNet`` constructor.

    Returns:
        ResNet: The constructed model.
    """
    model = ResNet(BasicBlock, [3, 4, 6, 3], **kwargs)
    # Optionally start from the published weights instead of a fresh
    # initialisation, e.g. to continue training from them.
    if pretrained:
        model.load_state_dict(model_zoo.load_url(model_urls['resnet34']))
    return model

# 50-layer ResNet
def resnet50(pretrained=False, **kwargs):
    """Constructs a ResNet-50 model.

    Args:
        pretrained (bool): If True, returns a model pre-trained on ImageNet
        **kwargs: Forwarded to the ``ResNet`` constructor.

    Returns:
        ResNet: The constructed model.
    """
    model = ResNet(Bottleneck, [3, 4, 6, 3], **kwargs)
    # Optionally start from the published weights instead of a fresh
    # initialisation, e.g. to continue training from them.
    if pretrained:
        model.load_state_dict(model_zoo.load_url(model_urls['resnet50']))
    return model

# 101-layer ResNet
def resnet101(pretrained=False, **kwargs):
    """Constructs a ResNet-101 model.

    Args:
        pretrained (bool): If True, returns a model pre-trained on ImageNet
        **kwargs: Forwarded to the ``ResNet`` constructor.

    Returns:
        ResNet: The constructed model.
    """
    model = ResNet(Bottleneck, [3, 4, 23, 3], **kwargs)
    # Optionally start from the published weights instead of a fresh
    # initialisation, e.g. to continue training from them.
    if pretrained:
        model.load_state_dict(model_zoo.load_url(model_urls['resnet101']))
    return model

# 152-layer ResNet
def resnet152(pretrained=False, **kwargs):
    """Constructs a ResNet-152 model.

    Args:
        pretrained (bool): If True, returns a model pre-trained on ImageNet
        **kwargs: Forwarded to the ``ResNet`` constructor.

    Returns:
        ResNet: The constructed model.
    """
    model = ResNet(Bottleneck, [3, 8, 36, 3], **kwargs)
    # Optionally start from the published weights instead of a fresh
    # initialisation, e.g. to continue training from them.
    if pretrained:
        model.load_state_dict(model_zoo.load_url(model_urls['resnet152']))
    return model

resnet代码分析的更多相关文章

Android代码分析工具lint学习
1 lint简介 1.1 概述 lint是随Android SDK自带的一个静态代码分析工具.它用来对Android工程的源文件进行检查,找出在正确性.安全.性能.可使用性.可访问性及国际化等方面可能 ...
pmd静态代码分析
在正式进入测试之前,进行一定的静态代码分析及code review对代码质量及系统提高是有帮助的,以上为数据证明 Pmd 它是一个基于静态规则集的Java源码分析器,它可以识别出潜在的如下问题:– 可 ...
[Asp.net 5] DependencyInjection项目代码分析-目录
微软DI文章系列如下所示: [Asp.net 5] DependencyInjection项目代码分析 [Asp.net 5] DependencyInjection项目代码分析2-Autofac [ ...
[Asp.net 5] DependencyInjection项目代码分析4-微软的实现（5）（IEnumerable<>补充）
Asp.net 5的依赖注入注入系列可以参考链接: [Asp.net 5] DependencyInjection项目代码分析-目录我们在之前讲微软的实现时,对于OpenIEnumerableSer ...
完整全面的Java资源库（包括构建、操作、代码分析、编译器、数据库、社区等等）
构建这里搜集了用来构建应用程序的工具. Apache Maven:Maven使用声明进行构建并进行依赖管理,偏向于使用约定而不是配置进行构建.Maven优于Apache Ant.后者采用了一种过程化 ...
STM32启动代码分析 IAR 比较好
stm32启动代码分析 (2012-06-12 09:43:31) 转载▼ 最近开始使用ST的stm32w108芯片(也是一款zigbee芯片).开始看他的启动代码看的晕晕呼呼呼的. 还好在c ...
常用 Java 静态代码分析工具的分析与比较
常用 Java 静态代码分析工具的分析与比较简介: 本文首先介绍了静态代码分析的基本概念及主要技术,随后分别介绍了现有 4 种主流 Java 静态代码分析工具 (Checkstyle,FindBu ...
SonarQube-5.6.3 代码分析平台搭建使用
python代码分析官网主页: http://docs.sonarqube.org/display/PLUG/Python+Plugin Windows下安装使用: 快速使用: 1．下载jdk ht ...
angular代码分析之异常日志设计
angular代码分析之异常日志设计错误异常是面向对象开发中的记录提示程序执行问题的一种重要机制,在程序执行发生问题的条件下,异常会在中断程序执行,同时会沿着代码的执行路径一步一步的向上抛出异常,最 ...

随机推荐

eShopOnContainers 知多少[4]：Catalog microservice
引言 Catalog microservice(目录微服务)维护着所有产品信息,包括库存.价格.所以该微服务的核心业务为: 产品信息的维护库存的更新价格的维护架构模式如上图所示,本微服务采用简 ...
kafka基础知识点
1.安装: 1.1. 前置安装要求:java + zookeeper 1.2. 下载安装包:http://mirros.cnnic.cn/apache/kafka/0.9.00/kafka_2.10- ...
PLC
https://www.cnblogs.com/dathlin/p/7469679.html C#读写三菱PLC和西门子PLC数据使用TCP/IP 协议https://blog.csdn.net/x ...
mysql安装问题（一）
mysql安装问题 mysql安装一直未响应问题: 原因: 解决方案: 登录mysql时提示密码错误问题: 解决方案: mysql安装问题 Author:母虎忠日期:April 26, 2019 ...
【Git之旅】1.Git常用命令
1.创建初始化版本库 git init 2.将文件添加到版本库中 git add index.html (添加到暂存区) git add . 命令让Git把当前目录及目录中的文件都添加到版本库里 gi ...
mac 下常用命令备忘录
1.查看端口号 lsof -i: 2.杀死进程 kill 41321 3.查看文件夹文件 ls ls -l //看到文件及文件夹更多的内容 ls -a //隐藏的文件 ls -la //上面的组合 4 ...
详解IPTABLES
详解IPTABLES Iptables 是Linux 内核集成的 IP 信息包过滤系统.如果Linux 系统连接到因特网或 LAN.服务器或连接 LAN 和因特网的代理服务器, 则该系统有利于在 Li ...
如何将Azure DevOps中的代码发布到Azure App Service中
标题:如何将Azure DevOps中的代码发布到Azure App Service中作者:Lamond Lu 背景最近做了几个项目一直在用Azure DevOps和Azure App Servi ...
dotnet core开源博客系统XBlog介绍
XBlog是dotnet core平台下的个人博客开源系统,它只需要通过Copy的方式即可以部署到Linux和windows系统中:如果你有安全证书那只需要简单配置一下即可提供安全的Https服务.接 ...
springcloud~配置中心的使用
配置中心作为springcloud里最底层的框架,所发挥的意思是举足轻重的,所以的组件的配置信息都可以通过springcloud config来管理,它会把配置信息分布式的存储到git上,所以信息安全 ...

resnet代码分析

resnet代码分析的更多相关文章

随机推荐

热门专题