Pytorch源码学习之七：torchvision.models.googlenet

2023-05-16

0.基本知识

torchvision.models.googlenet源码地址
GoogLeNet论文地址

Inception模块

注意，代码中Inception模块的第三个分支(branch3)采用的是3x3卷积，而非论文中的5x5卷积。这是torchvision实现中的一个已知问题，为了与预训练权重保持兼容而保留（参见pytorch/vision的issue #906）。
GoogLeNet网络结构
GoogLeNet网络结构可视化

这里注意两个辅助的输出。

一、源码

import torch
import torch.nn as nn
import torch.nn.functional as F
import warnings
from collections import namedtuple
from torch.hub import load_state_dict_from_url

# Names exported by ``from <module> import *``.
__all__ = ['GoogLeNet', 'googlenet']

# Download URLs of pretrained weights, keyed by model name.
model_urls = {
    # GoogLeNet ported from TensorFlow
    'googlenet': 'https://download.pytorch.org/models/googlenet-1378be20.pth',
}

# Tuple returned by GoogLeNet.forward when the auxiliary classifiers are
# active: the main logits first, then the outputs of aux2 and aux1.
# NOTE: the "Ouputs" spelling is part of the runtime name and is left as-is.
_GoogLeNetOuputs = namedtuple('GoogLeNetOuputs', ['logits', 'aux_logits2', 'aux_logits1'])

class BasicBlock(nn.Module):
    """Convolution followed by batch normalization and an in-place ReLU.

    Args:
        in_channels: number of channels of the input feature map.
        out_channels: number of channels produced by the convolution.
        **kwargs: forwarded unchanged to ``nn.Conv2d`` (for example
            ``kernel_size``, ``stride`` and ``padding``).
    """

    # The constructor has to be spelled ``__init__``. Under the former
    # ``__init`` spelling Python never called it, so constructing a block
    # with arguments raised a TypeError and ``conv``/``bn`` never existed.
    def __init__(self, in_channels, out_channels, **kwargs):
        super(BasicBlock, self).__init__()
        # No convolution bias: the output goes straight into BatchNorm2d.
        self.conv = nn.Conv2d(in_channels, out_channels, bias=False, **kwargs)
        self.bn = nn.BatchNorm2d(out_channels, eps=0.001)

    def forward(self, x):
        """Apply conv -> batch norm -> ReLU to ``x`` and return the result."""
        x = self.conv(x)
        x = self.bn(x)

        # In-place ReLU overwrites the batch-norm output, not the caller's input.
        return F.relu(x, inplace=True)

class Inception(nn.Module):
    """Inception module: four parallel branches joined along the channel axis.

    Args:
        in_channels: channels of the input feature map.
        ch1x1: output channels of the 1x1 branch.
        ch3x3red: channels after the 1x1 reduction in the second branch.
        ch3x3: output channels of the second branch.
        ch5x5red: channels after the 1x1 reduction in the third branch.
        ch5x5: output channels of the third branch.
        pool_proj: output channels of the pooling branch.

    The output has ``ch1x1 + ch3x3 + ch5x5 + pool_proj`` channels.
    """

    def __init__(self, in_channels, ch1x1, ch3x3red, ch3x3, ch5x5red, ch5x5, pool_proj):
        super(Inception, self).__init__()

        # Branch 1: a single 1x1 convolution.
        self.branch1 = BasicBlock(in_channels, ch1x1, kernel_size=1)

        # Branch 2: 1x1 reduction, then a padded 3x3 convolution.
        reduce_a = BasicBlock(in_channels, ch3x3red, kernel_size=1)
        conv_a = BasicBlock(ch3x3red, ch3x3, kernel_size=3, padding=1)
        self.branch2 = nn.Sequential(reduce_a, conv_a)

        # Branch 3: 1x1 reduction, then a padded 3x3 convolution. The
        # parameters are named "5x5" but the kernel used here is 3x3.
        reduce_b = BasicBlock(in_channels, ch5x5red, kernel_size=1)
        conv_b = BasicBlock(ch5x5red, ch5x5, kernel_size=3, padding=1)
        self.branch3 = nn.Sequential(reduce_b, conv_b)

        # Branch 4: stride-1 max pooling, then a 1x1 projection.
        pool = nn.MaxPool2d(kernel_size=3, stride=1, padding=1, ceil_mode=True)
        projection = BasicBlock(in_channels, pool_proj, kernel_size=1)
        self.branch4 = nn.Sequential(pool, projection)

    def forward(self, x):
        """Run every branch on ``x`` and concatenate the results on dim 1."""
        branches = (self.branch1, self.branch2, self.branch3, self.branch4)
        return torch.cat([branch(x) for branch in branches], 1)

class InceptionAux(nn.Module):
    """Auxiliary classifier head attached to an intermediate feature map.

    Args:
        in_channels: channels of the feature map fed to the head.
        num_classes: size of the output logit vector.
    """

    def __init__(self, in_channels, num_classes):
        super(InceptionAux, self).__init__()
        self.conv = BasicBlock(in_channels, 128, kernel_size=1)

        # 2048 = 128 channels x 4 x 4 spatial positions after pooling.
        self.fc1 = nn.Linear(2048, 1024)
        self.fc2 = nn.Linear(1024, num_classes)

    def forward(self, x):
        """Return ``N x num_classes`` logits for the feature map ``x``."""
        # Pool to a fixed 4x4 grid: N x in_channels x 4 x 4.
        pooled = F.adaptive_avg_pool2d(x, (4, 4))
        # N x 128 x 4 x 4
        features = self.conv(pooled)
        # N x 2048
        flat = features.view(features.size(0), -1)
        # N x 1024
        hidden = F.relu(self.fc1(flat), inplace=True)
        # Dropout with p=0.7, only active while the module is in training mode.
        hidden = F.dropout(hidden, 0.7, training=self.training)
        # N x num_classes
        return self.fc2(hidden)

class GoogLeNet(nn.Module):
    """GoogLeNet classifier with optional auxiliary heads.

    Args:
        num_classes: number of output classes of the main and auxiliary heads.
        aux_logits: when True, build the two auxiliary classifiers; their
            outputs are returned only while the module is in training mode.
        transform_input: when True, apply a fixed per-channel affine
            rescaling to the input before the first convolution.
        init_weights: when True, initialize conv/linear weights from a
            truncated normal distribution and reset batch-norm parameters.

    The shape comments in ``forward`` assume a 224 x 224 input.
    """

    def __init__(self, num_classes=1000, aux_logits=True, transform_input=False, init_weights=True):
        super(GoogLeNet, self).__init__()
        self.aux_logits = aux_logits
        self.transform_input = transform_input

        # Stem.
        self.conv1 = BasicBlock(3, 64, kernel_size=7, stride=2, padding=3)
        self.maxpool1 = nn.MaxPool2d(3, stride=2, ceil_mode=True)
        self.conv2 = BasicBlock(64, 64, kernel_size=1)
        self.conv3 = BasicBlock(64, 192, kernel_size=3, padding=1)
        self.maxpool2 = nn.MaxPool2d(3, stride=2, ceil_mode=True)

        # Trailing comments give the channel count produced by each module.
        self.inception3a = Inception(192, 64, 96, 128, 16, 32, 32)  # 64+128+32+32=256
        self.inception3b = Inception(256, 128, 128, 192, 32, 96, 64)  # 128+192+96+64=480
        self.maxpool3 = nn.MaxPool2d(3, stride=2, ceil_mode=True)

        self.inception4a = Inception(480, 192, 96, 208, 16, 48, 64)  # 192+208+48+64=512
        self.inception4b = Inception(512, 160, 112, 224, 24, 64, 64)  # 160+224+64+64=512
        self.inception4c = Inception(512, 128, 128, 256, 24, 64, 64)  # 128+256+64+64=512
        self.inception4d = Inception(512, 112, 144, 288, 32, 64, 64)  # 112+288+64+64=528
        self.inception4e = Inception(528, 256, 160, 320, 32, 128, 128)  # 256+320+128+128=832
        self.maxpool4 = nn.MaxPool2d(2, stride=2, ceil_mode=True)

        self.inception5a = Inception(832, 256, 160, 320, 32, 128, 128)  # 256+320+128+128=832
        self.inception5b = Inception(832, 384, 192, 384, 48, 128, 128)  # 384+384+128+128=1024

        if aux_logits:
            # aux1 reads the output of inception4a, aux2 that of inception4d.
            self.aux1 = InceptionAux(512, num_classes)
            self.aux2 = InceptionAux(528, num_classes)

        self.avgpool = nn.AdaptiveAvgPool2d((1, 1))
        self.dropout = nn.Dropout(0.2)
        self.fc = nn.Linear(1024, num_classes)

        if init_weights:
            self._initialize_weights()

    def _initialize_weights(self):
        """Initialize conv/linear weights and reset batch-norm parameters.

        Conv2d and Linear weights are sampled from a normal distribution with
        scale 0.01 truncated at two standard deviations; BatchNorm2d weights
        are set to 1 and biases to 0.
        """
        # Local import: scipy is only needed when weights are initialized.
        import scipy.stats as stats

        # The frozen distribution does not depend on the module, so it is
        # built once instead of once per layer.
        truncated_normal = stats.truncnorm(-2, 2, scale=0.01)

        for m in self.modules():
            if isinstance(m, (nn.Conv2d, nn.Linear)):
                samples = truncated_normal.rvs(m.weight.numel())
                values = torch.as_tensor(samples, dtype=m.weight.dtype)
                values = values.view(m.weight.size())
                # Copy without recording the assignment in autograd.
                with torch.no_grad():
                    m.weight.copy_(values)
            elif isinstance(m, nn.BatchNorm2d):
                nn.init.constant_(m.weight, 1)
                nn.init.constant_(m.bias, 0)

    def forward(self, x):
        """Compute class logits for a batch of images.

        Returns:
            ``_GoogLeNetOuputs(logits, aux_logits2, aux_logits1)`` when the
            module is in training mode and ``aux_logits`` is set; otherwise
            only the main logits tensor.
        """
        if self.transform_input:
            # Per-channel affine rescaling of the input.
            # NOTE(review): the constants look like ImageNet mean/std being
            # converted to a (x - 0.5) / 0.5 normalization - confirm.
            x_ch0 = torch.unsqueeze(x[:, 0], 1) * (0.229 / 0.5) + (0.485 - 0.5) / 0.5
            x_ch1 = torch.unsqueeze(x[:, 1], 1) * (0.224 / 0.5) + (0.456 - 0.5) / 0.5
            x_ch2 = torch.unsqueeze(x[:, 2], 1) * (0.225 / 0.5) + (0.406 - 0.5) / 0.5
            x = torch.cat((x_ch0, x_ch1, x_ch2), 1)

        # The auxiliary heads only contribute while training.
        use_aux = self.training and self.aux_logits

        # N x 3 x 224 x 224
        x = self.conv1(x)
        # N x 64 x 112 x 112
        x = self.maxpool1(x)
        # N x 64 x 56 x 56
        x = self.conv2(x)
        # N x 64 x 56 x 56
        x = self.conv3(x)
        # N x 192 x 56 x 56
        x = self.maxpool2(x)

        # N x 192 x 28 x 28
        x = self.inception3a(x)
        # N x 256 x 28 x 28
        x = self.inception3b(x)
        # N x 480 x 28 x 28
        x = self.maxpool3(x)
        # N x 480 x 14 x 14
        x = self.inception4a(x)
        # N x 512 x 14 x 14
        if use_aux:
            aux1 = self.aux1(x)

        x = self.inception4b(x)
        # N x 512 x 14 x 14
        x = self.inception4c(x)
        # N x 512 x 14 x 14
        x = self.inception4d(x)
        # N x 528 x 14 x 14
        if use_aux:
            aux2 = self.aux2(x)

        x = self.inception4e(x)
        # N x 832 x 14 x 14
        x = self.maxpool4(x)
        # N x 832 x 7 x 7
        x = self.inception5a(x)
        # N x 832 x 7 x 7
        x = self.inception5b(x)
        # N x 1024 x 7 x 7

        x = self.avgpool(x)
        # N x 1024 x 1 x 1
        x = x.view(x.size(0), -1)
        # N x 1024
        x = self.dropout(x)
        x = self.fc(x)
        # N x 1000(num_classes)
        if use_aux:
            return _GoogLeNetOuputs(x, aux2, aux1)
        return x

def googlenet(pretrained=False, progress=True, **kwargs):
    """Build a GoogLeNet model, optionally loading pretrained weights.

    Args:
        pretrained: when True, load the weights at ``model_urls['googlenet']``.
        progress: forwarded to ``load_state_dict_from_url``.
        **kwargs: forwarded to the ``GoogLeNet`` constructor. With
            ``pretrained=True``, ``transform_input`` defaults to True,
            ``aux_logits`` defaults to False and ``init_weights`` is forced
            to False.

    Returns:
        The constructed ``GoogLeNet`` instance.
    """
    if not pretrained:
        return GoogLeNet(**kwargs)

    kwargs.setdefault('transform_input', True)
    kwargs.setdefault('aux_logits', False)

    wants_aux = kwargs['aux_logits']
    if wants_aux:
        warnings.warn('auxiliary heads in the pretrained googlenet model are NOT pretrained, '
                      'so make sure to train them')

    # Always build the auxiliary heads so the model's keys match the
    # checkpoint; they are removed again below if the caller did not ask
    # for them.
    kwargs['aux_logits'] = True
    # The weights are about to be overwritten, so skip random initialization.
    kwargs['init_weights'] = False
    net = GoogLeNet(**kwargs)

    weights = load_state_dict_from_url(model_urls['googlenet'],
                                       progress=progress)
    net.load_state_dict(weights)

    if not wants_aux:
        net.aux_logits = False
        del net.aux1, net.aux2
    return net

二、一些有趣的用法

1.collections.namedtuple

使用以下方式来返回辅助输出和最终输出，方便索引.

from collections import namedtuple
_GoogLeNetOuputs = namedtuple('GoogLeNetOuputs', ['logits', 'aux_logits2', 'aux_logits1'])
class GoogLeNet(nn.Module):
    ...
    def forward(self, x):
        ...
        if self.training and self.aux_logits:
            return _GoogLeNetOuputs(x, aux2, aux1)

2.使用warnings来返回自定义警告

import warnings
if pretrained:
	if kwargs['aux_logits']:
		warnings.warn('your warnings')

本文内容由网友自发贡献，版权归原作者所有，本站不承担相应法律责任。如您发现有涉嫌抄袭侵权的内容，请联系:hwhale#tublm.com(使用前将#替换为@)

Pytorch

torchvision

models

GoogLeNet

源码学习之七

Pytorch源码学习之七：torchvision.models.googlenet 的相关文章

PyTorch - 参数不变

为了了解 pytorch 的工作原理我尝试对多元正态分布中的一些参数进行最大似然估计然而它似乎不适用于任何协方差相关的参数所以我的问题是为什么这段代码不起作用 import torch def make covariance ma
“模块”对象没有属性“form_for_model”

当我使用属性时模型的表单我收到错误模块对象没有属性 form for model 我由此创建了该项目http www mikecantelon com q node 22 http www mikecantelon com q node
查找张量中沿轴的非零元素的数量

我想找到沿特定轴的张量中非零元素的数量有没有 PyTorch 函数可以做到这一点我尝试使用非零 http pytorch org docs master torch html highlight nonzero torch nonzer
如何在会话中运行多个图 - Tensorflow API

张量流API https github com tensorflow models tree master research object detection提供了一些预先训练的模型并允许我们使用任何数据集来训练它们我想知道如何在一个张
在pytorch中使用tensorboard，但得到空白页面？

我在pytorch 1 3 1中使用tensorboard 并且我在张量板的 pytorch 文档 https pytorch org docs stable tensorboard html 运行后tensorboard logdir r
将 CNN Pytorch 中的预训练权重传递到 Tensorflow 中的 CNN

我在 Pytorch 中针对 224x224 大小的图像和 4 个类别训练了这个网络 class CustomConvNet nn Module def init self num classes super CustomConvNet s
删除 Torch 张量中的行

我有一个火炬张量如下 a tensor 0 2215 0 5859 0 4782 0 7411 0 3078 0 3854 0 3981 0 5200 0 1363 0 4060 0 2030 0 4940 0 1640 0 6025 0
如何避免 PyTorch 中的“CUDA 内存不足”

我认为对于 GPU 内存较低的 PyTorch 用户来说这是一个非常常见的消息 RuntimeError CUDA out of memory Tried to allocate X MiB GPU X X GiB total capac
Model() 获得参数“nr_class”的多个值 - SpaCy 多分类模型（BERT 集成）

您好我正在致力于使用新的 SpaCy 模型实现多分类模型 5 类 en pytt bertbaseuncased lg 新管道的代码在这里 nlp spacy load en pytt bertbaseuncased lg textcat
django 查询所有相关集的过滤？

class Customer models Model name models CharField max length 200 class CustomerTicket models Model customer models OneTo
如何在pytorch中查看DataLoader中的数据

我在 Github 上的示例中看到类似以下内容如何查看该数据的类型形状和其他属性 train data MyDataset int 1e3 length 50 train iterator DataLoader train data b
LSTM 错误：AttributeError：“tuple”对象没有属性“dim”

我有以下代码 import torch import torch nn as nn model nn Sequential nn LSTM 300 300 nn Linear 300 100 nn ReLU nn Linear 300 7
Ruby NoMethodError - BlahController 的未定义方法“blah_url”

我从链接调用这个js function createNewTopLevelEntry var user id user val var header prompt Enter the name ajax users user id entr
从打包序列中获取每个序列的最后一项

我试图通过 GRU 放置打包和填充的序列并检索每个序列最后一项的输出当然我的意思不是 1项目但实际上是最后一个未填充的项目我们预先知道序列的长度因此应该很容易为每个序列提取length 1 item 我尝试了以下方法 impor
下载变压器模型以供离线使用

我有一个训练有素的 Transformer NER 模型我想在未连接到互联网的机器上使用它加载此类模型时当前会将缓存文件下载到 cache 文件夹要离线加载并运行模型需要将 cache 文件夹中的文件复制到离线机器上然而这些文
pytorch 中的 keras.layers.Masking 相当于什么？

我有时间序列序列我需要通过将零填充到矩阵中并在 keras 中使用 keras layers Masking 来将序列的长度固定为一个数字我可以忽略这些填充的零以进行进一步的计算我想知道它怎么可能在 Pytorch 中完成要么我需要
BatchNorm 动量约定 PyTorch

Is the 批归一化动量约定 http pytorch org docs master modules torch nn modules batchnorm html 默认 0 1 与其他库一样正确例如Tensorflow默认情况下似乎
如何计算 CNN 第一个线性层的维度

目前我正在使用 CNN 其中附加了一个完全连接的层并且我正在使用尺寸为 32x32 的 3 通道图像我想知道是否有一个一致的公式可以用来计算第一个线性层的输入尺寸和最后一个卷积最大池层的输入我希望能够计算第一个线性层的尺寸仅给出
在 ASP.NET MVC3 中，应该如何呈现由多个模型支持的多个 PartialView？

在 MVC3 Razor 中如何创建具有多个表单的页面以便每个表单都是使用自己的模型渲染的部分视图我们一直在尝试各种形式的调用 Html RenderPartial 传入部分视图名称以及我们通过 ViewBag 访问的模型实例但我们
PyTorch 中的交叉熵

交叉熵公式但为什么下面给出loss 0 7437代替loss 0 since 1 log 1 0 import torch import torch nn as nn from torch autograd import Variable

随机推荐

Pycharm快捷键及使用技巧

一基本设置二调试三快捷键快捷键操作Ctrl + 点击查看源码Ctrl + Q查看代码docCtrl + Shift + I查看代码源码Shift + Enter向下另起一行，光标在行内任意位置都能另起一行
CVPR 2020: Back to the Future: Joint Aware Temporal Deep Learning 3D Human Pose Estimation 论文阅读随笔

论文网址 Github
CVPR 2020: VIBE: Video Inference for Human Body Pose and Shape Estimation 阅读随笔

论文地址 Github地址以下为我的OneNote阅读笔记，为图片格式，留言邮件可发原文件
CVPR2020: GhostNet: More Features from Cheap Operations 论文阅读随笔

参考地址：论文地址 Github地址以下为我的阅读OneNote笔记为图片格式原文件可留言私信获取如有问题，可留言讨论
CVPR2020 Oral: PolarMask: Single Shot Instance Segmentation with Polar Representation 论文阅读随笔

论文原文 Github代码作者本人的解读以下为我自己的阅读笔记，为OneNote图片格式，留言或私信可获取原文件，欢迎讨论
Pytorch源码学习之一： torchvision.models.alexnet

Pytorch源码学习之一 torchvision models alexnet torch中一行代码导入的alexnet配置如下 xff1a 64 64 11x11 stride 61 4 43 ReLU 43 Maxpooling 3x
CVPR2020: Suppressing Uncertainties for Large-Scale Facial Expression Recognition 阅读随笔

0 Abstract 大规模表情识别 large scale Facial Expression Recognition FER 的主要挑战在于不确定性 uncertainties xff0c 这些不确定性来源于模棱两可的面部表情 ambi
CSS字体加粗总结

CSS 加粗知识与CSS 加粗实例 DIV 43 CSS基础知识 CSS 加粗这里指的是通过DIV CSS控制对象的加粗使用CSS属性单词 font weight 对象值 xff1a 从100到900 xff0c 最常用font weig
Python argparse用法详情

在神经网络训练中 xff0c argparse的方法可以让改变参数模型超参文件位置 GPU等更加方便一 argparse使用步骤 Step1 导入argparse模块 span class token keyword import
Python time获取各种格式的时间

一时间戳格式 span class token keyword import span time start span class token operator 61 span time span class token punctuat
CVPR2020: CenterMask:Real-Time Anchor-Free Instance Segmentation 阅读随笔
Pytorch源码学习之二：torchvision.models.vgg

0 VGG的网络结构一 torchvision源码这种通过配置文件一次性搭建相似网络的结构的方法十分值得学习和模仿这也是相对于AlexNet的实现过程不同之处我对其做了一丁点修改 xff0c 源码网址可见torchvision mo
ICCV 2019: FCOS: Fully Convolutional One-Stage Object Detection论文阅读笔记
Pytorch源码学习之三：torchvision.models.resnet

一网络结构 1 BasicBlock 2 BootleNeck和group convolution 3 Dilated Convolution with a 3 x 3 kernel and dilation rate 2 二 torch
python将多帧图片组合成视频

span class token keyword import span cv2 span class token keyword import span os span class token keyword import span ra
Pytorch源码学习之四：torchvision.models.squeezenet

0 介绍 Squeezenet网址 torchvision model squeeze官方文档主要思想 xff1a 堆叠Fire模块 xff0c 每个Fire模块 xff0c 分别采用1x1和3x3两个分支 xff0c 最后做拼 xff1
Pytorch源码学习之五：torchvision.models.densenet

0 基本知识 DenseNet论文地址 DenseNet加强了每个Dense Block内部的连接 xff0c 每层输出与之前所有层进行concat连接 xff0c 使用三个Dense Block的网络示意图如下 xff1a 每个Block
Pytorch源码学习之六：torchvision.models.inception_v3

0 参考和简介 torchvision models inception v3源码实现的论文地址部分网络结构 xff1a InceptionA InceptionC InceptionE 一源码 span class token co
设备管理信息系统

设备管理系统设备管理系统 xff08 Equipment Management System xff09 是将信息化了设备技术信息与现代化管理相结合 xff0c 是实现研究级管理信息化的先导设备管理软件是设备管理模式与计算机技术结合的产
Pytorch源码学习之七：torchvision.models.googlenet

0 基本知识 torchvision models googlenet源码地址 GoogLeNet论文地址 Inception模块注意，代码中第三个模块采取的3x3卷积而非5x5卷积，不知为何 GoogLeNet网

Pytorch源码学习之七：torchvision.models.googlenet

0.基本知识

一、源码

二、一些有趣的用法

1.collections.namedtuple

warnings来返回自定义警告

Pytorch源码学习之七：torchvision.models.googlenet 的相关文章

随机推荐

热门标签