Pytorch实现ResNet

2023年7月13日下午11:57 • 人工智能 • 阅读 59

ResNet网络模型

import torch
import torch.nn as nn

class BaicsBlock(nn.Module):
    """Residual block made of two 3x3 convolutions (used by ResNet18/34).

    The main path is conv3x3 -> BN -> ReLU -> conv3x3 -> BN; the shortcut
    (optionally transformed by ``downsample``) is added before the final ReLU.

    Args:
        in_channel: number of channels of the input feature map.
        out_channel: number of channels produced by both convolutions.
        stride: stride of the first convolution; values > 1 reduce the
            spatial size. The second convolution always uses stride 1.
        downsample: optional module applied to the input so that the shortcut
            matches the main path in channels and spatial size.
    """

    def expansion(self):
        """Return the output-channel multiplier of this block (always 1).

        Kept as a plain method because code in this file invokes it through
        the class as ``block.expansion(obj)``.
        """
        return 1

    def __init__(self, in_channel, out_channel, stride=1, downsample=None):
        super(BaicsBlock, self).__init__()
        self.conv1 = nn.Conv2d(in_channels=in_channel,
                               out_channels=out_channel,
                               kernel_size=3,
                               stride=stride,
                               padding=1,
                               bias=False)
        self.bn1 = nn.BatchNorm2d(out_channel)
        self.relu = nn.ReLU(inplace=True)
        # Only the first convolution may downsample. Applying ``stride`` here
        # as well would shrink the main path twice while the shortcut shrinks
        # once, and the residual addition would fail on mismatched shapes.
        self.conv2 = nn.Conv2d(in_channels=out_channel,
                               out_channels=out_channel,
                               kernel_size=3,
                               stride=1,
                               padding=1,
                               bias=False)
        self.bn2 = nn.BatchNorm2d(out_channel)
        self.downsample = downsample

    def forward(self, x):
        """Apply the residual block to ``x`` and return the activated sum."""
        # Shortcut branch: identity unless a projection was supplied.
        identity = x
        if self.downsample is not None:
            identity = self.downsample(x)

        x = self.conv1(x)
        x = self.bn1(x)
        x = self.relu(x)

        x = self.conv2(x)
        x = self.bn2(x)

        x += identity
        x = self.relu(x)

        return x

class Bottleneck(nn.Module):
    """Three-layer bottleneck residual block (used by ResNet50/101/152).

    The main path is conv1x1 -> BN -> ReLU -> conv3x3 -> BN -> ReLU ->
    conv1x1 -> BN; the last convolution widens the feature map to
    ``out_channel * 4`` channels. The shortcut (optionally transformed by
    ``downsample``) is added before the final ReLU.

    Args:
        in_channel: number of channels of the input feature map.
        out_channel: width of the two inner convolutions; the block outputs
            ``out_channel * 4`` channels.
        stride: stride of the 3x3 convolution; values > 1 reduce the spatial
            size.
        downsample: optional module applied to the input so that the shortcut
            matches the main path in channels and spatial size.
    """

    def expansion(self):
        """Return the output-channel multiplier of this block (always 4).

        Kept as a plain method because code in this file invokes it through
        the class as ``block.expansion(obj)``.
        """
        return 4

    # This constructor was previously misnamed ``__bool__``, which made the
    # class impossible to instantiate with arguments.
    def __init__(self, in_channel, out_channel, stride=1, downsample=None):
        super(Bottleneck, self).__init__()
        out_expanded = out_channel * self.expansion()

        # 1x1 convolutions use no padding; padding a 1x1 kernel would grow
        # the feature map by two pixels per side pair.
        self.conv1 = nn.Conv2d(in_channels=in_channel,
                               out_channels=out_channel,
                               kernel_size=1,
                               stride=1,
                               padding=0,
                               bias=False)
        self.bn1 = nn.BatchNorm2d(out_channel)
        self.relu = nn.ReLU(inplace=True)
        self.conv2 = nn.Conv2d(in_channels=out_channel,
                               out_channels=out_channel,
                               kernel_size=3,
                               stride=stride,
                               padding=1,
                               bias=False)
        self.bn2 = nn.BatchNorm2d(out_channel)
        # The last convolution must produce the expanded width so that it
        # agrees with ``bn3`` and with the (projected) shortcut.
        self.conv3 = nn.Conv2d(in_channels=out_channel,
                               out_channels=out_expanded,
                               kernel_size=1,
                               stride=1,
                               padding=0,
                               bias=False)
        self.bn3 = nn.BatchNorm2d(out_expanded)
        self.downsample = downsample

    def forward(self, x):
        """Apply the bottleneck block to ``x`` and return the activated sum."""
        # Shortcut branch: identity unless a projection was supplied.
        identity = x
        if self.downsample is not None:
            identity = self.downsample(x)

        x = self.conv1(x)
        x = self.bn1(x)
        x = self.relu(x)

        x = self.conv2(x)
        x = self.bn2(x)
        x = self.relu(x)

        x = self.conv3(x)
        x = self.bn3(x)

        x += identity
        x = self.relu(x)

        return x

class ResNet(nn.Module):
    """ResNet backbone with an optional classification head.

    The network is a 7x7 stem convolution + max-pool followed by four stages
    of residual blocks (64, 128, 256 and 512 base channels). When
    ``include_top`` is true, global average pooling and a linear classifier
    are appended.

    Args:
        block: residual block class. It is constructed as
            ``block(in_channel, out_channel, stride=..., downsample=...)`` and
            must expose ``expansion`` (output-channel multiplier) either as a
            method or as a plain class attribute.
        block_list: sequence of four ints, the number of blocks per stage.
        num_classes: size of the classifier output (only used with the head).
        include_top: whether to build and apply the pooling + linear head.
    """

    def __init__(self, block, block_list, num_classes=1000, include_top=True):
        super(ResNet, self).__init__()
        self.include_top = include_top
        # Running channel count; updated by make_layer as stages are built.
        self.in_channel = 64

        self.conv1 = nn.Conv2d(in_channels=3,
                               out_channels=self.in_channel,
                               kernel_size=7,
                               stride=2,
                               padding=3,
                               bias=False)
        self.bn1 = nn.BatchNorm2d(self.in_channel)
        self.relu = nn.ReLU(inplace=True)
        # padding=1 makes the pool exactly halve even-sized inputs, matching
        # the reference ResNet stem.
        self.maxpool = nn.MaxPool2d(kernel_size=3, stride=2, padding=1)

        self.layer_1 = self.make_layer(block, 64, block_list[0])
        self.layer_2 = self.make_layer(block, 128, block_list[1], stride=2)
        self.layer_3 = self.make_layer(block, 256, block_list[2], stride=2)
        self.layer_4 = self.make_layer(block, 512, block_list[3], stride=2)
        if self.include_top:
            # The feature map is 4-D (N, C, H, W), so the 2-D adaptive pool is
            # required; the 1-D variant rejects this input.
            self.avgpool = nn.AdaptiveAvgPool2d((1, 1))
            self.fc = nn.Linear(512 * self._block_expansion(block), num_classes)

        for m in self.modules():
            if isinstance(m, nn.Conv2d):
                nn.init.kaiming_normal_(m.weight, mode='fan_out', nonlinearity='relu')

    def _block_expansion(self, block):
        """Return ``block``'s channel multiplier, whether method or attribute."""
        expansion = block.expansion
        if callable(expansion):
            # The blocks in this file define ``expansion`` as an instance
            # method that ignores ``self``; it is called through the class.
            return expansion(self)
        return expansion

    def make_layer(self, block, channel, block_list, stride=1):
        """Build one stage of residual blocks.

        Args:
            block: residual block class.
            channel: base channel width of the stage.
            block_list: number of blocks in this stage (an int, despite the
                name).
            stride: stride of the first block of the stage.

        Returns:
            An ``nn.Sequential`` containing the stage's blocks. As a side
            effect ``self.in_channel`` is set to the stage's output width.
        """
        out_channel = channel * self._block_expansion(block)

        # A projection shortcut is needed whenever the first block changes
        # the spatial size or the channel count.
        downsample = None
        if stride != 1 or self.in_channel != out_channel:
            downsample = nn.Sequential(
                nn.Conv2d(self.in_channel, out_channel, kernel_size=1, stride=stride, bias=False),
                nn.BatchNorm2d(out_channel))

        layers = [block(self.in_channel, channel, downsample=downsample, stride=stride)]
        self.in_channel = out_channel

        # Remaining blocks keep the shape, so they use the identity shortcut.
        for _ in range(1, block_list):
            layers.append(block(self.in_channel, channel))

        return nn.Sequential(*layers)

    def forward(self, x):
        """Run the network; return logits, or the last feature map if headless."""
        x = self.conv1(x)
        x = self.bn1(x)
        x = self.relu(x)
        x = self.maxpool(x)

        x = self.layer_1(x)
        x = self.layer_2(x)
        x = self.layer_3(x)
        x = self.layer_4(x)

        if self.include_top:
            x = self.avgpool(x)
            x = torch.flatten(x, 1)
            x = self.fc(x)

        return x
def ResNet18(num_classes=1000, include_top=True):
    """Build a ResNet from BaicsBlock with stage depths [2, 2, 2, 2]."""
    stage_depths = [2, 2, 2, 2]
    model = ResNet(BaicsBlock, stage_depths,
                   num_classes=num_classes,
                   include_top=include_top)
    return model
def ResNet34(num_classes=1000, include_top=True):
    """Build a ResNet from BaicsBlock with stage depths [3, 4, 6, 3]."""
    stage_depths = [3, 4, 6, 3]
    model = ResNet(BaicsBlock, stage_depths,
                   num_classes=num_classes,
                   include_top=include_top)
    return model
def ResNet50(num_classes=1000, include_top=True):
    """Build a ResNet from Bottleneck with stage depths [3, 4, 6, 3]."""
    stage_depths = [3, 4, 6, 3]
    model = ResNet(Bottleneck, stage_depths,
                   num_classes=num_classes,
                   include_top=include_top)
    return model
def ResNet101(num_classes=1000, include_top=True):
    """Build a ResNet from Bottleneck with stage depths [3, 4, 23, 3]."""
    stage_depths = [3, 4, 23, 3]
    model = ResNet(Bottleneck, stage_depths,
                   num_classes=num_classes,
                   include_top=include_top)
    return model
def ResNet152(num_classes=1000, include_top=True):
    """Build a ResNet from Bottleneck with stage depths [3, 8, 36, 3]."""
    stage_depths = [3, 8, 36, 3]
    model = ResNet(Bottleneck, stage_depths,
                   num_classes=num_classes,
                   include_top=include_top)
    return model

ResNet网络训练（5类花卉分类任务）

from nlp.task.CIFAR10_try.ResNet import ResNet34
import os
import json
import torch
import torch.nn as nn
import torch.optim as optim
from torchvision import transforms, datasets
from tqdm import tqdm
def main():
    """Fine-tune ResNet34 on the flower image-folder dataset.

    Steps performed:
      1. Build train/val ``ImageFolder`` datasets under
         ``<cwd>/../../data_set/flower_data`` and write the index -> class
         name mapping to ``class_indices.json``.
      2. Load the weights in ``./resnet34-pre.pth`` into ``ResNet34`` and
         replace the classifier with one sized for the dataset's classes.
      3. Train with Adam for a fixed number of epochs, validating after each
         epoch and saving the best-accuracy weights to ``./resNet34.pth``.

    Raises:
        FileNotFoundError: if the dataset directory or the pretrained weight
            file is missing.
    """
    device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
    print("using {} device.".format(device))

    data_transform = {
        "train": transforms.Compose([transforms.RandomResizedCrop(224),
                                     transforms.RandomHorizontalFlip(),
                                     transforms.ToTensor(),
                                     transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])]),
        "val": transforms.Compose([transforms.Resize(256),
                                   transforms.CenterCrop(224),
                                   transforms.ToTensor(),
                                   transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])])}

    data_root = os.path.abspath(os.path.join(os.getcwd(), "../.."))
    image_path = os.path.join(data_root, "data_set", "flower_data")
    # Explicit raise instead of assert: asserts are stripped under ``-O``.
    if not os.path.exists(image_path):
        raise FileNotFoundError("{} path does not exist.".format(image_path))

    train_dataset = datasets.ImageFolder(root=os.path.join(image_path, "train"),
                                         transform=data_transform["train"])
    train_num = len(train_dataset)

    # Invert class_to_idx so predictions (indices) can be mapped back to names.
    flower_list = train_dataset.class_to_idx
    cla_dict = {val: key for key, val in flower_list.items()}
    num_classes = len(cla_dict)

    json_str = json.dumps(cla_dict, indent=4)
    with open('class_indices.json', 'w') as json_file:
        json_file.write(json_str)

    batch_size = 16
    # os.cpu_count() may return None when the count is undetermined.
    nw = min([os.cpu_count() or 1, batch_size if batch_size > 1 else 0, 8])
    print('Using {} dataloader workers every process'.format(nw))

    train_loader = torch.utils.data.DataLoader(train_dataset,
                                               batch_size=batch_size, shuffle=True,
                                               num_workers=nw)

    validate_dataset = datasets.ImageFolder(root=os.path.join(image_path, "val"),
                                            transform=data_transform["val"])
    val_num = len(validate_dataset)
    validate_loader = torch.utils.data.DataLoader(validate_dataset,
                                                  batch_size=batch_size, shuffle=False,
                                                  num_workers=nw)

    print("using {} images for training, {} images for validation.".format(train_num,
                                                                           val_num))

    # Build the default (1000-class) network first so that the checkpoint's
    # classifier weights load without a shape mismatch, then swap the head.
    net = ResNet34()
    model_weight_path = "./resnet34-pre.pth"
    if not os.path.exists(model_weight_path):
        raise FileNotFoundError("file {} does not exist.".format(model_weight_path))
    # NOTE(review): torch.load unpickles the file; only load checkpoints that
    # come from a trusted source.
    net.load_state_dict(torch.load(model_weight_path, map_location=device))
    in_channel = net.fc.in_features
    # Size the new head from the dataset (5 for the flower dataset) so the
    # labels can never exceed the classifier's output range.
    net.fc = nn.Linear(in_channel, num_classes)
    net.to(device)

    loss_function = nn.CrossEntropyLoss()
    params = [p for p in net.parameters() if p.requires_grad]
    optimizer = optim.Adam(params, lr=0.0001)

    epochs = 5
    best_acc = 0.0
    save_path = './resNet34.pth'
    train_steps = len(train_loader)
    for epoch in range(epochs):
        # ---- training pass ----
        net.train()
        running_loss = 0.0
        train_bar = tqdm(train_loader)
        for images, labels in train_bar:
            optimizer.zero_grad()
            logits = net(images.to(device))
            loss = loss_function(logits, labels.to(device))
            loss.backward()
            optimizer.step()

            # Convert once to a Python float for both accumulation and display.
            loss_value = loss.item()
            running_loss += loss_value

            train_bar.desc = "train epoch[{}/{}] loss:{:.3f}".format(epoch + 1,
                                                                     epochs,
                                                                     loss_value)

        # ---- validation pass ----
        net.eval()
        acc = 0.0  # number of correctly classified validation images
        with torch.no_grad():
            val_bar = tqdm(validate_loader)
            for val_images, val_labels in val_bar:
                outputs = net(val_images.to(device))

                predict_y = torch.max(outputs, dim=1)[1]
                acc += torch.eq(predict_y, val_labels.to(device)).sum().item()

                val_bar.desc = "valid epoch[{}/{}]".format(epoch + 1,
                                                           epochs)

        val_accurate = acc / val_num
        print('[epoch %d] train_loss: %.3f  val_accuracy: %.3f' %
              (epoch + 1, running_loss / train_steps, val_accurate))

        # Keep only the weights of the best-performing epoch.
        if val_accurate > best_acc:
            best_acc = val_accurate
            torch.save(net.state_dict(), save_path)

    print('Finished Training')

# Run the training routine only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == '__main__':
    main()

Original: https://blog.csdn.net/qq_51778415/article/details/115795522
Author: 殇小气
Title: Pytorch实现ResNet

原创文章受到原创版权保护。转载请注明出处：https://www.johngo689.com/690880/

转载文章受原作者版权保护。转载请注明原作者出处！

人工智能

【自取】最近整理的，有需要可以领取学习：

Linux核心资料大放送~

全栈面试题汇总（持续更新&可下载）

一个提高学习100%效率的工具！

【超详细】深度学习面试题目！

LeetCode Python刷题答案下载！

LeetCode Java版刷题答案下载！

LeetCode C++ 版本，抓紧保存！

LeetCode GO语言刷题答案下载！

OpenCV-Python实战（3）——OpenCV中绘制图形与文本

OpenCV 是一款非常强大的计算机视觉库，其中包含了很多功能强大的图像处理和计算机视觉算法。而在这个系列的第三篇文章中，我们将重点介绍如何在 OpenCV 中…

人工智能 2023年6月18日
00104
机器学习-分类聚类预测系统

这是机器学习课程的一个课设,具体的课设要求如下: 1.熟悉机器学习的完整流程，包括：问题建模，获取数据，特征工程，模型训练，模型调优，线上运行；或者分为三大块：数据准备与预处理，模…

人工智能 2023年5月31日
00107
MATLAB基础教程（10）——二维中的数据可视化

目录 MATLAB数据可视化绘图在同一个figure里面绘制多个图形本期小结 MATLAB数据可视化绘图绘制图形（二维）一般使用plot函数，这个函数一般能满足很多画图的…

人工智能 2023年6月22日
0067
机器学习实战第九章笔记——树回归

目录引言一、复杂数据的局部性建模二、连续和离散型特征的树的构建三、将cart算法用于回归 3.1 构建树编辑四、树剪枝 4.1 预剪枝 4.2 后剪枝五、树模型六、…

人工智能 2023年6月18日
0093
Mediapipe入门——搭建姿态检测模型并实时输出人体关节点3d坐标

一. 引言MediaPipe 是一款由 Google Research 开发并开源的多媒体机器学习模型应用框架。在谷歌，一系列重要产品，如 YouTube、Google Lens、…

人工智能 2023年7月20日
0070
无人机+强化学习开源项目、工具包汇总

写在最前：科研小废物一枚，在搞强化学习+无人机，以下内容均为我的导师在github上给我找到的开源项目/工具包，仅供参考。P.s：目前只是做一个汇总，并没有按个安装与尝试，DDDD…

人工智能 2023年6月16日
0098
机器学习-第2关：信息熵与信息增益

import numpy as np def calcInfoGain(feature, label, index): ”’ 计算信息增益 :param f…

人工智能 2023年7月28日
0073
halcon模板匹配 ——多个不同对象同时匹配

文章目录场景效果实现步骤 * 1.读取图像 2.分别生成两个ROI 3.分别创建各向同性比例缩放形状模板 4.分别获取形状模型的轮廓表示 5.连接两个模板轮廓XLD 6.保存…

人工智能 2023年5月28日
00214
[深度学习理论]通俗理解BatchNormalization

如图所示，对于一层神经网络来说，当神经元(X_2)的range远远大于(X_1)时，加权后得到的输出(a)会极大的收到神经元(W_2*X_2)的影响，即(W_2)的大小会极大的影响…

人工智能 2023年6月6日
0078
人脸识别太常见？好用才行，利尔达推出一体化人脸识别解决方案

人脸识别技术对输入的人脸图像或者视频流进行处理，是一种通过提取每张人脸中的特征信息进行身份鉴别的前沿识别技术。伴随着智能化时代的悄然到来，人脸识别技术日益普及并被大规模地应用于日…

人工智能 2023年7月12日
0051
全连接层tf.keras.layers.Dense()介绍

函数原型 tf.keras.layers.Dense( units, activation=None, use_bias=True, kernel_initializer=’glo…

人工智能 2023年7月13日
0053
【吴恩达deeplearning.ai】Course 5 – 2.5 学习词嵌入

学习词嵌入 (Learning Word Embeddings) 在本节视频中，你将要学习一些具体的算法来学习词嵌入。在深度学习应用于学习词嵌入的历史上，人们一开始使用的算法比较复…

人工智能 2023年5月28日
0096
2022年全球程序员薪资排行出炉：中国倒数第九，GO最赚钱

今年七月，CodeSubmit 统计分析了 27个软件开发比较活跃的国家的程序员的薪资情况，美国、瑞士、以色列位列前三，美国程序员的平均薪资达到了110140美元，折合人民币约80…

人工智能 2023年6月28日
0086
Deformable DETR环境配置和应用

准备工作： Deformable DETR代码路径如下： GitHub – fundamentalvision/Deformable-DETR: Deformable …

人工智能 2023年7月9日
0079
自然语言理解难在哪儿？

自然语言理解任务的本质是结构预测，关键则是对语言单元的语义表示能力。 1.1 自然语言理解本质是结构预测自然语言文本是典型的无结构数据，由语言符号（如汉字）序列构成。要实现对自…

人工智能 2023年5月28日
00105
PyQt5中的QtGui.QImage图片显示问题分析

前言 PyQt是Python语言环境的GUI编程解决方案之一，另外还有PyGTK、wxPython等也较为常用。PyQt作为Qt语言的Python扩展，可以用来方便快速的开发界面应…

人工智能 2023年6月19日
00108

2024 年 5 月
一	二	三	四	五	六	日
		1	2	3	4	5
6	7	8	9	10	11	12
13	14	15	16	17	18	19
20	21	22	23	24	25	26
27	28	29	30	31

Pytorch实现ResNet

大家都在看