PyTorch学习笔记（5）–mnist数据集训练

2023年7月14日上午1:40 • 人工智能 • 阅读 49

from __future__ import print_function
import os
import struct
import numpy as np
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.autograd import Variable
import torch.optim as optim
import matplotlib.pyplot as plt
def load_mnist(path,kind='train'):
    """Load one MNIST split (images and labels) from raw IDX files.

    Args:
        path: Directory that holds the extracted MNIST files.
        kind: File-name prefix of the split, e.g. ``'train'`` or ``'t10k'``.

    Returns:
        A tuple ``(images, labels)``. ``images`` is a uint8 array with one
        flattened image per row (``rows*cols`` columns, taken from the image
        file header); ``labels`` is a 1-D uint8 array.

    Raises:
        OSError: If a data file cannot be opened.
        ValueError: If the amount of pixel data does not match the number of
            labels times the image size declared in the header.
    """
    def _resolve(name):
        # Some archive tools extract each file into a directory of the same
        # name (<path>/<name>/<name>); others leave it directly in <path>.
        # Keep preferring the nested layout and fall back to the flat one
        # only when that is where the file actually is.
        nested=os.path.join(path,name,name)
        flat=os.path.join(path,name)
        if not os.path.isfile(nested) and os.path.isfile(flat):
            return flat
        return nested

    labels_path=_resolve('%s-labels.idx1-ubyte'%kind)
    images_path=_resolve('%s-images.idx3-ubyte'%kind)
    with open(labels_path,'rb') as lbpath:
        # Label header: magic number and item count (big-endian uint32 each).
        _magic,_count=struct.unpack('>II',lbpath.read(8))
        labels=np.fromfile(lbpath,dtype=np.uint8)
    with open(images_path,'rb') as imgpath:
        # Image header: magic number, image count, rows, cols.
        _magic,_num,rows,cols=struct.unpack(">IIII",imgpath.read(16))
        # Use the image size from the header instead of a hard-coded 784.
        images=np.fromfile(imgpath,dtype=np.uint8).reshape(len(labels),rows*cols)
    return images,labels
# Load both splits; the IDX files are expected under ./data.
X_train,y_train =load_mnist('./data',kind='train')
print('Rows:%d,columns:%d'%(X_train.shape[0],X_train.shape[1]))
X_test,y_test=load_mnist('./data',kind='t10k')
# Report the test split here (previously the training shape was printed twice).
print('Rows:%d,columns:%d'%(X_test.shape[0],X_test.shape[1]))

# Hyper-parameters.
batch_size=100
num_classes=10
epochs=2
# input image dimensions
img_rows,img_cols =28,28

# Histories filled in by train()/test() and plotted at the end of the script.
train_losses=[]
test_losses=[]
test_counter=[]
train_counter=[]

# PyTorch convolutions take channels-first input, so the flat rows are
# reshaped to (samples, channels, height, width).
x_train=X_train.reshape(X_train.shape[0],1,img_rows,img_cols)
x_test=X_test.reshape(X_test.shape[0],1,img_rows,img_cols)
input_shape=(1,img_rows,img_cols)

# Scale the uint8 pixel values to float32 in [0, 1].
x_train=x_train.astype('float32')
x_test=x_test.astype('float32')
x_train/=255
x_test/=255

print('x_train shape:',x_train.shape)
print(x_train.shape[0],'x_train samples')
print(y_train.shape[0],'y_train samples')
print(x_test.shape[0],'x_test samples')
print(y_test.shape[0],'y_test samples')
num_samples=x_train.shape[0]
print("num_samples:",num_samples)
'''
build torch model
'''
class Net(nn.Module):
    """Small CNN for 1x28x28 digit images that outputs 10 log-probabilities.

    Layer order: conv(1->10, 5x5) -> max-pool 2 -> ReLU -> conv(10->20, 5x5)
    -> Dropout2d -> max-pool 2 -> ReLU -> fc(320->50) -> ReLU -> dropout
    -> fc(50->10) -> log-softmax.

    NOTE: earlier revisions skipped ``conv2`` in ``forward`` and sized ``fc1``
    for 10*6*6 inputs; a whole-model checkpoint pickled from such a revision
    does not match this ``forward`` and has to be retrained.
    """
    def __init__(self):
        super(Net,self).__init__()
        # Two 5x5 convolutions: 1 -> 10 channels, then 10 -> 20 channels.
        self.conv1=nn.Conv2d(1,10,kernel_size=5)
        self.conv2=nn.Conv2d(10,20,kernel_size=5)
        # Channel-wise dropout applied to the output of conv2.
        self.conv2_drop=nn.Dropout2d()
        # Spatial size: 28 -conv5-> 24 -pool2-> 12 -conv5-> 8 -pool2-> 4,
        # with 20 channels, so the flattened feature size is 20*4*4 = 320.
        self.fc1=nn.Linear(20*4*4,50)
        self.fc2=nn.Linear(50,10)
    def forward(self,x):
        """Return per-class log-probabilities for a batch ``x`` of shape (N, 1, 28, 28)."""
        x=F.relu(F.max_pool2d(self.conv1(x),2))
        # conv2 must actually be applied before its dropout layer; it used to
        # be skipped, which left it untrained.
        x=F.relu(F.max_pool2d(self.conv2_drop(self.conv2(x)),2))
        # Flatten everything except the batch dimension.
        x=x.view(-1,20*4*4)
        x=F.relu(self.fc1(x))
        x=F.dropout(x,training=self.training)
        x=self.fc2(x)
        # log-softmax output pairs with F.nll_loss during training.
        return F.log_softmax(x,dim=1)
# Build a fresh network, then resume from the checkpoint of an earlier run
# when one is present in the working directory.
model=Net()
checkpoint_file='mnist_torch.pkl'
if os.path.exists(checkpoint_file):
    # NOTE(review): torch.load unpickles a complete model object here;
    # only load checkpoint files you trust.
    model=torch.load(checkpoint_file)
print(model)

# ---- training ----
# SGD with momentum over all parameters of the (possibly restored) model.
optimizer=optim.SGD(model.parameters(),lr=0.01,momentum=0.5)
def train(epoch,x_train,y_train):
    """Run one training epoch over ``x_train``/``y_train`` in mini-batches.

    Uses the module-level ``model``, ``optimizer`` and ``batch_size``. Every
    tenth batch the loss is printed and appended to ``train_losses``, and the
    number of examples seen so far is appended to ``train_counter``. The
    whole model is saved to ``mnist_torch.pkl`` when the epoch finishes.

    Args:
        epoch: 1-based epoch number, used for logging and for the counter.
        x_train: Tensor of training inputs, indexed by sample along dim 0.
        y_train: Tensor of class labels aligned with ``x_train``.
    """
    total=len(x_train)
    # Only full batches are processed; a trailing partial batch is skipped.
    num_batchs=total//batch_size
    model.train()
    for k in range(num_batchs):
        start,end=k*batch_size,(k+1)*batch_size
        # Plain tensor slices; the deprecated Variable wrapper is not needed.
        data,target=x_train[start:end],y_train[start:end]
        optimizer.zero_grad()
        output=model(data)
        loss=F.nll_loss(output,target)
        loss.backward()
        optimizer.step()
        if k%10==0:
            # Progress is the fraction of batches done (it used to be divided
            # by the sample count, so it never got past 1%).
            print('Train Epoch:{}[{}/{}({:.0f}%)]\tLoss:{:.6f}'.format(epoch,k*len(data),total,100.*k/num_batchs,loss.item()))
            train_losses.append(loss.item())
            # Examples seen so far = all earlier epochs + batches of this epoch.
            train_counter.append(k*batch_size+(epoch-1)*total)
    torch.save(model,'mnist_torch.pkl')

'''
evaluate
'''
def test(epoch):
    """Evaluate the module-level ``model`` on ``x_test``/``y_test``.

    Appends the mean negative log-likelihood loss to ``test_losses`` and the
    number of training examples seen after ``epoch`` epochs to
    ``test_counter``, then prints the loss and the accuracy.

    Args:
        epoch: 1-based number of the epoch that has just finished training.
    """
    model.eval()
    # The forward pass itself has to run under no_grad; previously only the
    # tensor wrapping was inside the context, so a graph was still built.
    with torch.no_grad():
        output=model(x_test)
        # nll_loss averages over the batch by default, so this is already
        # the mean loss over the whole test set.
        test_loss=F.nll_loss(output,y_test).item()
        # Index of the largest log-probability is the predicted class.
        pred=output.max(1)[1]
        correct=pred.eq(y_test).sum().item()
    test_losses.append(test_loss)
    # x-position on the 'training examples seen' axis of the final plot.
    test_counter.append(epoch*num_samples)
    print('\nTest set:Average loss:{:.4f},Accuracy:{}/{}({:.0f}%)\n'.format(test_loss,correct,len(x_test),100.*correct/len(x_test)))
# Convert the NumPy arrays to tensors: float inputs and int64 class labels.
x_train=torch.from_numpy(x_train).float()
x_test=torch.from_numpy(x_test).float()
y_train=torch.from_numpy(y_train).long()
y_test=torch.from_numpy(y_test).long()
# range() excludes its upper bound, so epochs+1 is needed to run all
# `epochs` epochs (range(1,epochs) stopped one epoch early).
for epoch in range(1,epochs+1):
    train(epoch,x_train,y_train)
    test(epoch)
# ---- plotting ----
# Training loss is drawn as a curve and the test loss as red markers, both
# against the counters recorded during training and evaluation.
fig=plt.figure()
plt.plot(train_counter,train_losses,color='blue',label='Train Loss')
plt.scatter(test_counter,test_losses,color='red',label='Test Loss')
plt.legend(loc='upper right')
plt.xlabel('number of training examples seen')
plt.ylabel('negative log likelihood loss')
plt.show()

得到结果：（多次训练后的结果，每次训练得到的结果不同）

Rows:60000,columns:784
Rows:60000,columns:784
x_train shape: (60000, 1, 28, 28)
60000 x_train samples
60000 y_train samples
10000 x_test samples
10000 y_test samples
num_samples: 60000
Net(
(conv1): Conv2d(1, 10, kernel_size=(5, 5), stride=(1, 1))
(conv2): Conv2d(10, 20, kernel_size=(5, 5), stride=(1, 1))
(conv2_drop): Dropout2d(p=0.5, inplace=False)
(fc1): Linear(in_features=360, out_features=50, bias=True)
(fc2): Linear(in_features=50, out_features=10, bias=True)
)
Train Epoch:1[0/60000(0%)] Loss:0.378188
Train Epoch:1[1000/60000(0%)] Loss:0.766636
Train Epoch:1[2000/60000(0%)] Loss:0.662513
Train Epoch:1[3000/60000(0%)] Loss:0.674844
Train Epoch:1[4000/60000(0%)] Loss:0.374800
Train Epoch:1[5000/60000(0%)] Loss:0.466920
Train Epoch:1[6000/60000(0%)] Loss:0.474571
Train Epoch:1[7000/60000(0%)] Loss:0.589114
Train Epoch:1[8000/60000(0%)] Loss:0.557918
Train Epoch:1[9000/60000(0%)] Loss:0.316381
Train Epoch:1[10000/60000(0%)] Loss:0.515177
Train Epoch:1[11000/60000(0%)] Loss:0.336269
Train Epoch:1[12000/60000(0%)] Loss:0.458744
Train Epoch:1[13000/60000(0%)] Loss:0.630309
Train Epoch:1[14000/60000(0%)] Loss:0.698837
Train Epoch:1[15000/60000(0%)] Loss:0.519987
Train Epoch:1[16000/60000(0%)] Loss:0.631619
Train Epoch:1[17000/60000(0%)] Loss:0.646146
Train Epoch:1[18000/60000(0%)] Loss:0.692150
Train Epoch:1[19000/60000(0%)] Loss:0.635705
Train Epoch:1[20000/60000(0%)] Loss:0.465035
Train Epoch:1[21000/60000(0%)] Loss:0.415029
Train Epoch:1[22000/60000(0%)] Loss:0.412988
Train Epoch:1[23000/60000(0%)] Loss:0.583587
Train Epoch:1[24000/60000(0%)] Loss:0.593450
Train Epoch:1[25000/60000(0%)] Loss:0.530810
Train Epoch:1[26000/60000(0%)] Loss:0.570838
Train Epoch:1[27000/60000(0%)] Loss:0.474587
Train Epoch:1[28000/60000(0%)] Loss:0.456399
Train Epoch:1[29000/60000(0%)] Loss:0.559481
Train Epoch:1[30000/60000(0%)] Loss:0.441676
Train Epoch:1[31000/60000(1%)] Loss:0.546501
Train Epoch:1[32000/60000(1%)] Loss:0.662970
Train Epoch:1[33000/60000(1%)] Loss:0.598461
Train Epoch:1[34000/60000(1%)] Loss:0.529693
Train Epoch:1[35000/60000(1%)] Loss:0.492719
Train Epoch:1[36000/60000(1%)] Loss:0.541546
Train Epoch:1[37000/60000(1%)] Loss:0.877233
Train Epoch:1[38000/60000(1%)] Loss:0.443502
Train Epoch:1[39000/60000(1%)] Loss:0.315365
Train Epoch:1[40000/60000(1%)] Loss:0.523321
Train Epoch:1[41000/60000(1%)] Loss:0.494766
Train Epoch:1[42000/60000(1%)] Loss:0.587744
Train Epoch:1[43000/60000(1%)] Loss:0.607159
Train Epoch:1[44000/60000(1%)] Loss:0.575720
Train Epoch:1[45000/60000(1%)] Loss:0.761669
Train Epoch:1[46000/60000(1%)] Loss:0.535713
Train Epoch:1[47000/60000(1%)] Loss:0.402516
Train Epoch:1[48000/60000(1%)] Loss:0.527466
Train Epoch:1[49000/60000(1%)] Loss:0.652991
Train Epoch:1[50000/60000(1%)] Loss:0.438617
Train Epoch:1[51000/60000(1%)] Loss:0.314596
Train Epoch:1[52000/60000(1%)] Loss:0.697034
Train Epoch:1[53000/60000(1%)] Loss:0.533702
Train Epoch:1[54000/60000(1%)] Loss:0.569537
Train Epoch:1[55000/60000(1%)] Loss:0.375768
Train Epoch:1[56000/60000(1%)] Loss:0.473715
Train Epoch:1[57000/60000(1%)] Loss:0.612956
Train Epoch:1[58000/60000(1%)] Loss:0.484374
Train Epoch:1[59000/60000(1%)] Loss:0.285547
Test set:Average loss:0.1313,Accuracy:9600/10000(96%)

得到train_loss曲线和test_loss点：

读者自己跑代码时若遇到问题：

PermissionError: [Errno 13] Permission denied: './data\train-labels.idx1-ubyte'

请读者移步至笔者所写的另一篇博客：《解决PermissionError: [Errno 13] Permission denied: './data\train-labels.idx1-ubyte'》（CSDN，作者：别管我啦就是说）：https://blog.csdn.net/m0_61385981/article/details/124309779?spm=1001.2014.3001.5502

若读者需要查看mnist数据集内容：

import os
import cv2
# Write every training image to ./img/<index>.jpg for visual inspection.
# The target directory is created first so the writes have somewhere to go.
os.makedirs('./img',exist_ok=True)
for i in range(len(X_train)):
    image1 = X_train[i]
    image1 = image1.astype('float32')
    # Each row of X_train is a flattened 28x28 image; restore height x width x 1.
    image1 = image1.reshape(28, 28, 1)
    cv2.imwrite('./img/'+str(i)+".jpg", image1)

mnist数据集下载网址：

http://yann.lecun.com/exdb/mnist/

参考书籍：《PyTorch深度学习实战》

Original: https://blog.csdn.net/m0_61385981/article/details/124335227
Author: 别管我啦就是说
Title: PyTorch学习笔记（5）–mnist数据集训练

原创文章受到原创版权保护。转载请注明出处：https://www.johngo689.com/691040/

转载文章受原作者版权保护。转载请注明原作者出处！

人工智能

【自取】最近整理的，有需要可以领取学习：

Linux核心资料大放送~

全栈面试题汇总（持续更新&可下载）

一个提高学习100%效率的工具！

【超详细】深度学习面试题目！

LeetCode Python刷题答案下载！

LeetCode Java版刷题答案下载！

LeetCode C++ 版本，抓紧保存！

LeetCode GO语言刷题答案下载！

特征工程-2-文本表示模型

TF-IDF（term frequency–inverse document frequency）是一种用于信息检索与数据挖掘的常用加权技术，常用于挖掘文章中的关键词，而且算法简单…

人工智能 2023年6月4日
0075
利用Jupyter Notebook进行科学计算和数据分析

Jupyter Notebook Jupyter Notebook 作为一个编辑器，非常的受欢迎。它的代码和输出结果都保存在同一个文件中。需要时直接发一个文件就能在其它电脑快速运行…

人工智能 2023年7月15日
00130
DataFrame索引的创建与基础用法

DataFrame 是一个表格型的数据结构（数据框），它含有一组有序的列，每列可以是不同的数据类型。DataFrame 既有行索引，也有列索引，可以看作是由多个Series索引组成…

人工智能 2023年7月16日
0064
模式识别使用Fish分类算法和感知器分类算法——数据集可视化和特征选择

一、数据集简介本次实验所选取的数据集为：CORK_STOPPERS.xls数据集，即软木塞数据集。该数据即可在《模式识别》第三版书中的链接下载，也可在我的主页内下载。下图为本…

人工智能 2023年7月17日
0087
【论文&模型讲解】CLIP（Learning Transferable Visual Models From Natural Language Supervision）

文章目录前言 0 摘要 1 Introduction and Motivating Work 2 Approach * 2.0 模型整体结构 2.1 数据集 2.2 选择一种高效…

人工智能 2023年7月27日
00112
人工智能相关技术将首先在互联网行业开始应用，然后陆续普及到其他行业

人工智能（Artificial Intelligence），英文缩写为AI 。它是研究、开发用于模拟、延伸和扩展人的智能的理论、方法、技术及应用系统的一门新的技术科学。一、人工智…

人工智能 2023年7月17日
0069
目标检测算法——YOLOv5/YOLOv7改进之结合MobileOne结构

>>>深度学习Tricks，第一时间送达<<< 目录 1.MobileOne: 移动端仅需1ms的高性能骨干！ 2.MobileOne bloc…

人工智能 2023年7月10日
0066
一文了解Linux内核的Oops

什么是Oops？从语言学的角度说，Oops应该是一个拟声词。当出了点小事故，或者做了比较尴尬的事之后，你可以说”Oops”，翻译成中国话就叫做”…

人工智能 2023年6月28日
00107
全网最全Linux命令总结！！（史上最全，建议收藏）

大家好，我是冰河~~ 最近家里的事情太多了，很久没更新技术文了。期间，也收到了很多小伙伴的鼓励，谢谢大家的帮助和支持，我想感谢大家最好的方式就是持续分享好的技术文章了吧，让自己和他…

人工智能 2023年6月19日
0083
趁热打铁，再构建百万节点关系中药方剂知识图谱

趁热打铁，再构建百万节点关系中药方剂知识图谱前文自顶向下构建中药知识图谱初探中，已经介绍了知识图谱和中药知识图谱构建的相关基础概念，本文将研究中药方剂数据，趁热打铁，再构建百万节…

人工智能 2023年6月1日
0082
python生成requirements.txt文件

一、什么是requirements.txt文件及作用二、怎么生成requirements.txt 文件 1、pip freeze方法（不推荐）终端使用命令： 2、pipreqs…

人工智能 2023年7月4日
0051
逻辑回归算法深度思考-优点和缺点

之前《python信用评分卡建模（附代码）》介绍了逻辑回归评分卡模型的各个细节，包括各种分箱方法，woe和iv原理和Excel保姆级推导，变量badrate单调性，坏客户定义，逻辑…

人工智能 2023年6月17日
0087
《实战》基于tensorflow搭建逻辑回归模型

本次实战，主要要学习完成，通过tesorflow搭建一个逻辑回归模型，通过逻辑回归模型，来完成Mnist数据集的分类任务。 Mnist数据集，在tensorflow中就有，需要将其…

人工智能 2023年5月24日
0061
【计算机视觉】数字图像处理（五）—— 图像的退化与复原

数字图像处理（五）—— 图像的退化与复原 * – 一、图像退化 – + 图像退化的定义： – 二、图像复原 – + （一）、图像复原…

人工智能 2023年5月28日
0074
使用K-means算法进行聚类分析

本文将介绍如何使用 K-means 算法对给定的坐标数据进行聚类分析。使用K-means算法进行聚类分析问题描述 K-means算法对data中数据进行聚类分析（1）算法原理描…

人工智能 2023年5月31日
00116
Code For Better 谷歌开发者之声 ——Tensorflow与深度学习

给大家推荐一款丧心病狂的API测试工具：Apifox。Apifox 是接口管理、开发、测试全流程集成工具，定位 Postman + Swagger + Mock + JMeter。…

人工智能 2023年6月16日
0094

2024 年 5 月
一	二	三	四	五	六	日
		1	2	3	4	5
6	7	8	9	10	11	12
13	14	15	16	17	18	19
20	21	22	23	24	25	26
27	28	29	30	31

PyTorch学习笔记（5）–mnist数据集训练

大家都在看