Using PyTorch (Python) to implement a CNN for MNIST digit recognition
1. Environment: Anaconda3 64-bit, https://www.anaconda.com/download/
2. Environment: PyCharm Community (free), https://www.jetbrains.com/pycharm/download/#section=windows — after installing, set the Anaconda Python above as PyCharm's interpreter.
3. Environment: PyTorch, installed offline as described at https://zhuanlan.zhihu.com/p/26871672 (download a file such as pytorch-0.1.12-py36_0.1.12cu80.tar.bz2).
4. Environment: conda install torchvision (a quick sketch for verifying the install follows this list).
5. Download the data. Downloading it from the training code is too slow, so the MNIST files were fetched with the Thunder (Xunlei) download manager instead.
6. Convert the data into a format torch can use.
7. Train and test.
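Before going further it is worth confirming that the install works. A minimal check, run with the Anaconda interpreter that PyCharm was pointed at (this snippet is an addition, not part of the original post):

import torch
import torchvision  # just confirming that torchvision imports

print(torch.__version__)          # e.g. 0.1.12 for the offline package above
print(torch.cuda.is_available())  # True if the CUDA build and the driver are usable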
data.py
import os
from skimage import io
import torchvision.datasets.mnist as mnist

"""
Dataset download page:
http://yann.lecun.com/exdb/mnist/
Download and unpack the dataset by hand, check that the file names match the
ones used a few lines below, then run this script.
"""

# Directory that holds the downloaded files:
# F:/!BiliBili/!Py/AI/cnn_bili/mnist_data/train-images-idx3-ubyte
# F:/!BiliBili/!Py/AI/cnn_bili/mnist_data/train-labels-idx1-ubyte
# F:/!BiliBili/!Py/AI/cnn_bili/mnist_data/t10k-images-idx3-ubyte
# F:/!BiliBili/!Py/AI/cnn_bili/mnist_data/t10k-labels-idx1-ubyte
root = "F:/!BiliBili/!Py/AI/cnn_bili/mnist_data/"

# Which files hold the training images and the training labels
train_set = (
    mnist.read_image_file(os.path.join(root, 'train-images-idx3-ubyte')),
    mnist.read_label_file(os.path.join(root, 'train-labels-idx1-ubyte'))
)
# Which files hold the test images and the test labels
test_set = (
    mnist.read_image_file(os.path.join(root, 't10k-images-idx3-ubyte')),
    mnist.read_label_file(os.path.join(root, 't10k-labels-idx1-ubyte'))
)

# Print how many training and test samples there are
print("training set :", train_set[0].size())
print("test set :", test_set[0].size())

# Convert the raw data to .jpg images, put them into a folder, and write a
# text file listing "image_path label" per line.
def convert_to_img(train=True):
    if train:  # training data
        # Note the path style: forward slashes
        f = open(root + 'train.txt', 'w')
        data_path = root + '/train/'  # root already ends with '/', so this extra one could be dropped
        # Create F:/!BiliBili/!Py/AI/cnn_bili/mnist_data//train/ if it does not exist
        if not os.path.exists(data_path):
            os.makedirs(data_path)
        # enumerate pairs each (img, label) with a running index i (start=2 would start the index at 2)
        for i, (img, label) in enumerate(zip(train_set[0], train_set[1])):
            img_path = data_path + str(i) + '.jpg'
            # Save the image
            io.imsave(img_path, img.numpy())
            # Write "image_path label"; int(label) keeps the file readable even if
            # label is a tensor rather than a plain Python int
            f.write(img_path + ' ' + str(int(label)) + '\n')
        f.close()
    else:  # test data
        f = open(root + 'test.txt', 'w')
        data_path = root + '/test/'
        if not os.path.exists(data_path):
            os.makedirs(data_path)
        for i, (img, label) in enumerate(zip(test_set[0], test_set[1])):
            img_path = data_path + str(i) + '.jpg'
            io.imsave(img_path, img.numpy())
            f.write(img_path + ' ' + str(int(label)) + '\n')
        f.close()

print("Building training set...")
convert_to_img(True)
print("Building test set...")
convert_to_img(False)
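Once data.py has run, every digit sits as a small .jpg under train/ or test/, and train.txt / test.txt list one "image_path label" pair per line, which is exactly what read_cnn.py below expects. A small sanity check, assuming the same root as above (this snippet is an addition, not part of the original code):

from PIL import Image

root = "F:/!BiliBili/!Py/AI/cnn_bili/mnist_data/"

with open(root + 'train.txt') as f:
    first_line = f.readline().strip()
print(first_line)                 # e.g. ".../train/0.jpg 5" -> image path, then label

img = Image.open(first_line.split()[0])
print(img.size, img.mode)         # expected: (28, 28) and a grayscale mode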
read_cnn.py
import torch
from torch.autograd import Variable
from torchvision import transforms
from torch.utils.data import Dataset, DataLoader
from PIL import Image

root = "F:/!BiliBili/!Py/AI/cnn_bili/mnist_data/"

# ----------------- Prepare the data --------------------------
def default_loader(path):
    return Image.open(path).convert('RGB')

class MyDataset(Dataset):
    # txt is the path of the "image_path label" list written by data.py
    def __init__(self, txt, transform=transforms.ToTensor(), target_transform=None, loader=default_loader):
        fh = open(txt, 'r')  # open read-only
        imgs = []
        for line in fh:
            line = line.strip('\n')  # drop the trailing newline
            line = line.rstrip()     # drop trailing whitespace
            words = line.split()     # two columns: column 0 is the path, column 1 is the label
            imgs.append((words[0], int(words[1])))
        self.imgs = imgs
        self.transform = transform
        self.target_transform = target_transform
        self.loader = loader  # a function that loads one image

    # Called by the DataLoader to fetch one sample
    def __getitem__(self, index):
        fn, label = self.imgs[index]  # fn is the full path, label is the digit
        img = self.loader(fn)         # default_loader(path) above: read the image from disk
        if self.transform is not None:
            img = self.transform(img)  # convert the image to a FloatTensor
        return img, label

    def __len__(self):
        return len(self.imgs)
# ----------------- Build the network and train it ------------------------
class Net(torch.nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.conv1 = torch.nn.Sequential(
            # 3 channels in, 32 out, 3x3 kernel, 1x1 stride
            # (the digits are actually grayscale, but they were saved and reloaded as RGB)
            # Conv2d(in_channels, out_channels, kernel_size, stride=1, padding=0, dilation=1, groups=1, bias=True)
            torch.nn.Conv2d(3, 32, kernel_size=(3, 3), stride=(1, 1)),
            # Activation
            torch.nn.ReLU(),
            # 2x2 max pooling (downsampling), stride 2x2, dilation 1x1 (no dilation)
            # MaxPool2d(kernel_size, stride=None, padding=0, dilation=1, return_indices=False, ceil_mode=False)
            torch.nn.MaxPool2d(kernel_size=(2, 2), stride=(2, 2), dilation=(1, 1))
        )
        self.conv2 = torch.nn.Sequential(
            torch.nn.Conv2d(32, 64, 3, 1, 1),
            torch.nn.ReLU(),
            torch.nn.MaxPool2d(2)
        )
        self.conv3 = torch.nn.Sequential(
            torch.nn.Conv2d(64, 64, 3, 1, 1),
            torch.nn.ReLU(),
            torch.nn.MaxPool2d(2)
        )
        self.dense = torch.nn.Sequential(
            # Fully connected layer: 64*3*3 inputs, 128 outputs
            torch.nn.Linear(64 * 3 * 3, 128),
            torch.nn.ReLU(),
            # Fully connected layer: 128 inputs, 10 outputs (one per digit)
            torch.nn.Linear(128, 10)
        )

    # Forward pass on input x
    def forward(self, x):
        # Output of the first block: x passed through conv1
        conv1_out = self.conv1(x)
        # Output of the second block: conv1's output passed through conv2
        conv2_out = self.conv2(conv1_out)
        # Output of the third block: conv2's output passed through conv3
        conv3_out = self.conv3(conv2_out)
        # Flatten to (batch_size, 64*3*3) before the fully connected layers
        res = conv3_out.view(conv3_out.size(0), -1)
        return self.dense(res)
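# Shape walkthrough (added note, assuming the 28x28 MNIST images produced by data.py):
#   input                  : (N, 3, 28, 28)
#   conv1: 3x3, no padding -> (N, 32, 26, 26); 2x2 max pool -> (N, 32, 13, 13)
#   conv2: 3x3, padding 1  -> (N, 64, 13, 13); 2x2 max pool -> (N, 64, 6, 6)
#   conv3: 3x3, padding 1  -> (N, 64, 6, 6);   2x2 max pool -> (N, 64, 3, 3)
#   flatten                -> (N, 64*3*3), which is why the first Linear layer takes 64 * 3 * 3 inputs.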
def read_cnn():
    print("Reading train_data...")
    train_data = MyDataset(txt=root + 'train.txt', transform=transforms.ToTensor())
    # DataLoader comes from torch.utils.data (imported above)
    train_loader = DataLoader(dataset=train_data, batch_size=50, shuffle=True)

    print("Reading test_data...")
    test_data = MyDataset(txt=root + 'test.txt', transform=transforms.ToTensor())
    test_loader = DataLoader(dataset=test_data, batch_size=50)

    # GPU or CPU
    if torch.cuda.is_available():
        is_cuda = True
        print("work on GPU")
    else:
        is_cuda = False
        print("work on CPU")

    print("Setup Net...")
    # =============================cuda()=======================
    if is_cuda:
        model = Net().cuda()
    else:
        model = Net()
    # Print the network structure
    print(model)

    # Adam, a stochastic gradient-based optimizer
    optimizer = torch.optim.Adam(model.parameters())
    # Standard cross-entropy loss for multi-class classification
    loss_func = torch.nn.CrossEntropyLoss()

    for epoch in range(3):  # number of training epochs
        print('epoch {}'.format(epoch + 1))
        # Training -----------------------------
        model.train()  # back to training mode (a no-op for this net, but good practice after model.eval())
        train_loss = 0.
        train_acc = 0.
        for batch_x, batch_y in train_loader:  # images, labels
            # =============================cuda()=======================
            if is_cuda:
                batch_x, batch_y = Variable(batch_x).cuda(), Variable(batch_y).cuda()
            else:
                batch_x, batch_y = Variable(batch_x), Variable(batch_y)
            out = model(batch_x)            # forward pass of batch_x through the network
            loss = loss_func(out, batch_y)  # loss between the predictions out and the labels batch_y
            train_loss += loss.data[0]      # accumulate the training loss
            # =============================cuda()=======================
            if is_cuda:
                pred = torch.max(out, 1)[1].cuda()  # index of the largest score along dim 1 = predicted digit
            else:
                pred = torch.max(out, 1)[1]
            train_correct = (pred == batch_y).sum()  # number of correct predictions in this batch
            train_acc += train_correct.data[0]       # accumulate the number of correct predictions
            optimizer.zero_grad()  # clear the gradients of all optimized parameters
            loss.backward()        # backpropagate the error
            optimizer.step()       # one optimization step
        # With large datasets six decimal places may not be enough
        # print('Train Loss: {:.6f}, Acc: {:.6f}'.format(train_loss / (len(train_data)), train_acc / (len(train_data))))
        print('Train Acc: {:.6f}'.format(train_acc / (len(train_data))))

        # Evaluation --------------------------------
        model.eval()  # switch to evaluation mode; affects Dropout and BatchNorm layers
        eval_loss = 0.
        eval_acc = 0.
        for batch_x, batch_y in test_loader:  # images, labels
            # =============================cuda()=======================
            if is_cuda:
                batch_x, batch_y = Variable(batch_x, volatile=True).cuda(), Variable(batch_y, volatile=True).cuda()
            else:
                batch_x, batch_y = Variable(batch_x, volatile=True), Variable(batch_y, volatile=True)
            out = model(batch_x)
            loss = loss_func(out, batch_y)
            eval_loss += loss.data[0]
            # =============================cuda()=======================
            if is_cuda:
                pred = torch.max(out, 1)[1].cuda()
            else:
                pred = torch.max(out, 1)[1]
            num_correct = (pred == batch_y).sum()
            eval_acc += num_correct.data[0]
        # print('Test Loss: {:.6f}, Acc: {:.6f}'.format(eval_loss / (len(test_data)), eval_acc / (len(test_data))))
        print('Test Acc: {:.6f}'.format(eval_acc / (len(test_data))))

if __name__ == '__main__':
    read_cnn()
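The script above deliberately uses the old PyTorch 0.1.x API (Variable, volatile=True, loss.data[0]), matching the offline package from step 3. On PyTorch 0.4 and newer those idioms are removed or deprecated; as a rough sketch (an addition to the post, assuming test_data and test_loader are built the same way as inside read_cnn()), the evaluation loop would instead look like this:

# Hypothetical PyTorch >= 0.4 version of the evaluation loop (not part of the original script)
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
model = Net().to(device)
loss_func = torch.nn.CrossEntropyLoss()

model.eval()
eval_loss, eval_acc = 0.0, 0
with torch.no_grad():                                 # replaces volatile=True
    for batch_x, batch_y in test_loader:
        batch_x, batch_y = batch_x.to(device), batch_y.to(device)
        out = model(batch_x)
        eval_loss += loss_func(out, batch_y).item()   # .item() replaces loss.data[0]
        pred = torch.max(out, 1)[1]                   # predicted digit for each image
        eval_acc += (pred == batch_y).sum().item()
print('Test Acc: {:.6f}'.format(eval_acc / len(test_data)))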
Honestly, this post is not written for complete beginners; it will mostly help readers who already know the underlying concepts.