使用 PyTorch 实现 CNN 模型进行多分类(MNIST)

使用的数据集:MNIST

import torch 
import numpy as np
import pandas as pd
import torch.nn as nn
import torch.nn.functional as F
import matplotlib.pyplot as plt
from torch.utils.data import Dataset
from torch.utils.data import DataLoader
from torchvision.datasets import MNIST
from torch.utils.data import random_split
from torch.utils.data import TensorDataset
import torchvision.transforms as transforms

# CNN model definition (two conv/ReLU/max-pool stages plus a linear classifier).
class Net(nn.Module):
    """Small convolutional classifier for single-channel 28x28 images.

    Layout:
        conv1: Conv2d(1 -> 16, 5x5, stride 1, padding 2) -> ReLU -> MaxPool(2)
        conv2: Conv2d(16 -> 32, 5x5, stride 1, padding 2) -> ReLU -> MaxPool(2)
        out:   Linear(32 * 7 * 7 -> 10)

    The padded 5x5 convolutions keep the spatial size and each pooling step
    halves it, so a 28x28 input reaches the linear layer as 32 maps of 7x7.
    """

    def __init__(self):
        super().__init__()
        # Stage 1: 1 -> 16 channels, 28x28 -> 14x14 after pooling.
        self.conv1 = nn.Sequential(
            nn.Conv2d(
                in_channels=1,
                out_channels=16,
                kernel_size=5,
                stride=1,
                padding=2,
            ),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2),
        )
        # Stage 2: 16 -> 32 channels, 14x14 -> 7x7 after pooling.
        self.conv2 = nn.Sequential(
            nn.Conv2d(16, 32, 5, 1, 2),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2),
        )
        # Classification head producing one logit per class.
        self.out = nn.Linear(32 * 7 * 7, 10)

    def forward(self, x):
        """Return class logits of shape (batch, 10).

        Args:
            x: input tensor of shape (batch, 1, 28, 28).

        Raises:
            RuntimeError: if the spatial size of ``x`` does not reduce to
                7x7, because the flattened features then no longer match
                the linear layer.
        """
        x = self.conv1(x)
        x = self.conv2(x)
        # Flatten every sample on its own. Unlike view(-1, 32 * 7 * 7) this
        # never folds surplus features of a wrongly sized image into extra
        # batch rows, so shape mistakes surface as an error in self.out.
        x = torch.flatten(x, start_dim=1)
        return self.out(x)
        

# Mini-batch size shared by the training and the test loader.
batch_size = 64

# Convert each image to a tensor, then normalize it with
# mean 0.1307 and standard deviation 0.3081.
transform = transforms.Compose(
    [
        transforms.ToTensor(),
        transforms.Normalize((0.1307,), (0.3081,)),
    ]
)

# Training split, served in shuffled mini-batches.
train_dataset = MNIST(
    root=r'C:/Users/Administrator/Desktop/data/',
    train=True,
    download=True,
    transform=transform,
)
train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)

# Test split, loaded with the same transform and batch size.
test_dataset = MNIST(
    root=r'C:/Users/Administrator/Desktop/data/',
    train=False,
    download=True,
    transform=transform,
)
test_loader = DataLoader(test_dataset, batch_size=batch_size, shuffle=True)
# Build the network and print its layer structure.
model = Net()
print(model)

# Cross-entropy loss, optimized by SGD with momentum.
criterion = nn.CrossEntropyLoss()
optimizer = torch.optim.SGD(model.parameters(), lr=0.01, momentum=0.5)

# Loss values sampled during training, used for the curve below.
loss_list = []
for epoch in range(10):
    for step, (images, labels) in enumerate(train_loader):
        # Clear gradients left over from the previous step.
        optimizer.zero_grad()
        # Forward pass and loss.
        logits = model(images)
        loss = criterion(logits, labels)
        # Backward pass and parameter update.
        loss.backward()
        optimizer.step()
        # Record and report the loss every 300 batches.
        if step % 300 == 0:
            current_loss = loss.item()
            loss_list.append(current_loss)
            print("loss------------", current_loss)

# Plot the recorded losses, spread evenly over an x range of 0..1000.
x_positions = np.linspace(0, 1000, len(loss_list))
plt.plot(x_positions, loss_list)
plt.show()
# Measure classification accuracy on the test set.
rets = []  # not read anywhere in the visible code; kept as in the original
correct = 0
total = 0
# Evaluation needs no gradients.
with torch.no_grad():
    for X, y in test_loader:
        y_pred = model(X)
        # torch.max over dim=1 returns (max values, their indices);
        # the indices are the predicted class labels.
        predicted = torch.max(y_pred.data, dim=1)[1]

        correct += (predicted == y).sum().item()
        total += y.size(0)

accuracy_percent = 100.0 * (correct / total)
print('accuracy on test set: %.2f %% ' % accuracy_percent)

在这里插入图片描述

显示前八十个预测的结果

# Show the first 80 test digits in an 8x10 grid. Each title is the predicted
# label; it is drawn in red when the prediction differs from the target.
plt.figure(figsize=(20, 20))
# Inference only: no autograd graph is needed.
with torch.no_grad():
    for i in range(80):
        plt.subplot(8, 10, i + 1)
        # Pass empty sequences so the ticks are actually hidden; calling
        # xticks()/yticks() without arguments only queries the current ticks.
        plt.xticks(())
        plt.yticks(())
        plt.grid(False)
        # Display the raw pixels stored in the dataset.
        plt.imshow(test_dataset.data[i], cmap=plt.cm.binary_r)

        # Index the dataset itself so the sample goes through the dataset's
        # transform (ToTensor + Normalize), i.e. the same preprocessing the
        # model was trained on. Feeding the raw 0-255 pixels from
        # test_dataset.data would hand the model out-of-distribution input.
        X, target = test_dataset[i]
        y_pred = model(X.unsqueeze(0))  # add the batch dimension
        predicted = y_pred.argmax(dim=1).item()

        if int(target) == predicted:
            plt.title(str(predicted))
        else:
            plt.title(str(predicted), color='red')

plt.show()

预测错误的样本,其标题会显示为红色;这里前 80 个样本全部预测正确,毕竟测试集上的正确率达到了 99.10%。

在这里插入图片描述
然后简单测试一下模型的泛化能力:
我自己手写了 0 到 9 这十个数字,看它能不能识别。
这里我截取的每张图片大小都是 28*28。
以后有空会实现对图片的自动切割划分,
目前只对图片做了灰度处理和二值化。

在这里插入图片描述

import cv2
import numpy as np
import matplotlib.pyplot as plt

# Preview the ten hand-written digit images (0.png .. 9.png) in a single row.
plt.figure(figsize=(20, 2))
for digit in range(10):
    image_path = f"c:/Users/Administrator/Desktop/image/{digit}.png"
    img = cv2.imread(image_path)

    # One tick-free, grid-free cell per digit.
    plt.subplot(1, 10, digit + 1)
    plt.xticks(())
    plt.yticks(())
    plt.grid(False)
    plt.imshow(img)
    
# Classify the ten hand-written digit images (0.png .. 9.png). Each title is
# the predicted label: cyan when it equals the digit in the file name, red
# otherwise.
plt.figure(figsize=(20, 2))
for i in range(10):
    plt.subplot(1, 10, i + 1)
    plt.xticks(())
    plt.yticks(())
    plt.grid(False)
    path = "c:/Users/Administrator/Desktop/image/" + str(i) + ".png"
    img = cv2.imread(path)
    # cv2.imread returns None instead of raising when the file cannot be read.
    if img is None:
        raise FileNotFoundError("cannot read image: " + path)

    # Convert to grayscale.
    img = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
    # Inverse binarization: pixels above 155 become 0, all others become 255.
    ret, img = cv2.threshold(img, 155, 255, cv2.THRESH_BINARY_INV)
    # The network's linear layer only fits 28x28 inputs.
    if img.shape != (28, 28):
        raise ValueError(
            "expected a 28x28 image, got %dx%d: %s"
            % (img.shape[0], img.shape[1], path)
        )

    # Apply the training-time preprocessing (ToTensor + Normalize) instead of
    # feeding raw 0-255 values, which the model never saw during training.
    X = transform(img).unsqueeze(0)  # (1, 28, 28) -> (1, 1, 28, 28)
    # Inference only: no autograd graph is needed.
    with torch.no_grad():
        y_pred = model(X)
    predicted = y_pred.argmax(dim=1).item()

    if i == predicted:
        plt.title(str(predicted), color='c')
    else:
        plt.title(str(predicted), color='r')
    plt.imshow(img)
plt.show()

效果还行,只有 0 和 9 被认错了。

在这里插入图片描述

  • 6
    点赞
  • 32
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
以下是CNN图像分类的PyTorch代码示例:

导入必要的库:

```python
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms
```

定义超参数:

```python
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
num_epochs = 5
batch_size = 4
learning_rate = 0.001

transform = transforms.Compose(
    [transforms.ToTensor(),
     transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))])

train_dataset = torchvision.datasets.CIFAR10(root='./data', train=True, download=True, transform=transform)
train_loader = torch.utils.data.DataLoader(train_dataset, batch_size=batch_size, shuffle=True, num_workers=2)
test_dataset = torchvision.datasets.CIFAR10(root='./data', train=False, download=True, transform=transform)
test_loader = torch.utils.data.DataLoader(test_dataset, batch_size=batch_size, shuffle=False, num_workers=2)

classes = ('plane', 'car', 'bird', 'cat', 'deer', 'dog', 'frog', 'horse', 'ship', 'truck')
```

定义卷积神经网络:

```python
class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.conv1 = nn.Conv2d(3, 6, 5)
        self.pool = nn.MaxPool2d(2, 2)
        self.conv2 = nn.Conv2d(6, 16, 5)
        self.fc1 = nn.Linear(16 * 5 * 5, 120)
        self.fc2 = nn.Linear(120, 84)
        self.fc3 = nn.Linear(84, 10)

    def forward(self, x):
        x = self.pool(torch.relu(self.conv1(x)))
        x = self.pool(torch.relu(self.conv2(x)))
        x = x.view(-1, 16 * 5 * 5)
        x = torch.relu(self.fc1(x))
        x = torch.relu(self.fc2(x))
        x = self.fc3(x)
        return x

net = Net().to(device)
```

定义损失函数和优化器:

```python
criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(net.parameters(), lr=learning_rate, momentum=0.9)
```

训练网络:

```python
for epoch in range(num_epochs):
    running_loss = 0.0
    for i, data in enumerate(train_loader, 0):
        inputs, labels = data[0].to(device), data[1].to(device)
        optimizer.zero_grad()
        outputs = net(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()
        running_loss += loss.item()
        if i % 2000 == 1999:
            print('[%d, %5d] loss: %.3f' % (epoch + 1, i + 1, running_loss / 2000))
            running_loss = 0.0

print('Finished Training')
```

测试网络:

```python
correct = 0
total = 0
with torch.no_grad():
    for data in test_loader:
        images, labels = data[0].to(device), data[1].to(device)
        outputs = net(images)
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

print('Accuracy of the network on the 10000 test images: %d %%' % (100 * correct / total))
```

输出每个类别的准确率:

```python
class_correct = list(0. for i in range(10))
class_total = list(0. for i in range(10))
with torch.no_grad():
    for data in test_loader:
        images, labels = data[0].to(device), data[1].to(device)
        outputs = net(images)
        _, predicted = torch.max(outputs, 1)
        c = (predicted == labels).squeeze()
        for i in range(4):
            label = labels[i]
            class_correct[label] += c[i].item()
            class_total[label] += 1

for i in range(10):
    print('Accuracy of %5s : %2d %%' % (classes[i], 100 * class_correct[i] / class_total[i]))
```

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值