手写数字识别——BP神经网络实现

最新推荐文章于 2022-03-10 16:14:39 发布

花飞雨追

最新推荐文章于 2022-03-10 16:14:39 发布

阅读量217

点赞数 1

分类专栏：机器学习　文章标签：深度学习、机器学习

本文链接：https://blog.csdn.net/qq_36258516/article/details/109196670

版权

机器学习专栏收录该内容

8 篇文章 0 订阅

订阅专栏

手写数字识别——BP神经网络实现

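贴个代码。数据集是 MNIST，可以直接去官网下载；运行前需要把解压后的四个 idx 文件（train-images.idx3-ubyte、train-labels.idx1-ubyte、t10k-images.idx3-ubyte、t10k-labels.idx1-ubyte）放在当前工作目录下。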

#main.py
import os
from load_file import load_mnist
from neuralNetwork import neuralNetwork

if __name__ == '__main__':
    # Both MNIST splits are read from the current working directory.
    data_dir = os.getcwd()
    train_images_data, train_labels = load_mnist(data_dir, kind='train')
    test_images_data, test_labels = load_mnist(data_dir, kind='t10k')

    # 784 input pixels -> 30 hidden units -> 10 output classes.
    layer_sizes = [28 * 28, 30, 10]
    network = neuralNetwork(len(layer_sizes) - 1, layer_sizes, 0.1)

    # Training: 10 passes over the training set, one sample per update.
    for epoch in range(10):
        # The learning rate is halved at epochs 0 and 5.
        if epoch % 5 == 0:
            network.learningrate /= 2
        for sample_idx, image in enumerate(train_images_data):
            print("第" + str(epoch) + "轮" + "-------正在进行训练-------" + str(sample_idx))
            network.update(image, train_labels[sample_idx])

    # Evaluation: count the test samples the network classifies correctly.
    correct = 0
    for sample_idx, image in enumerate(test_images_data):
        print('-------正在进行测试--------')
        if network.test(image, test_labels[sample_idx]):
            correct += 1

    # Accuracy on the test split.
    print(correct / len(test_labels))

#neuralNetwork.py
import numpy as np
from activateFunction import activate_function

class neuralNetwork:
    """Fully connected feed-forward network trained one sample at a time.

    Each layer is a single weight matrix with no bias term; every layer's
    pre-activation is passed through ``activate_function``.

    Attributes set by the constructor:
        numBeuralLayers: number of weight layers (the attribute name is
            kept as-is for compatibility with existing callers).
        numNeurons_perLayer: sequence of layer widths, input layer first.
        learningrate: step size used by ``update``.
        W: list of weight matrices; ``W[k]`` has shape
            ``(numNeurons_perLayer[k + 1], numNeurons_perLayer[k])``.
    """

    def __init__(self, numNeuralLayers, numNeurons_perLayer, learningrate):
        """Store the hyper-parameters and randomly initialise the weights."""
        self.numBeuralLayers = numNeuralLayers
        self.numNeurons_perLayer = numNeurons_perLayer
        self.learningrate = learningrate
        self.W = []

        for layer in range(self.numBeuralLayers):
            fan_out = numNeurons_perLayer[layer + 1]
            fan_in = numNeurons_perLayer[layer]
            # Gaussian initialisation, scaled down by sqrt(fan_in).
            self.W.append(np.random.randn(fan_out, fan_in) / np.sqrt(fan_in))

    def update(self, inputs, targets):
        """Run one training step on a single sample.

        ``inputs`` and ``targets`` are converted to column vectors. The
        per-layer error terms are stored in ``self.loss`` (output layer
        first) and every matrix in ``self.W`` is updated in place.
        """
        n_layers = self.numBeuralLayers
        inputs = np.array(inputs, ndmin=2).T
        targets = np.array(targets, ndmin=2).T

        # Forward pass: activations[k] is the output of layer k, with
        # activations[0] being the input column itself.
        activations = [inputs]
        for layer in range(n_layers):
            pre_activation = np.dot(self.W[layer], activations[-1])
            activations.append(activate_function(pre_activation))

        # Error terms, output layer first. The output error is
        # (target - prediction); each earlier layer receives the error of
        # the layer after it, sent back through that layer's transposed
        # weights. All errors are computed before any weight is modified.
        self.loss = []
        for step in range(n_layers):
            if step:
                error = np.dot(self.W[n_layers - step].T, self.loss[-1])
            else:
                error = targets - activations[-1]
            self.loss.append(error)

        # Weight update, last layer first:
        # W += lr * (error * out * (1 - out)) . previous_output^T
        for step in range(n_layers):
            layer = n_layers - step - 1
            layer_out = activations[layer + 1]
            delta = self.loss[step] * layer_out * (1 - layer_out)
            self.W[layer] += self.learningrate * np.dot(delta, activations[layer].T)

    def test(self, test_inputs, test_targets):
        """Return True when the network classifies one sample correctly.

        The sample is fed forward through every layer; the index of the
        largest output is compared with the index of the first ``1`` in
        ``test_targets``.
        """
        signal = test_inputs.T

        for layer in range(self.numBeuralLayers):
            signal = activate_function(np.dot(self.W[layer], signal))

        scores = list(signal)
        predicted = scores.index(max(scores))
        return predicted == list(test_targets).index(1)

#activateFunction.py
import numpy as np

def activate_function(x):
    """Apply the logistic sigmoid ``1 / (1 + exp(-x))`` to *x*.

    The exponential is computed with ``np.exp``, so *x* may be a scalar
    or a NumPy array; arrays are processed element-wise.
    """
    decay = np.exp(-x)
    return 1.0 / (1.0 + decay)

#load_file.py
import os
import struct
import numpy as np

def load_mnist(path, kind='train'):
    """Load one MNIST split from its raw IDX files.

    Reads ``<kind>-labels.idx1-ubyte`` and ``<kind>-images.idx3-ubyte``
    from the directory *path*.

    Args:
        path: Directory that contains the two IDX files.
        kind: File-name prefix of the split, e.g. ``'train'`` or ``'t10k'``.

    Returns:
        A tuple ``(images, labels)``:
        ``images`` is a float array of shape ``(n_samples, rows * cols)``
        holding the raw pixel bytes divided by 2550, with ``rows`` and
        ``cols`` taken from the image-file header;
        ``labels`` is a float array of shape ``(n_samples, 10)`` with a
        single 1 per row at the index of the sample's class.

    Raises:
        ValueError: If the number of pixel bytes does not equal
            ``n_labels * rows * cols``.
        IndexError: If a label value is 10 or larger.
    """
    labels_path = os.path.join(path, '%s-labels.idx1-ubyte' % kind)
    images_path = os.path.join(path, '%s-images.idx3-ubyte' % kind)

    with open(labels_path, 'rb') as lbpath:
        # 8-byte big-endian header (magic number, item count); the values
        # are not needed because the rest of the file is read in full.
        _magic, _count = struct.unpack('>II', lbpath.read(8))
        class_ids = np.fromfile(lbpath, dtype=np.uint8)

    with open(images_path, 'rb') as imgpath:
        # 16-byte big-endian header: magic, image count, rows, cols.
        _magic, _num, rows, cols = struct.unpack('>IIII', imgpath.read(16))
        pixels = np.fromfile(imgpath, dtype=np.uint8)

    # One flattened image per label; the row width comes from the header
    # rather than being fixed to 28 * 28. The reshape fails loudly if the
    # two files disagree on the number of samples.
    images = pixels.reshape(len(class_ids), rows * cols)

    # Vectorised one-hot encoding: row i gets a 1 in column class_ids[i].
    one_hot = np.zeros((class_ids.size, 10))
    one_hot[np.arange(class_ids.size), class_ids] = 1

    # NOTE(review): the divisor 2550 maps pixel bytes to [0, 0.1]; the usual
    # [0, 1] normalisation would be 255. Kept unchanged because the training
    # hyper-parameters may have been tuned against this scale - confirm.
    return (images / 2550), one_hot