基于TensorFlow实现卷积神经网络完成手写数字识别

最新推荐文章于 2022-12-18 15:07:17 发布

-HuangYuliang-

最新推荐文章于 2022-12-18 15:07:17 发布

阅读量695

点赞数 1

分类专栏：基础算法文章标签： TensorFlow 手写数字识别卷积神经网络

本文链接：https://blog.csdn.net/Huangyuliang1992/article/details/80291768

版权

基础算法专栏收录该内容

4 篇文章 0 订阅

订阅专栏

手写数字识别是学习卷积神经网络的经典算例，本文用TensorFlow搭建了一个卷积神经网络。结构如下：

输入：28*28的一张图片A；

第一个卷积：32个5*5的卷积核，对图片A进行卷积，并经过relu激活函数，得到32张28*28的图片B；

第一个池化层：2*2的窗口，步长为2，得到32张14*14的图片C；

第二个卷积：64个5*5的卷积核，对32张14*14的图片进行卷积，并经过relu激活函数，得到64张14*14的图片D；

第二个池化层：2*2的窗口，步长为2，得到64张7*7的图片E；

第一个全连接层：1024个神经元，输入层是7*7*64个神经元，即7*7*64--1024，采用relu激活函数

第二个全连接层：10个神经元，即1024--10，采用softmax激活函数

import tensorflow as tf
from tensorflow.examples.tutorials.mnist import input_data
# 载入数据集
mnist = input_data.read_data_sets(r'D:\Workspase\kaggle\z_data_sets',one_hot=True)
# 每个批次的大小
batch_size = 100
n_batch = mnist.train.num_examples // batch_size

# 初始化权值
def weight_variable(shape):
    initial = tf.truncated_normal(shape,stddev=0.1)
    return tf.Variable(initial)
# 初始化偏置
def bias_variable(shape):
    initial = tf.constant(0.1,shape=shape)
    return tf.Variable(initial)
# 卷积层
def conv2d(x,W):
    # x = [batch,in_height,in_width,in_channels][批次，长，宽，通道数]
    # W = 卷积核 [filter_height,filter_width,in_channels,out_channels]
    # strides[0]=strides[1],strides[1]代表x方向的步长，strides[2]代表y方向的步长
    # padding : A string from :'SAME','VALID'
    return tf.nn.conv2d(x,W,strides=[1,1,1,1],padding='SAME')
# 池化层
def max_pool_2x2(x):
    # ksize [1,x,y,1],x,y 代表窗口的大小
    return tf.nn.max_pool(x,ksize=[1,2,2,1],strides=[1,2,2,1],padding='SAME')

x = tf.placeholder(tf.float32,[None,784]) #28*28
y = tf.placeholder(tf.float32,[None,10])
# 改变 x 的格式，转为4D的向量[batch,in_height,in_width,in_channels]
x_image = tf.reshape(x,[-1,28,28,1]) # -1代表批次的大小
# 初始化第一个卷积层的权重和偏置
W_conv1 = weight_variable([5,5,1,32]) # 5*5的采样窗口，1：通道数，32个卷积核从1个平面抽取特征得到32个平面
b_conv1 = bias_variable([32])
# 把x_image和权值向量进行卷积，再加上偏置值，然后应用于relu激活函数
h_conv1 = tf.nn.relu(conv2d(x_image,W_conv1)+b_conv1)
h_pool1 = max_pool_2x2(h_conv1)  # 进行max_pooling
# 初始化第二个卷积层的权值和偏置
W_conv2 = weight_variable([5,5,32,64]) # 5*5的采样窗口，1：通道数，64个卷积核从32个平面抽取特征得到64个平面
b_conv2 = bias_variable([64])
# 把x_image和权值向量进行卷积，再加上偏置值，然后应用于relu激活函数
h_conv2 = tf.nn.relu(conv2d(h_pool1,W_conv2)+b_conv2)
h_pool2 = max_pool_2x2(h_conv2)  # 进行max_pooling

# 28*28的图片第一次卷积后还是28*28，第一次池化后14*14
# 第二次卷积后14*14，第二次池化后7*7
# 经过上面操作后得到64张7*7的平面
# 初始化第一个全连接层的权值
W_fc1 = weight_variable([7*7*64,1024]) #上一层有7*7*64个神经元，全连接层有1024个神经元
b_fc1 = bias_variable([1024]) # 1024个节点
# 把池化层2的输出扁平化为1维
h_pool2_flat = tf.reshape(h_pool2,[-1,7*7*64]) # -1表示任意值，这里是100
# 求第一个全连接层的输出
h_fc1 = tf.nn.relu(tf.matmul(h_pool2_flat,W_fc1)+b_fc1)
# keep_prob用来表示激活神经元的比例
keep_prob = tf.placeholder(tf.float32)
h_fc1_drop = tf.nn.dropout(h_fc1,keep_prob)
# 初始化第二个全连接层
W_fc2 = weight_variable([1024,10]) #上一层有7*7*64个神经元，全连接层有1024个神经元
b_fc2 = bias_variable([10]) # 1024个节点
# 计算输出
prediction = tf.nn.softmax(tf.matmul(h_fc1_drop,W_fc2)+b_fc2)
# 交叉熵代价函数
cross_entropy = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(labels=y,logits=prediction))
# 使用AdamOptimizer进行优化
train_step = tf.train.AdamOptimizer(1e-4).minimize(cross_entropy)
# 结果存放在一个布尔列表中
correct_prediction = tf.equal(tf.argmax(prediction,1),tf.argmax(y,1))
# 求准确率
accuracy = tf.reduce_mean(tf.cast(correct_prediction,tf.float32))
with tf.Session() as sess:
    sess.run(tf.global_variables_initializer())
    for epoch in range(21):
        print(str(epoch))
        for batch in range(n_batch):
            
            batch_xs,batch_ys = mnist.train.next_batch(batch_size)      
            sess.run(train_step,feed_dict={x:batch_xs,y:batch_ys,keep_prob:0.7})
        
        for i in range(2):
            testSet = mnist.test.next_batch(1000)          
            print("test accuracy %g"%accuracy.eval(feed_dict={ x: testSet[0], y: testSet[1], keep_prob: 1.0}))

结果：

0
test accuracy 0.859
test accuracy 0.872
1
test accuracy 0.979
test accuracy 0.967
2
test accuracy 0.98
test accuracy 0.976
3
test accuracy 0.985
test accuracy 0.986
4
test accuracy 0.982
test accuracy 0.99
5
test accuracy 0.979
test accuracy 0.99
6
test accuracy 0.989
test accuracy 0.988
7
test accuracy 0.981
test accuracy 0.991
8
test accuracy 0.981
test accuracy 0.988
9
test accuracy 0.991
test accuracy 0.989
10
test accuracy 0.989
test accuracy 0.986
11
test accuracy 0.994
test accuracy 0.987
12
test accuracy 0.994
test accuracy 0.992
13
test accuracy 0.99
test accuracy 0.99
14
test accuracy 0.989
test accuracy 0.994
15
test accuracy 0.989
test accuracy 0.99
16
test accuracy 0.986
test accuracy 0.993
17
test accuracy 0.989
test accuracy 0.994
18
test accuracy 0.992
test accuracy 0.991
19
test accuracy 0.989
test accuracy 0.991
20
test accuracy 0.994
test accuracy 0.99