TensorFlow 实战Google深度学习框架（第2版）第6章之LeNet-5模型实现MNIST数字识别

最新推荐文章于 2024-07-25 23:06:58 发布

大笨牛@

最新推荐文章于 2024-07-25 23:06:58 发布

阅读量250

点赞数

文章标签：深度学习 tensorflow 神经网络

本文链接：https://blog.csdn.net/Graduate2015/article/details/111234705

版权

本篇记录并汇总了楼主在学习《TensorFlow 实战Google深度学习框架（第2版）》第6章、利用LeNet-5模型实现MNIST数字识别的过程中遇到的一些问题。

mnist_train_cnn.py程序的输入数据格式应做调整。主要有两处：

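这里，在使用tf.placeholder时要指明张量第一维的长度，即shape里第一位不能像之前一样为None，否则会报错“Failed to convert object of type <class 'list'> to Tensor. Contents: [None, 3136]. Consider casting elements to a supported type.”。原因是inference函数把pool2.get_shape().as_list()得到的第一维（即batch大小）直接放进了tf.reshape的目标形状[pool_shape[0], nodes]中；当第一维为None时，列表[None, 3136]无法被转换成张量。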

    # Input placeholders with a fixed leading (batch) dimension of BATCH_SIZE
    # instead of None; x holds the images and y_ holds the labels.
    x = tf.placeholder(tf.float32, 
                       [BATCH_SIZE, 
                        mnist_inference_cnn.IMAGE_SIZE, 
                        mnist_inference_cnn.IMAGE_SIZE, 
                        mnist_inference_cnn.NUM_CHANNELS],
                      name = "x-input")
    y_ = tf.placeholder(tf.float32, 
                        [BATCH_SIZE, 
                         mnist_inference_cnn.NUM_LABELS],name = "y-input")

这里，不能使用tf.reshape来调整数据格式，而应该使用np.reshape，即numpy里面的reshape函数，否则会报错“TypeError: The value of a feed cannot be a tf.Tensor object. Acceptable feed values include Python scalars, strings, lists, numpy ndarrays, or TensorHandles. For reference, the tensor object was Tensor…”。这里的错误信息解释得很清楚：feed_dict中的值不能是tf.Tensor。所以，我们需要用np.reshape，这样得到的结果是numpy数组而不是tensor。

# Reshape the batch with NumPy (not tf.reshape) so the value passed through
# feed_dict is a numpy array rather than a tf.Tensor.
reshaped_xs = np.reshape(xs,
                         [BATCH_SIZE, 
                         mnist_inference_cnn.IMAGE_SIZE, 
                         mnist_inference_cnn.IMAGE_SIZE, 
                         mnist_inference_cnn.NUM_CHANNELS])

下面给出了完整的代码，依次为前向传播程序mnist_inference_cnn.py和训练程序mnist_train_cnn.py：

# _*_ coding:utf-8 _*_

import tensorflow as tf

# Input image side length, number of input channels, and number of classes.
IMAGE_SIZE = 28
NUM_CHANNELS = 1
NUM_LABELS = 10

# Kernel size and depth (number of filters) of the first convolutional layer
CONV1_SIZE = 5
CONV1_DEEP = 32

# Kernel size and depth (number of filters) of the second convolutional layer
CONV2_SIZE = 5
CONV2_DEEP = 64

# Number of nodes in the first fully connected layer
FC_SIZE = 512

def inference(input_tensor, train, regularizer):
    """Build the forward pass of the LeNet-5 style network and return the logits.

    The network is conv -> max-pool -> conv -> max-pool -> fully connected ->
    fully connected. No softmax is applied to the result.

    Args:
        input_tensor: 4-D float tensor passed to ``tf.nn.conv2d``. The layer
            comments below assume the layout
            [batch, IMAGE_SIZE, IMAGE_SIZE, NUM_CHANNELS]. The batch dimension
            may be statically unknown (``None``); the spatial and channel
            dimensions must be statically known.
        train: Truthy to apply dropout (keep probability 0.5) to the output of
            the first fully connected layer.
        regularizer: Callable applied to each fully connected weight matrix;
            its result is added to the "losses" collection. Pass ``None`` to
            skip regularization.

    Returns:
        A 2-D tensor of shape [batch, NUM_LABELS] holding the unscaled logits.
    """
    # Layer 1: convolution. 5x5 kernel, depth 32, stride 1, zero ("SAME") padding.
    # Input:  batch x 28 x 28 x 1
    # Output: batch x 28 x 28 x 32
    with tf.variable_scope("layer1-conv1"):
        conv1_weight = tf.get_variable(
            "weight",
            [CONV1_SIZE, CONV1_SIZE, NUM_CHANNELS, CONV1_DEEP],
            initializer=tf.truncated_normal_initializer(stddev=0.1))
        conv1_bias = tf.get_variable(
            "bias", [CONV1_DEEP], initializer=tf.constant_initializer(0.0))
        conv1 = tf.nn.conv2d(
            input_tensor, conv1_weight, strides=[1, 1, 1, 1], padding="SAME")
        relu1 = tf.nn.relu(tf.nn.bias_add(conv1, conv1_bias))

    # Layer 2: max pooling. 2x2 window, stride 2.
    # Input:  batch x 28 x 28 x 32
    # Output: batch x 14 x 14 x 32
    with tf.variable_scope("layer2-pool1"):
        pool1 = tf.nn.max_pool(
            relu1, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding="SAME")

    # Layer 3: convolution. 5x5 kernel, depth 64, stride 1, zero ("SAME") padding.
    # Input:  batch x 14 x 14 x 32
    # Output: batch x 14 x 14 x 64
    with tf.variable_scope("layer3-conv2"):
        conv2_weight = tf.get_variable(
            "weight",
            [CONV2_SIZE, CONV2_SIZE, CONV1_DEEP, CONV2_DEEP],
            initializer=tf.truncated_normal_initializer(stddev=0.1))
        conv2_bias = tf.get_variable(
            "bias", [CONV2_DEEP], initializer=tf.constant_initializer(0.0))
        conv2 = tf.nn.conv2d(
            pool1, conv2_weight, strides=[1, 1, 1, 1], padding="SAME")
        relu2 = tf.nn.relu(tf.nn.bias_add(conv2, conv2_bias))

    # Layer 4: max pooling. 2x2 window, stride 2.
    # Input:  batch x 14 x 14 x 64
    # Output: batch x 7 x 7 x 64
    with tf.variable_scope("layer4-pool2"):
        pool2 = tf.nn.max_pool(
            relu2, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding="SAME")

    # Flatten batch x 7 x 7 x 64 into batch x 3136. The batch dimension is
    # written as -1 so that it is inferred at run time; using the static value
    # pool_shape[0] fails when the input's batch dimension is None.
    pool_shape = pool2.get_shape().as_list()
    nodes = pool_shape[1] * pool_shape[2] * pool_shape[3]
    reshaped = tf.reshape(pool2, [-1, nodes])

    # Layer 5: fully connected with ReLU.
    # Input:  batch x 3136
    # Output: batch x 512
    with tf.variable_scope("layer5-cf1"):
        fc1_weight = tf.get_variable(
            "weight", [nodes, FC_SIZE],
            initializer=tf.truncated_normal_initializer(stddev=0.1))
        fc1_bias = tf.get_variable(
            "bias", [FC_SIZE], initializer=tf.constant_initializer(0.1))
        fc1 = tf.nn.relu(tf.matmul(reshaped, fc1_weight) + fc1_bias)
        # Only the fully connected weights are regularized.
        if regularizer is not None:
            tf.add_to_collection("losses", regularizer(fc1_weight))
        # Dropout is applied only when the caller asks for training behaviour.
        if train:
            fc1 = tf.nn.dropout(fc1, 0.5)

    # Layer 6: fully connected, produces the logits.
    # Input:  batch x 512
    # Output: batch x 10
    with tf.variable_scope("layer6-cf2"):
        fc2_weight = tf.get_variable(
            "weight", [FC_SIZE, NUM_LABELS],
            initializer=tf.truncated_normal_initializer(stddev=0.1))
        fc2_bias = tf.get_variable(
            "bias", [NUM_LABELS], initializer=tf.constant_initializer(0.1))
        fc2 = tf.matmul(fc1, fc2_weight) + fc2_bias
        if regularizer is not None:
            tf.add_to_collection("losses", regularizer(fc2_weight))

    return fc2

# _*_ coding: utf-8 _*_

import os
import tensorflow as tf
import numpy as np
from tensorflow.examples.tutorials.mnist import input_data

import mnist_inference_cnn

# Number of examples per training step.
BATCH_SIZE = 100
# Base learning rate for the exponentially decayed schedule. The previous
# value of 0.8 is too large for plain gradient descent on this convolutional
# network and typically prevents the loss from decreasing.
# NOTE(review): 0.01 is a conventional starting point; retune if needed.
LEARNING_RATE_BASE = 0.01
# Decay factor applied to the learning rate once per decay period.
LEARNING_RATE_DECAY = 0.99
# Coefficient of the L2 regularization term.
REGULARIZATION_RATE = 0.001
# Decay of the exponential moving average over the trainable variables.
MOVING_AVERAGE_DECAY = 0.99
# Total number of training steps.
TRAINING_STEPS = 30000

# Directory and file name used for saved checkpoints
MODEL_SAVE_PATH = "/path" # replace with your own path
MODEL_NAME = "model.ckpt"

def train(mnist):
    """Train the CNN on MNIST and periodically save checkpoints.

    Builds the graph (placeholders, forward pass with dropout, loss with L2
    regularization, moving averages, exponentially decayed gradient descent),
    then runs TRAINING_STEPS steps. Every 1000 steps the loss on the current
    batch is printed and a checkpoint is written under MODEL_SAVE_PATH.

    Args:
        mnist: Dataset object exposing ``train.num_examples`` and
            ``train.next_batch(batch_size)``, with one-hot labels (the labels
            are converted to class indices with ``tf.argmax``).
    """
    # Both placeholders use a fixed batch size as their first dimension.
    x = tf.placeholder(tf.float32,
                       [BATCH_SIZE,
                        mnist_inference_cnn.IMAGE_SIZE,
                        mnist_inference_cnn.IMAGE_SIZE,
                        mnist_inference_cnn.NUM_CHANNELS],
                       name="x-input")
    y_ = tf.placeholder(tf.float32,
                        [BATCH_SIZE, mnist_inference_cnn.NUM_LABELS],
                        name="y-input")

    regularizer = tf.contrib.layers.l2_regularizer(REGULARIZATION_RATE)

    # Forward pass with dropout enabled.
    y = mnist_inference_cnn.inference(x, True, regularizer)

    global_step = tf.Variable(0, trainable=False)

    # Cross entropy on class indices, plus the regularization terms that
    # inference() stored in the "losses" collection.
    cross_entropy = tf.nn.sparse_softmax_cross_entropy_with_logits(
        logits=y, labels=tf.argmax(y_, 1))
    cross_entropy_mean = tf.reduce_mean(cross_entropy)
    loss = cross_entropy_mean + tf.add_n(tf.get_collection("losses"))

    # Exponential moving averages of all trainable variables.
    variables_average_op = tf.train.ExponentialMovingAverage(
        MOVING_AVERAGE_DECAY, global_step).apply(tf.trainable_variables())

    # Gradient descent with a learning rate that decays once per pass over
    # the training set (num_examples / BATCH_SIZE steps).
    learning_rate = tf.train.exponential_decay(
        LEARNING_RATE_BASE,
        global_step,
        mnist.train.num_examples / BATCH_SIZE,
        LEARNING_RATE_DECAY,
        staircase=True)
    train_step = tf.train.GradientDescentOptimizer(learning_rate).minimize(
        loss, global_step=global_step)
    # One op that performs the parameter update and the moving-average update.
    train_op = tf.group(train_step, variables_average_op)

    # saver.save() fails if the checkpoint's parent directory is missing, so
    # make sure it exists before any training time is spent.
    os.makedirs(MODEL_SAVE_PATH, exist_ok=True)
    checkpoint_path = os.path.join(MODEL_SAVE_PATH, MODEL_NAME)

    saver = tf.train.Saver()
    with tf.Session() as sess:

        init_op = tf.global_variables_initializer()
        sess.run(init_op)

        for i in range(TRAINING_STEPS):
            xs, ys = mnist.train.next_batch(BATCH_SIZE)
            # feed_dict values must be numpy arrays, not tensors, hence
            # np.reshape rather than tf.reshape.
            reshaped_xs = np.reshape(xs,
                                     [BATCH_SIZE,
                                      mnist_inference_cnn.IMAGE_SIZE,
                                      mnist_inference_cnn.IMAGE_SIZE,
                                      mnist_inference_cnn.NUM_CHANNELS])

            _, loss_value, step = sess.run(
                [train_op, loss, global_step],
                feed_dict={x: reshaped_xs, y_: ys})

            # Report progress and save a checkpoint every 1000 steps.
            if i % 1000 == 0:
                print("%d 轮训练后，训练batch上的损失为%g" % (step, loss_value))
                saver.save(sess, checkpoint_path, global_step=global_step)
    

def main(argv=None):
    """Load the MNIST data with one-hot labels and run training.

    Args:
        argv: Accepted for the tf.app.run() calling convention; not used.
    """
    data_dir = "/path"  # replace with your own path
    train(input_data.read_data_sets(data_dir, one_hot=True))
    
# Script entry point: tf.app.run() is called without arguments, so it
# dispatches to this module's main().
if __name__ == "__main__":
    tf.app.run()

大笨牛@

关注

0
点赞
踩
1

收藏

觉得还不错? 一键收藏
0
评论
TensorFlow 实战Google深度学习框架（第2版）第6章之LeNet-5模型实现MNIST数字识别

本篇为记录楼主在学习《TensorFlow 实战Google深度学习框架（第2版）》第6章利用LeNet-5模型实现MNIST数字识别过程中遇到的一些问题的记录、汇总。mnist_train_cnn.py程序的输入数据格式应做调整。主要有两处：这里，在使用tf.placeholder时要指明张量第一维的长度，即shape里第一位不能像之前一样为None，否则会报错“Failed to convert object of type <class ‘list’> to Tensor. Co
复制链接

扫一扫