tensorflow +mnist

最新推荐文章于 2020-11-28 11:54:38 发布

Jemila

最新推荐文章于 2020-11-28 11:54:38 发布

阅读量1k

点赞数

本文链接：https://blog.csdn.net/Jemila/article/details/64664185

版权

python 同时被 3 个专栏收录

20 篇文章 1 订阅

订阅专栏

Machine Learning

18 篇文章 0 订阅

订阅专栏

Deep Learning

4 篇文章 0 订阅

订阅专栏

根据youtube上sendex大神视频所敲写的代码：

# -*- coding: utf-8 -*-
"""
Spyder Editor

This is a temporary script file.
"""

import tensorflow as tf
from tensorflow.examples.tutorials.mnist import input_data

mnist=input_data.read_data_sets("/tmp/data",one_hot=True)

n_nodes_hl1=500
n_nodes_hl2=500
n_nodes_hl3=500

n_classes=10
batch_size=100

x=tf.placeholder('float',[None,784])#flat out the data
y=tf.placeholder('float')

def neural_network_model(data):
    hidden_1_layer={'weights':tf.Variable(tf.random_normal([784,n_nodes_hl1])),
                    'biases':tf.Variable(tf.random_normal([n_nodes_hl1]))}
    hidden_2_layer={'weights':tf.Variable(tf.random_normal([n_nodes_hl1,n_nodes_hl2])),
                    'biases':tf.Variable(tf.random_normal([n_nodes_hl2]))}
    hidden_3_layer={'weights':tf.Variable(tf.random_normal([n_nodes_hl2,n_nodes_hl3])),
                    'biases':tf.Variable(tf.random_normal([n_nodes_hl3]))}
    output_layer={'weights':tf.Variable(tf.random_normal([n_nodes_hl3,n_classes])),
                    'biases':tf.Variable(tf.random_normal([n_classes]))}
                    
    l1=tf.add(tf.matmul(data,hidden_1_layer['weights']),hidden_1_layer['biases'])
    l1=tf.nn.relu(l1)
    
    l2=tf.add(tf.matmul(l1,hidden_2_layer['weights']),hidden_2_layer['biases'])
    l2=tf.nn.relu(l2)
    
    l3=tf.add(tf.matmul(l2,hidden_3_layer['weights']),hidden_3_layer['biases'])
    l3=tf.nn.relu(l3)
    
    output=tf.matmul(l3,output_layer['weights'])+output_layer['biases']
    
    return output
    

def train_neural_network(x):
    prediction = neural_network_model(x)
    cost=tf.reduce_mean( tf.nn.softmax_cross_entropy_with_logits(logits=prediction,labels=y) )
    optimizer=tf.train.AdamOptimizer().minimize(cost)#也可以选择梯度下降法
    
    hm_epochs=10
    #所有样本处理一遍算一个epoch
    
    with tf.Session() as sess:
        sess.run(tf.initialize_all_variables())
        
        for epoch in range(hm_epochs):
            epoch_loss=0
            for _ in range(int(mnist.train.num_examples/batch_size)):
                epoch_x,epoch_y=mnist.train.next_batch(batch_size)
                _,c=sess.run([optimizer,cost],feed_dict={x:epoch_x,y:epoch_y})
                epoch_loss+=c
            print ('Epoch',epoch,'completed out of',hm_epochs,'loss',epoch_loss)
        correct=tf.equal(tf.argmax(prediction,1),tf.argmax(y,1))
        accuracy=tf.reduce_mean(tf.cast(correct,'float'))
        print ('Accuracy:',accuracy.eval({x:mnist.test.images,y:mnist.test.labels}))


train_neural_network(x)

运行结果：

Epoch 0 completed out of 10 loss 1804656.12052
Epoch 1 completed out of 10 loss 401965.048153
Epoch 2 completed out of 10 loss 217808.414017
Epoch 3 completed out of 10 loss 130326.765904
Epoch 4 completed out of 10 loss 75227.516495
Epoch 5 completed out of 10 loss 46899.7264338
Epoch 6 completed out of 10 loss 32204.3892914
Epoch 7 completed out of 10 loss 23254.3602934
Epoch 8 completed out of 10 loss 18647.4183468
Epoch 9 completed out of 10 loss 17600.1437412
Accuracy: 0.9511

另外，使用KNN准确率为0.9664,。

文中某些参数参考：

http://blog.sina.com.cn/s/blog_155d29f010102wqj6.html

http://blog.csdn.net/mao_xiao_feng/article/details/53382790

http://blog.csdn.net/freedom098/article/details/51911473

mnist数据可视化的代码参考：

https://github.com/saradhix/mnist_visual

再来一个卷积神经训练的代码：

from tensorflow.examples.tutorials.mnist import input_data
mnist = input_data.read_data_sets('MNIST_data', one_hot=True)

import tensorflow as tf
import pandas as pd
from PIL import Image 
import numpy as np

sess = tf.InteractiveSession()

X = tf.placeholder(tf.float32, [None, 28*28])#用于CNN样本定义 160*60
Y = tf.placeholder(tf.float32, [None, 10])#用于CNN训练类别 5*63
keep_prob = tf.placeholder(tf.float32) # dropout 用于CNN类别输出防止过拟合时的过滤器

# 定义CNN
def crack_captcha_cnn(w_alpha=0.01, b_alpha=0.1):
	x = tf.reshape(X, shape=[-1, 28, 28, 1])#四维矩阵

	w_c1 = tf.Variable(w_alpha*tf.random_normal([3, 3, 1, 32]))#每次输入三张图，3*1,32个通道单元
	b_c1 = tf.Variable(b_alpha*tf.random_normal([32]))
	conv1 = tf.nn.relu(tf.nn.bias_add(tf.nn.conv2d(x, w_c1, strides=[1, 1, 1, 1], padding='SAME'), b_c1))#same允许有边缘，因为只有两维，通常strides取[1，stride，stride，1],步长为1,
	conv1 = tf.nn.max_pool(conv1, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')#max pooling是CNN当中的最大值池化操作，其实用法和卷积很类似,两个1是atch和channel，2*2是池化窗口的大小
	conv1 = tf.nn.dropout(conv1, keep_prob)

	w_c2 = tf.Variable(w_alpha*tf.random_normal([3, 3, 32, 64]))
	b_c2 = tf.Variable(b_alpha*tf.random_normal([64]))
	conv2 = tf.nn.relu(tf.nn.bias_add(tf.nn.conv2d(conv1, w_c2, strides=[1, 1, 1, 1], padding='SAME'), b_c2))
	conv2 = tf.nn.max_pool(conv2, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')
	conv2 = tf.nn.dropout(conv2, keep_prob)

	w_d = tf.Variable(w_alpha*tf.random_normal([7*7*64, 1024]))
	b_d = tf.Variable(b_alpha*tf.random_normal([1024]))
	dense = tf.reshape(conv2, [-1, w_d.get_shape().as_list()[0]])
	dense = tf.nn.relu(tf.add(tf.matmul(dense, w_d), b_d))
	dense = tf.nn.dropout(dense, keep_prob)

	w_out = tf.Variable(w_alpha*tf.random_normal([1024, 10]))
	b_out = tf.Variable(b_alpha*tf.random_normal([10]))
	out = tf.add(tf.matmul(dense, w_out), b_out)
	out = tf.nn.softmax(out)
	return out

# 训练
output = crack_captcha_cnn()
loss = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(output, Y))
train_step = tf.train.AdamOptimizer(learning_rate=0.001).minimize(loss)
predict = tf.reshape(output, [-1, 1, 10])
max_idx_p = tf.argmax(predict, 2)
max_idx_l = tf.argmax(tf.reshape(Y, [-1, 1, 10]), 2)
correct_pred = tf.equal(max_idx_p, max_idx_l)
accuracy = tf.reduce_mean(tf.cast(correct_pred, tf.float32))

sess.run(tf.initialize_all_variables())
for i in range(10000):
    batch = mnist.train.next_batch(50)
    if i%100 == 0:
        #验证的时候dropout=1.0，训练时=0.5
        train_accuracy = accuracy.eval(feed_dict={X:batch[0], Y: batch[1], keep_prob: 1.0})
        print ("step %d, training accuracy %g"%(i, train_accuracy))
    train_step.run(feed_dict={X: batch[0], Y: batch[1], keep_prob: 0.5})
print ("test accuracy %g"%accuracy.eval(feed_dict={
X: mnist.test.images, Y: mnist.test.labels, keep_prob: 1.0}))

batch=mnist.test.next_batch(50)
predict = tf.argmax(tf.reshape(output, [-1, 1, 10]), 2)
text_list = sess.run(predict, feed_dict={X:batch[0], keep_prob: 1})
print("正确: {}  预测: {}".format(text_list, batch[1]))