Tensorflow-rnn(mnist分类)

最新推荐文章于 2019-04-06 10:53:09 发布

风吴痕

最新推荐文章于 2019-04-06 10:53:09 发布

阅读量1k

点赞数

本文链接：https://blog.csdn.net/wc781708249/article/details/78009470

版权

python 同时被 2 个专栏收录

95 篇文章 0 订阅

订阅专栏

tensorflow

91 篇文章 1 订阅

订阅专栏

1、多层rnn

#!/usr/bin/python3
# -*- coding:utf-8 -*-
import tensorflow as tf
import numpy as np
# from tensorflow.contrib.layers.python.layers import batch_norm
from tensorflow.contrib import rnn
from tensorflow.examples.tutorials.mnist import input_data
# from tensorflow.python.framework import ops

# ops.reset_default_graph()
"""
cnn
"""
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)

# 定义一些参数
batch_size = 128
droup_out = 0.7
learn_rate = 0.001
num_steps = 100000
disp_step = 2000

n_input = 28
n_steps = 28
n_hidden = 128
n_classes = 10

with tf.Graph().as_default() as graph:
    # mnist图像大小是28x28 分成0~9 共10类
    x=tf.placeholder(tf.float32,[None,n_steps*n_input])
    y_=tf.placeholder(tf.float32,[None,n_classes])
    keep=tf.placeholder(tf.float32)

    x_img=tf.reshape(x,[-1,n_steps,n_input])

    x_img=tf.unstack(x_img,n_steps,1) # 按时间序列，即第二维将[N,n_steps, n_input] 拆分成 n_steps个[N,n_input]序列 ，数据类型 list

    lstm_cell = rnn.BasicLSTMCell(n_hidden, forget_bias=1.0)

    # 加入多层rnn核
    lstm_cell = rnn.MultiRNNCell([lstm_cell] * 1, state_is_tuple=True)
    lstm_cell = rnn.MultiRNNCell([lstm_cell] * 1, state_is_tuple=True)
    lstm_cell = rnn.MultiRNNCell([lstm_cell] * 1, state_is_tuple=True)
    # Get lstm cell output
    outputs, states = rnn.static_rnn(lstm_cell, x_img, dtype=tf.float32)

    with tf.variable_scope('output') as scope:
        w=tf.get_variable('w',[n_hidden,n_classes],tf.float32,initializer=tf.random_uniform_initializer)*0.001
        b=tf.Variable(tf.random_normal([n_classes])+0.001)
    y=tf.nn.softmax(tf.matmul(outputs[-1], w) + b)


    loss=tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(labels=y_,logits=y))

    train_op=tf.train.AdamOptimizer(learn_rate).minimize(loss)

    correct_prediction = tf.equal(tf.argmax(y, 1), tf.argmax(y_, 1))
    # Calculate accuracy
    accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

sess=tf.InteractiveSession(graph=graph)

tf.global_variables_initializer().run()

for step in range(num_steps):
    batch_xs, batch_ys = mnist.train.next_batch(batch_size)
    train_op.run({x:batch_xs,y_:batch_ys,keep:droup_out})
    if step % disp_step==0:
        print("step",step,'acc',accuracy.eval({x:batch_xs,y_:batch_ys,keep:droup_out}),
              'loss',loss.eval({x:batch_xs,y_:batch_ys,keep:droup_out}))

# test acc
print('test acc',accuracy.eval({x:mnist.test.images,y_:mnist.test.labels,keep:1.}))

sess.close()

结果：
这里写图片描述

2、修改序列长度

通过下面两个参数自行修改，序列长度

n_input = 28*2
n_steps = 14

3、结合NN层

#!/usr/bin/python3
# -*- coding:utf-8 -*-
import tensorflow as tf
import numpy as np
# from tensorflow.contrib.layers.python.layers import batch_norm
from tensorflow.contrib import rnn
from tensorflow.examples.tutorials.mnist import input_data
# from tensorflow.python.framework import ops

# ops.reset_default_graph()
"""
cnn
"""
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)

# 定义一些参数
batch_size = 128
droup_out = 0.7
learn_rate = 0.001
num_steps = 100000
disp_step = 2000

n_input = 28
n_steps = 28
n_hidden = 128
n_classes = 10

with tf.Graph().as_default() as graph:
    # mnist图像大小是28x28 分成0~9 共10类
    x=tf.placeholder(tf.float32,[None,n_steps*n_input])
    y_=tf.placeholder(tf.float32,[None,n_classes])
    keep=tf.placeholder(tf.float32)

    # x_img=tf.reshape(x,[-1,n_steps,n_input,1])

    w1=tf.Variable(tf.random_normal([n_steps*n_input,n_steps*14]))
    b1=tf.Variable(tf.random_normal([n_steps*14]))

    x_img=tf.nn.relu(tf.nn.bias_add(tf.matmul(x,w1),b1))

    x_img=tf.reshape(x_img,[-1,n_steps,14])

    x_img=tf.unstack(x_img,n_steps,1) # 按时间序列，即第二维将[N,n_steps, n_input] 拆分成 n_steps个[N,14]序列 ，数据类型 list

    lstm_cell = rnn.BasicLSTMCell(n_hidden, forget_bias=1.0)

    # 加入多层rnn核
    lstm_cell = rnn.MultiRNNCell([lstm_cell] * 1, state_is_tuple=True)
    lstm_cell = rnn.MultiRNNCell([lstm_cell] * 1, state_is_tuple=True)
    lstm_cell = rnn.MultiRNNCell([lstm_cell] * 1, state_is_tuple=True)
    # Get lstm cell output
    outputs, states = rnn.static_rnn(lstm_cell, x_img, dtype=tf.float32)

    with tf.variable_scope('output') as scope:
        w=tf.get_variable('w',[n_hidden,n_classes],tf.float32,initializer=tf.random_uniform_initializer)*0.001
        b=tf.Variable(tf.random_normal([n_classes])+0.001)
    y=tf.nn.softmax(tf.matmul(outputs[-1], w) + b)


    loss=tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(labels=y_,logits=y))

    train_op=tf.train.AdamOptimizer(learn_rate).minimize(loss)

    correct_prediction = tf.equal(tf.argmax(y, 1), tf.argmax(y_, 1))
    # Calculate accuracy
    accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

sess=tf.InteractiveSession(graph=graph)

tf.global_variables_initializer().run()

for step in range(num_steps):
    batch_xs, batch_ys = mnist.train.next_batch(batch_size)
    train_op.run({x:batch_xs,y_:batch_ys,keep:droup_out})
    if step % disp_step==0:
        print("step",step,'acc',accuracy.eval({x:batch_xs,y_:batch_ys,keep:droup_out}),
              'loss',loss.eval({x:batch_xs,y_:batch_ys,keep:droup_out}))

# test acc
print('test acc',accuracy.eval({x:mnist.test.images,y_:mnist.test.labels,keep:1.}))

sess.close()

4、结合CNN

#!/usr/bin/python3
# -*- coding:utf-8 -*-
import tensorflow as tf
import numpy as np
# from tensorflow.contrib.layers.python.layers import batch_norm
from tensorflow.contrib import rnn
from tensorflow.examples.tutorials.mnist import input_data
# from tensorflow.python.framework import ops

# ops.reset_default_graph()
"""
cnn
"""
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)

# 定义一些参数
batch_size = 128
droup_out = 0.7
learn_rate = 0.001
num_steps = 100000
disp_step = 2000

n_input = 28
n_steps = 28
n_hidden = 128
n_classes = 10

with tf.Graph().as_default() as graph:
    # mnist图像大小是28x28 分成0~9 共10类
    x=tf.placeholder(tf.float32,[None,n_steps*n_input])
    y_=tf.placeholder(tf.float32,[None,n_classes])
    keep=tf.placeholder(tf.float32)

    x_img=tf.reshape(x,[-1,n_steps,n_input,1])

    w1=tf.Variable(tf.random_normal([3,3,1,16]))
    b1=tf.Variable(tf.random_normal([16]))

    x_img=tf.nn.conv2d(x_img,w1,[1,1,1,1],padding="SAME")
    x_img=tf.nn.relu(tf.nn.bias_add(x_img,b1))
    x_img=tf.nn.max_pool(x_img,[1,2,2,1],[1,2,2,1],padding="SAME") #[n,14,14,16]

    x_img=tf.reshape(x_img,[-1,n_steps//2,14*16])

    x_img=tf.unstack(x_img,n_steps//2,1) # 按时间序列，即第二维将[N,n_steps, n_input] 拆分成 14[N,14*16]序列 ，数据类型 list

    lstm_cell = rnn.BasicLSTMCell(n_hidden, forget_bias=1.0)

    # 加入多层rnn核
    lstm_cell = rnn.MultiRNNCell([lstm_cell] * 1, state_is_tuple=True)
    lstm_cell = rnn.MultiRNNCell([lstm_cell] * 1, state_is_tuple=True)
    lstm_cell = rnn.MultiRNNCell([lstm_cell] * 1, state_is_tuple=True)
    # Get lstm cell output
    outputs, states = rnn.static_rnn(lstm_cell, x_img, dtype=tf.float32)

    with tf.variable_scope('output') as scope:
        w=tf.get_variable('w',[n_hidden,n_classes],tf.float32,initializer=tf.random_uniform_initializer)*0.001
        b=tf.Variable(tf.random_normal([n_classes])+0.001)
    y=tf.nn.softmax(tf.matmul(outputs[-1], w) + b)


    loss=tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(labels=y_,logits=y))

    train_op=tf.train.AdamOptimizer(learn_rate).minimize(loss)

    correct_prediction = tf.equal(tf.argmax(y, 1), tf.argmax(y_, 1))
    # Calculate accuracy
    accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

sess=tf.InteractiveSession(graph=graph)

tf.global_variables_initializer().run()

for step in range(num_steps):
    batch_xs, batch_ys = mnist.train.next_batch(batch_size)
    train_op.run({x:batch_xs,y_:batch_ys,keep:droup_out})
    if step % disp_step==0:
        print("step",step,'acc',accuracy.eval({x:batch_xs,y_:batch_ys,keep:droup_out}),
              'loss',loss.eval({x:batch_xs,y_:batch_ys,keep:droup_out}))

# test acc
print('test acc',accuracy.eval({x:mnist.test.images,y_:mnist.test.labels,keep:1.}))

sess.close()

注：该方法其实可以达到去除全连接层，即在使用CNN卷积时，可以使用rnn替换全连接层
另一种去除全连接层方法，只使用CNN层，不使用全连接层
如：【n,28,28,1】->[n,14,14,32]->[n,7,7,64]->[n,3,3,128]->[n,1,1,10]->[n,10]
这样最后一层其实就相当于全连接层

风吴痕

关注

0
点赞
踩
1

收藏

觉得还不错? 一键收藏
0
评论
Tensorflow-rnn(mnist分类)

1、多层rnn#!/usr/bin/python3# -*- coding:utf-8 -*-import tensorflow as tfimport numpy as np# from tensorflow.contrib.layers.python.layers import batch_normfrom tensorflow.contrib import rnnfrom tens
复制链接

扫一扫