TensorFlow自学笔记-06 基于官方文档 反向传播
import tensorflow as tf
from tensorflow.examples.tutorials.mnist import input_data
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)
n_input = 784
n_classes = 10
max_epochs = 10000
learning_rate = 0.5
batch_size = 10
seed = 0
n_hidden = 10
def sigmaprime(x):
return tf.multiply(tf.sigmoid(x), tf.subtract(tf.constant(1.0), tf.sigmoid(x)))
x_in = tf.placeholder(tf.float32, [None, n_input])
y = tf.placeholder(tf.float32, [None, n_classes])
def multilayer_perceptron(x, weights, biases):
h_layer_1 = tf.add(tf.matmul(x, weights['h1']), biases['h1'])
out_layer_1 = tf.sigmoid(h_layer_1)
h_out = tf.matmul(out_layer_1, weights['out']) + biases['out']
return tf.sigmoid(h_out), h_out, out_layer_1, h_layer_1
weights = {'h1': tf.Variable(tf.random_normal([n_input, n_hidden], seed=seed)),
'out': tf.Variable(tf.random_normal([n_hidden, n_classes], seed=seed))}
biases = {'h1': tf.Variable(tf.random_normal([1, n_hidden], seed=seed)),
'out': tf.Variable(tf.random_normal([1, n_classes], seed=seed))}
y_hat, h_2, o_1, h_1 = multilayer_perceptron(x_in, weights, biases)
err = y_hat - y
delta_2 = tf.multiply(err, sigmaprime(h_2))
delta_w_2 = tf.matmul(tf.transpose(o_1), delta_2)
wtd_error = tf.matmul(delta_2, tf.transpose(weights['out']))
delta_1 = tf.multiply(wtd_error, sigmaprime(h_1))
delta_2 = tf.matmul(tf.transpose(x_in), delta_1)
eta = tf.constant(learning_rate)
step = [tf.assign(weights['h1'], tf.subtract(weights['h1'],
tf.multiply(eta, tf.reduce_mean(delta_1, axis=[0])))),
tf.assign(weights['out'], tf.subtract(weights['out'],
tf.multiply(eta, delta_w_2))),
tf.assign(biases['out'], tf.subtract(biases['out'],
tf.multiply(eta, tf.reduce_mean(delta_2, axis=[0]))))]
acct_mat = tf.equal(tf.argmax(y_hat, 1), tf.argmax(y, 1))
accuracy = tf.reduce_sum(tf.cast(acct_mat, tf.float32))
init = tf.global_variables_initializer()
with tf.Session() as sess:
sess.run(init)
for epoch in range(max_epochs):
batch_xs, batch_ys = mnist.train.next_batch(batch_size)
sess.run(step, feed_dict={x_in: batch_xs, y: batch_ys})
if epoch % 1000 == 0:
acc_test = sess.run(accuracy, feed_dict={x_in: mnist.test.images, y: mnist.test.labels})
acc_train = sess.run(accuracy, feed_dict={x_in: mnist.train.images, y: mnist.train.labels})
print('Epoch: {0} Accuracy Train%: {1} Accuracy Teat%: {2}'.format(epoch, acc_train/600, (acc_test/100)))