全文参考地址:
https://github.com/jikexueyuanwiki/tensorflow-zh/blob/130a43845711cfad8e7d46e75300558349b36b57/SOURCE/tutorials/mnist_beginners.md
修改部分为input_data代码(该文件用于提供Minst的下载和导入),本身该程序提供自动下载功能,可是一直不成功,之后只能手动下载,下载之后将文件放入当前目录的MINST_data文件夹下。修改代码如下(就只修改了read_data_sets函数):
def read_data_sets(train_dir, fake_data=False, one_hot=False, dtype=tf.float32):
class DataSets(object):
pass
data_sets = DataSets()
if fake_data:
def fake():
return DataSet([], [], fake_data=True, one_hot=one_hot, dtype=dtype)
data_sets.train = fake()
data_sets.validation = fake()
data_sets.test = fake()
return data_sets
TRAIN_IMAGES = 'train-images-idx3-ubyte.gz'
TRAIN_LABELS = 'train-labels-idx1-ubyte.gz'
TEST_IMAGES = 't10k-images-idx3-ubyte.gz'
TEST_LABELS = 't10k-labels-idx1-ubyte.gz'
VALIDATION_SIZE = 5000
#local_file = maybe_download(TRAIN_IMAGES, train_dir)
local_file = train_dir + "/" + TRAIN_IMAGES
train_images = extract_images(local_file)
#local_file = maybe_download(TRAIN_LABELS, train_dir)
local_file = train_dir + "/" + TRAIN_LABELS
train_labels = extract_labels(local_file, one_hot=one_hot)
#local_file = maybe_download(TEST_IMAGES, train_dir)
local_file = train_dir + "/" + TEST_IMAGES
test_images = extract_images(local_file)
#local_file = maybe_download(TEST_LABELS, train_dir)
local_file = train_dir + "/" + TEST_LABELS
test_labels = extract_labels(local_file, one_hot=one_hot)
validation_images = train_images[:VALIDATION_SIZE]
validation_labels = train_labels[:VALIDATION_SIZE]
train_images = train_images[VALIDATION_SIZE:]
train_labels = train_labels[VALIDATION_SIZE:]
data_sets.train = DataSet(train_images, train_labels, dtype=dtype)
data_sets.validation = DataSet(validation_images, validation_labels,
dtype=dtype)
data_sets.test = DataSet(test_images, test_labels, dtype=dtype)
return data_sets
softmax 简单测试代码如下:
#导入Minst数据集
import input_data
mnist = input_data.read_data_sets("MINST_data",one_hot=True)
#导入tensorflow库
import tensorflow as tf
#输入变量,把28*28的图片变成一维数组(丢失结构信息)
x = tf.placeholder("float",[None,784])
#权重矩阵,把28*28=784的一维输入,变成0-9这10个数字的输出
w = tf.Variable(tf.zeros([784,10]))
#偏置
b = tf.Variable(tf.zeros([10]))
#核心运算,其实就是softmax(x*w+b)
y = tf.nn.softmax(tf.matmul(x,w) + b)
#这个是训练集的正确结果
y_ = tf.placeholder("float",[None,10])
#交叉熵,作为损失函数
cross_entropy = -tf.reduce_sum(y_ * tf.log(y))
#梯度下降算法,最小化交叉熵
train_step = tf.train.GradientDescentOptimizer(0.01).minimize(cross_entropy)
#初始化,在run之前必须进行的
init = tf.initialize_all_variables()
#创建session以便运算
sess = tf.Session()
sess.run(init)
#迭代1000次
for i in range(1000):
#获取训练数据集的图片输入和正确表示数字
batch_xs, batch_ys = mnist.train.next_batch(100)
#运行刚才建立的梯度下降算法,x赋值为图片输入,y_赋值为正确的表示数字
sess.run(train_step,feed_dict = {x:batch_xs, y_: batch_ys})
#tf.argmax获取最大值的索引。比较运算后的结果和本身结果是否相同。
#这步的结果应该是[1,1,1,1,1,1,1,1,0,1...........1,1,0,1]这种形式。
#1代表正确,0代表错误
correct_prediction = tf.equal(tf.argmax(y,1), tf.argmax(y_,1))
#tf.cast先将数据转换成float,防止求平均不准确。
#tf.reduce_mean由于只有一个参数,就是上面那个数组的平均值。
accuracy = tf.reduce_mean(tf.cast(correct_prediction,"float"))
#输出
print sess.run(accuracy,feed_dict={x:mnist.test.images,y_: mnist.test.labels})
这个程序就是了解简单的tensorflow流程,api可以参考https://www.tensorflow.org