I've been busy lately with some practical gait-recognition work and forgot to keep posting my TensorFlow learning notes.
This post explains how to build your own training model with Google's TensorFlow.
After studying it for a while, I found the process is quite similar to that of another deep learning framework, Caffe. On to the code:
############################################################################################
#!/usr/bin/python2.7
# -*- coding: utf-8 -*-
#Author : zhaoqinghui
#Date : 2016.5.10
#Function: 1. Read training_index.txt, organize the training data, and implement next_batch
#2. Data preprocessing
#3. Build the model
#4. Train and save a cpkt model
##########################################################################################
import tensorflow as tf
import numpy as np
import math
import cv2
import sys
import os
import os.path
from scipy import ndimage
#-------read the training_index.txt--------#
training_index = './training_index.txt'
modelpath="./tmp/"
classnum=36
total_image = 6297*3
global_step = 0                              # batch counter within the current pass over the data
global_idx = np.arange(total_image)          # index permutation, reshuffled after each full pass
images_g = np.zeros((total_image, 784))      # flattened 28x28 training images, filled in by read_image()
labels_g = np.zeros((total_image, classnum)) # one-hot labels, filled in by read_image()
max_epoch = 5000
def read_traing_list():
    train_image_dir = []
    train_label_dir = []
    reader = open(training_index)
    while 1:
        line = reader.readline()
        #print line
        tmp = line.split(" ")
        # print tmp
        if not line:
            break
        train_image_dir.append(tmp[0])
        train_label_dir.append(tmp[1][0:-1])
    #print train_image_dir[1:total_image]
    #print train_label_dir[1:total_image]
    return train_image_dir, train_label_dir
#------run the preprocess-------#
class Dataset(object):
    # Simple image/label container (defined here but not actually used by the training code below).
    def __init__(self, image, label, dtype=tf.float32):
        self._image = image
        self._label = label
    @property
    def image(self):
        return self._image
    @property
    def label(self):
        return self._label
#------centering: shift the image content so its center of mass sits at the middle of the frame------
def getBestShift(img):
    cy,cx = ndimage.measurements.center_of_mass(img)
    rows,cols = img.shape
    shiftx = np.round(cols/2.0-cx).astype(int)
    shifty = np.round(rows/2.0-cy).astype(int)
    return shiftx, shifty
def shift(img,shiftx,shifty):
    rows, cols = img.shape
    M = np.float32([[1,0,shiftx],[0,1,shifty]])
    shifted = cv2.warpAffine(img,M,(cols,rows))
    return shifted
def read_image():
    train_image_dir, train_label_dir = read_traing_list()
    images = []
    labels = []
    ss=[]
    index = 0
    global images_g
    global labels_g
    #print len(train_image_dir)
    for idx in range(len(train_image_dir)):
        image_tmp = cv2.imread(str(train_image_dir[idx]),cv2.IMREAD_GRAYSCALE)
        shiftx, shifty = getBestShift(image_tmp)
        gray = shift(image_tmp,shiftx,shifty)
        print train_image_dir[idx],train_label_dir[idx]
        #cv2.imshow("1",image_tmp)
        #cv2.waitKey(12)
        # print "jjgjg",image_tmp.shape
        label_tmp = int(str(train_label_dir[idx]))
        label_tmp2 = [0]*classnum
        label_tmp2[label_tmp] = 1
        images.append(gray.flatten()/255.0)   # use the centered image, normalized to [0, 1]
        # print label_tmp
        # print "label:", label_tmp2
        # print "label len:", len(labels)
        labels.append(label_tmp2)
        ss.append(train_image_dir[idx])
        index += 1
    print ss[100],labels[100]
    images = np.array(images)
    labels = np.array(labels)
    images_g = images
    labels_g = labels
    return images, labels
# read_image()
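# next_batch() hands out consecutive slices of the globally cached images/labels;
# when a slice would run past the end of the data, the index permutation is
# reshuffled, the arrays are reordered, and the step counter resets, so batches
# keep cycling over the whole training set.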
def next_batch(batch_size):
    global global_step
    global labels_g
    global images_g
    print global_step
    global global_idx
    # print labels_g.shape
    start = batch_size * global_step
    end = batch_size * (global_step+1)
    global_step += 1
    if(end >= total_image):
        np.random.shuffle(global_idx)
        global_step = 0
        start = 0
        end = batch_size
        images_g[:] = images_g[global_idx]
        labels_g[:] = labels_g[global_idx]
    print images_g.shape
    return images_g[start:end], labels_g[start:end]
def generate_test_image(test_size):
    global images_g
    global labels_g
    global global_idx
    np.random.shuffle(global_idx)
    images_g[:] = images_g[global_idx]
    labels_g[:] = labels_g[global_idx]
    return images_g[0:test_size], labels_g[0:test_size]
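# Note: generate_test_image() draws its "test" samples from the same pool that
# next_batch() trains on, so the final accuracy printed at the end is an
# optimistic estimate rather than a true held-out test score.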
#--------run CNN model-----#
def CNNmodel():
    x = tf.placeholder(tf.float32,[None,28*28])
    y_ = tf.placeholder(tf.float32,[None,classnum])
    def weight_variable(shape):
        init = tf.truncated_normal(shape,stddev = 0.1)
        return tf.Variable(init)
    def bias_variable(shape):
        init = tf.constant(0.1, shape = shape)
        return tf.Variable(init)
    ## Declare the convolution and pooling ops
    ## The convolution declared here is the vanilla version: stride 1, zero-padded ('SAME') so the output keeps the input size
    ## The pooling op is 2x2 max pooling
    def conv2d(x,W):
        # strides: [batch, in_height, in_width, in_channels]
        return tf.nn.conv2d(x,W,strides = [1,1,1,1],padding = 'SAME')
    def maxpool2d(x):
        return tf.nn.max_pool(x,ksize = [1,2,2,1], strides = [1,2,2,1],padding = 'SAME')
    ## Build the model
    # First layer: [a convolution followed by max pooling]; the convolution patch is 5x5, the input has 1 channel (grayscale), and the output is 32 feature maps
    # [5,5,1,32]: 5x5 patch, 1 input channel, 32 output channels (32 is a design choice of the network, not a computed value)
    x_image = tf.reshape(x,[-1,28,28,1]) # reshape the flat 784-vector into the NHWC format the conv layer expects
    W_conv1 = weight_variable([5,5,1,32])
    b_conv1 = bias_variable([32])
    # apply the ops in order: conv, relu, maxpool
    h_conv1 = tf.nn.relu(conv2d(x_image,W_conv1)+b_conv1)
    h_pool1 = maxpool2d(h_conv1)
    # Second layer: [a convolution plus a maxpool]
    W_conv2 = weight_variable([5,5,32,64])
    b_conv2 = bias_variable([64])
    h_conv2 = tf.nn.relu(conv2d(h_pool1,W_conv2)+b_conv2)
    h_pool2 = maxpool2d(h_conv2)
    # Fully connected layer with 1024 neurons; after two 2x2 max poolings (stride 2 each), the feature map has shrunk to 7x7
    W_fc1 = weight_variable([7*7*64,1024])
    b_fc1 = bias_variable([1024])
    h_pool2_flat = tf.reshape(h_pool2,[-1,7*7*64])
    h_fc1 = tf.nn.relu(tf.matmul(h_pool2_flat,W_fc1)+b_fc1)
    # Apply dropout during training; remember to turn it off at test time
    # keep_prob is the probability of keeping a unit; 1.0 means no dropout
    keep_prob = tf.placeholder("float") # fed in at run time
    h_fc1_drop = tf.nn.dropout(h_fc1,keep_prob)
    # add the softmax layer
    W_fc2 = weight_variable([1024,classnum])
    b_fc2 = bias_variable([classnum])
    y_conv = tf.nn.softmax(tf.matmul(h_fc1_drop,W_fc2)+b_fc2)
    # loss
    cross_entropy = -tf.reduce_sum(y_*tf.log(y_conv))
    train_step = tf.train.AdamOptimizer(1e-4).minimize(cross_entropy)
    correct_prediction = tf.equal(tf.argmax(y_conv,1),tf.argmax(y_,1))
    accuracy = tf.reduce_mean(tf.cast(correct_prediction,"float"))
    predict = [tf.reduce_max(y_conv),tf.argmax(y_conv,1)[0]]
    saver = tf.train.Saver()
    checkpoint_dir = modelpath+'train_model.cpkt'
    if not os.path.exists(modelpath) or os.path.isfile(modelpath):
        os.makedirs(modelpath)
    sess = tf.InteractiveSession()
    sess.run(tf.initialize_all_variables())
    # Training loop: each step trains on a batch of classnum*2 (=72) samples; every classnum steps
    # the accuracy on the current batch is printed, and training stops early once it reaches 1.0.
    for idx in range(max_epoch):
        imagess, labelss = next_batch(classnum*2)
        if idx%classnum == 0:
            acc = sess.run(accuracy,feed_dict={x:imagess,y_: labelss,keep_prob:1.0})
            if acc == 1.0:
                break
            print "At epoch %d, acc is %lf" % (idx,acc)
        sess.run(train_step,feed_dict={x:imagess,y_: labelss,keep_prob:0.5})
    saver.save(sess,checkpoint_dir)
    test_image,test_label = generate_test_image(900)
    print "Total test acc: ", sess.run(accuracy,feed_dict={x:test_image,y_:test_label,keep_prob:1.0})
if __name__ == '__main__':
    read_image()
    CNNmodel()
This time I took a fairly simple approach: instead of using a TFRecord dataset, I read the images directly with OpenCV, build a list of images, and feed that list into the CNN model for training, which yields the resulting cpkt checkpoint. The contents of training_index.txt are shown in the figure.
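For reference, here is a hypothetical illustration of the line format that read_traing_list() expects: each line contains an image path, a single space, and an integer class label between 0 and classnum-1. The paths and labels below are invented, not the actual file contents, and each image is assumed to be a 28x28 grayscale picture (the script flattens it to 784 values and the model reshapes it back to 28x28):
./data/train/img_000001.png 0
./data/train/img_000002.png 7
./data/train/img_000003.png 35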