The dropout regularization method
When a network overfits, dropout can be used to randomly deactivate a fraction of its nodes on each training pass; backpropagation then updates only the surviving connections, so the network cannot rely too heavily on any single node.
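As a minimal sketch of the idea (plain NumPy, separate from the TensorFlow example below; the keep probability and activation values are illustrative):

import numpy as np

keep_prob = 0.5                                      # illustrative keep probability
activations = np.array([0.2, 1.3, 0.8, 2.1, 0.5])    # illustrative layer outputs

# Each node survives with probability keep_prob; dropped nodes
# contribute nothing to the forward or backward pass for this step.
mask = np.random.rand(activations.shape[0]) < keep_prob
dropped = activations * mask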
Implementing dropout
TensorFlow's tf.nn.dropout implements inverted dropout: the kept activations are scaled up by 1/keep_prob at training time, so the expected activation is unchanged and no rescaling is needed at test time.
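Continuing the NumPy sketch above, the only change is the 1/keep_prob scaling applied during training:

# Inverted dropout: scale the kept activations so their expected value
# matches the no-dropout case; at test time simply use keep_prob = 1.
output = activations * mask / keep_prob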
The example below uses a three-layer network (64-dimensional input, a 50-unit hidden layer, a 10-unit output) on the sklearn digits dataset; the code targets the TensorFlow 1.x API.
import tensorflow as tf
from sklearn.datasets import load_digits
from sklearn.model_selection import train_test_split  # cross_validation was removed from sklearn
from sklearn.preprocessing import LabelBinarizer

# Load the 8x8 digit images (64 features) and one-hot encode the 10 class labels.
digits = load_digits()
X = digits.data
y = digits.target
y = LabelBinarizer().fit_transform(y)
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=.3)
def add_lay(input, in_size, out_size, layer_name, activation_function=None):
    Weights = tf.Variable(tf.random_normal([in_size, out_size]))
    biases = tf.Variable(tf.zeros([1, out_size]) + 0.1)
    Wx_plus_b = tf.matmul(input, Weights) + biases
    # Apply dropout to the pre-activation values; keep_prob is the
    # placeholder defined below and is fed at session run time.
    Wx_plus_b = tf.nn.dropout(Wx_plus_b, keep_prob)
    if activation_function is None:
        output = Wx_plus_b
    else:
        output = activation_function(Wx_plus_b)
    tf.summary.histogram(layer_name + '/output', output)
    return output
keep_prob = tf.placeholder(tf.float32)  # fraction of activations to keep (not drop)
xs = tf.placeholder(tf.float32, [None, 64])
ys = tf.placeholder(tf.float32, [None, 10])
l1 = add_lay(xs, 64, 50, 'l1', activation_function=tf.nn.tanh)             # hidden layer
prediction = add_lay(l1, 50, 10, 'l2', activation_function=tf.nn.softmax)  # output layer
# Cross-entropy loss: summed over the 10 classes, averaged over the batch.
cross_entropy = tf.reduce_mean(-tf.reduce_sum(ys * tf.log(prediction),
                                              reduction_indices=[1]))
tf.summary.scalar('loss', cross_entropy)
train_step = tf.train.GradientDescentOptimizer(0.6).minimize(cross_entropy)
init = tf.global_variables_initializer()  # initialize_all_variables is deprecated
sess = tf.Session()
merged = tf.summary.merge_all()
# Separate writers so the train and test loss curves can be compared in TensorBoard.
train_writer = tf.summary.FileWriter('logs/train', sess.graph)
test_writer = tf.summary.FileWriter('logs/test', sess.graph)
sess.run(init)
for i in range(500):
    # Train with dropout on: keep 50% of the activations.
    sess.run(train_step, feed_dict={xs: X_train, ys: y_train, keep_prob: 0.5})
    if i % 50 == 0:
        # Evaluate with dropout off (keep_prob = 1) so every node participates.
        train_result = sess.run(merged, feed_dict={xs: X_train, ys: y_train, keep_prob: 1})
        test_result = sess.run(merged, feed_dict={xs: X_test, ys: y_test, keep_prob: 1})
        train_writer.add_summary(train_result, i)
        test_writer.add_summary(test_result, i)
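After training, the two summary streams can be compared in TensorBoard; with dropout enabled the test-loss curve should track the training curve much more closely than without it:

tensorboard --logdir=logs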