#《深度学习原理与TensorFlow实战》04 CNN看懂世界
# 书源码地址:https://github.com/DeepVisionTeam/TensorFlowBook.git
# 视频讲座地址:http://edu.csdn.net/course/detail/5222
# win10 Tensorflow1.2.0 python3.6.1
# CUDA v8.0 cudnn-8.0-windows10-x64-v5.1
# 本地代码位置:D:\git\DeepLearning\TensorFlowBook\neural_style\neural_style.py
# https://github.com/DeepVisionTeam/TensorFlowBook/blob/master/neural_style/neural_style.py
# https://github.com/DeepVisionTeam/TensorFlowBook/blob/master/neural_style/flower.jpg
# https://github.com/DeepVisionTeam/TensorFlowBook/blob/master/neural_style/starry_night.jpg
# 当前目录下需要手动创建 out 目录,生成的5张图片在out目录中
# 手动下载 http://www.vlfeat.org/matconvnet/models/imagenet-vgg-verydeep-19.mat 到当前目录
# 需要修改weights[i][0][0][0][0]==>weights[i][0][0][2][0]
# neural_style.py
import os
import sys
import numpy as np
import scipy.io
import tensorflow as tf
from PIL import Image
# Command-line flags: paths of the two input images and the optimiser settings
# that the __main__ block forwards to stylize().
tf.app.flags.DEFINE_string('style_image', 'starry_night.jpg', 'style image')
tf.app.flags.DEFINE_string('content_image', 'flower.jpg', 'content image')
tf.app.flags.DEFINE_integer('epochs', 500, 'training epochs')
tf.app.flags.DEFINE_float('learning_rate', 0.5, 'learning rate')
FLAGS = tf.app.flags.FLAGS
# Multipliers applied in total_loss() to every style-layer loss and every
# content-layer loss respectively.
STYLE_WEIGHT = 10.
CONTENT_WEIGHT = 1.
# Keys of the dict returned by vgg19() whose activations are compared for the
# style term and for the content term of the loss.
STYLE_LAYERS = ['relu1_1', 'relu2_1', 'relu3_1', 'relu4_1', 'relu5_1']
CONTENT_LAYERS = ['relu4_2']
# Module-level cache for the parsed .mat file; filled by the first successful
# vgg_params() call.
_vgg_params = None


def vgg_params():
    """Return the parsed pre-trained VGG-19 ``.mat`` file, loading it only once.

    ``imagenet-vgg-verydeep-19.mat`` is looked up relative to the current
    working directory.  The first successful call parses it with
    ``scipy.io.loadmat`` and stores the result in the module-level
    ``_vgg_params``; every later call returns that same cached object.

    Returns:
        The dict produced by ``scipy.io.loadmat`` for the weights file.

    Raises:
        SystemExit: with exit code 1, after writing a download hint to
            stderr, when the weights file is not present.
    """
    global _vgg_params
    if _vgg_params is not None:
        return _vgg_params

    mat_path = 'imagenet-vgg-verydeep-19.mat'
    if not os.path.isfile(mat_path):
        sys.stderr.write('Please download imagenet-vgg-verydeep-19.mat from'
                         ' http://www.vlfeat.org/matconvnet/models/imagenet-vgg-verydeep-19.mat\n')
        sys.exit(1)

    _vgg_params = scipy.io.loadmat(mat_path)
    return _vgg_params
def vgg19(input_image):
    """Build the VGG-19 conv/pool stack on top of ``input_image``.

    Weights come from ``vgg_params()['layers'][0]`` and are embedded in the
    graph as constants, so the network itself has no trainable variables.

    Args:
        input_image: value fed to the first ``tf.nn.conv2d``.  Callers in this
            file pass a one-element list wrapping an image tensor
            (presumably height x width x 3 -- confirm against the caller).

    Returns:
        dict mapping every layer name in ``layers`` to a tensor.  Because the
        ReLU is applied inside the ``conv`` branch, a ``convX_Y`` entry and
        its ``reluX_Y`` entry refer to the same post-ReLU tensor.
    """
    layers = (
        'conv1_1', 'relu1_1', 'conv1_2', 'relu1_2', 'pool1',
        'conv2_1', 'relu2_1', 'conv2_2', 'relu2_2', 'pool2',
        'conv3_1', 'relu3_1', 'conv3_2', 'relu3_2', 'conv3_3',
        'relu3_3', 'conv3_4', 'relu3_4', 'pool3',
        'conv4_1', 'relu4_1', 'conv4_2', 'relu4_2', 'conv4_3',
        'relu4_3', 'conv4_4', 'relu4_4', 'pool4',
        'conv5_1', 'relu5_1', 'conv5_2', 'relu5_2', 'conv5_3',
        'relu5_3', 'conv5_4', 'relu5_4', 'pool5'
    )
    weights = vgg_params()['layers'][0]
    net = input_image
    network = {}
    for i, name in enumerate(layers):
        layer_type = name[:4]
        if layer_type == 'conv':
            # Entry i of the .mat 'layers' array carries this layer's
            # (kernels, bias) pair at index [0][0][2][0].
            kernels, bias = weights[i][0][0][2][0]
            # Swap the first two kernel axes -- presumably the .mat layout is
            # (width, height, in, out) while TensorFlow wants
            # (height, width, in, out); TODO confirm.
            kernels = np.transpose(kernels, (1, 0, 2, 3))
            conv = tf.nn.conv2d(net, tf.constant(kernels),
                                strides=(1, 1, 1, 1), padding='SAME',
                                name=name)
            net = tf.nn.bias_add(conv, bias.reshape(-1))
            net = tf.nn.relu(net)
        elif layer_type == 'pool':
            net = tf.nn.max_pool(net, ksize=(1, 2, 2, 1),
                                 strides=(1, 2, 2, 1),
                                 padding='SAME')
        # 'relu' names fall through both branches and simply record the
        # activation already produced by the preceding conv step.
        network[name] = net
    return network
def content_loss(target_features, content_features):
    """Return the size-normalised L2 distance between two feature maps.

    Args:
        target_features: activations of the image being optimised.
        content_features: activations of the content image; its static shape
            (batch, height, width, channel) supplies the normaliser.

    Returns:
        Scalar tensor: ``tf.nn.l2_loss(target - content)`` divided by
        ``height * width * channel`` of ``content_features``.
    """
    _, height, width, channel = content_features.get_shape().as_list()
    content_size = height * width * channel
    return tf.nn.l2_loss(target_features - content_features) / content_size
def _normalized_gram(features, channel):
    """Return the channel-by-channel Gram matrix of ``features`` divided by its own size."""
    dims = features.get_shape().as_list()[1:]
    if None in dims:
        # Static shape is incomplete: fall back to the run-time element count
        # (batch axis excluded, matching the static branch).
        size = tf.cast(tf.reduce_prod(tf.shape(features)[1:]), features.dtype)
    else:
        size = dims[0] * dims[1] * dims[2]
    flat = tf.reshape(features, (-1, channel))
    return tf.matmul(tf.transpose(flat), flat) / size


def style_loss(target_features, style_features):
    """Return the normalised L2 distance between the Gram matrices of two feature maps.

    Each Gram matrix is divided by the element count (height * width *
    channel) of the feature map it was computed from.  Normalising the style
    Gram by the target's size instead would put the two matrices on different
    scales whenever the style and content images differ in resolution; when
    both feature maps have the same shape the result is unchanged.

    Args:
        target_features: activations of the image being optimised, with a
            statically known channel dimension.
        style_features: activations of the style image at the same layer.

    Returns:
        Scalar tensor: ``tf.nn.l2_loss(target_gram - style_gram)`` divided by
        ``channel * channel``.
    """
    channel = target_features.get_shape().as_list()[-1]
    target_gram = _normalized_gram(target_features, channel)
    style_gram = _normalized_gram(style_features, channel)
    gram_size = channel * channel
    return tf.nn.l2_loss(target_gram - style_gram) / gram_size
def total_loss(content_image, style_image, target_image):
    """Return the weighted sum of content and style losses for ``target_image``.

    Three separate VGG-19 graphs are built, one per image; each image is
    wrapped in a one-element list before being handed to ``vgg19``.

    Args:
        content_image: image whose CONTENT_LAYERS activations the target
            should match.
        style_image: image whose STYLE_LAYERS Gram statistics the target
            should match.
        target_image: the image being optimised.

    Returns:
        Scalar tensor: CONTENT_WEIGHT times each content-layer loss plus
        STYLE_WEIGHT times each style-layer loss.
    """
    style_feats = vgg19([style_image])
    content_feats = vgg19([content_image])
    target_feats = vgg19([target_image])

    loss = 0.0
    for layer in CONTENT_LAYERS:
        layer_loss = content_loss(target_feats[layer], content_feats[layer])
        loss += CONTENT_WEIGHT * layer_loss
    for layer in STYLE_LAYERS:
        layer_loss = style_loss(target_feats[layer], style_feats[layer])
        loss += STYLE_WEIGHT * layer_loss
    return loss
def stylize(style_image, content_image, learning_rate=0.1, epochs=500):
    """Optimise a copy of ``content_image`` towards ``style_image``'s style.

    The target image is the only variable; it is initialised from
    ``content_image`` and updated with Adam on ``total_loss``.  The loss is
    printed every iteration, and every 100th iteration the current target is
    written to ``out/neural_<iteration>.jpg`` after adding 128 and clipping
    to [0, 255].

    Args:
        style_image: array for the style image, already offset by -128 by the
            caller in this file.
        content_image: array for the content image, offset the same way.
        learning_rate: learning rate passed to ``tf.train.AdamOptimizer``.
        epochs: number of optimisation steps to run.

    Returns:
        None.  Results are written to the ``out`` directory.
    """
    target = tf.Variable(content_image, dtype=tf.float32)
    style_input = tf.constant(style_image, dtype=tf.float32)
    content_input = tf.constant(content_image, dtype=tf.float32)
    cost = total_loss(content_input, style_input, target)
    train_op = tf.train.AdamOptimizer(learning_rate).minimize(cost)

    # Create the output directory up front so a missing folder cannot abort
    # the run at the first save, 100 iterations in.
    os.makedirs('out', exist_ok=True)

    with tf.Session() as sess:
        tf.global_variables_initializer().run()
        for i in range(epochs):
            _, loss, target_image = sess.run([train_op, cost, target])
            print("iter:%d, loss:%.9f" % (i, loss))
            if (i + 1) % 100 == 0:
                # Undo the -128 offset applied to the inputs before saving.
                image = np.clip(target_image + 128.0, 0, 255).astype(np.uint8)
                Image.fromarray(image).save("out/neural_%d.jpg" % (i + 1))
if __name__ == '__main__':
    # Load both images as 3-channel RGB (the VGG kernels expect three input
    # channels, so grayscale/RGBA/CMYK files are converted) and shift pixel
    # values by -128; stylize() adds the offset back before saving.
    style = Image.open(FLAGS.style_image).convert('RGB')
    style = np.array(style).astype(np.float32) - 128.0
    content = Image.open(FLAGS.content_image).convert('RGB')
    content = np.array(content).astype(np.float32) - 128.0
    stylize(style, content, FLAGS.learning_rate, FLAGS.epochs)
'''
# 需要在neural_style.py同级目录创建out目录,否则,在
# Image.fromarray(image).save("out/neural_%d.jpg" % (i + 1))时会报错
iter:0, loss:15626503.000000000
iter:1, loss:14949413.000000000
iter:2, loss:14318100.000000000
![这里写图片描述](https://img-blog.csdn.net/20170707133148507?watermark/2/text/aHR0cDovL2Jsb2cuY3Nkbi5uZXQvbG9uZ2pp/font/5a6L5L2T/fontsize/400/fill/I0JBQkFCMA==/dissolve/70/gravity/SouthEast)
iter:3, loss:13735171.000000000
iter:4, loss:13194825.000000000
...
iter:497, loss:553536.812500000
iter:498, loss:553092.062500000
iter:499, loss:552648.937500000
'''
# 生成图片效果