变分自编码器（VAE）代码

最新推荐文章于 2024-05-02 22:33:25 发布

DL方少

最新推荐文章于 2024-05-02 22:33:25 发布

阅读量647

点赞数

分类专栏：深度学习　文章标签：深度学习 机器学习 tensorflow

本文链接：https://blog.csdn.net/qq_46439619/article/details/113705555

版权

深度学习专栏收录该内容

9 篇文章 0 订阅

订阅专栏

#VAE编码器网络
import tensorflow as tf
import  keras
from keras import  layers
from keras import  backend as K
from keras.models import Model
import numpy as np
from keras.datasets import mnist
import matplotlib.pyplot as plt
from  scipy.stats import  norm
# Input geometry and hyper-parameters shared by the rest of the script.
img_shape = (28, 28, 1)
batch_size = 16
latent_dim = 2  # dimensionality of the latent space: a 2-D plane

# Encoder: four 3x3 convolutions (the second one uses a stride of 2),
# then a flatten and a small dense layer.
input_img = keras.Input(shape=img_shape)
x = layers.Conv2D(
    filters=32, kernel_size=3, padding='same', activation='relu'
)(input_img)
x = layers.Conv2D(
    filters=64, kernel_size=3, padding='same', activation='relu', strides=(2, 2)
)(x)
x = layers.Conv2D(
    filters=64, kernel_size=3, padding='same', activation='relu'
)(x)
x = layers.Conv2D(
    filters=64, kernel_size=3, padding='same', activation='relu'
)(x)

# Remember the feature-map shape before flattening; the decoder reuses it.
shape_before_flattening = K.int_shape(x)
x = layers.Flatten()(x)
x = layers.Dense(units=32, activation='relu')(x)

# The input image is ultimately encoded into these two parameters.
z_mean = layers.Dense(units=latent_dim)(x)
z_log_var = layers.Dense(units=latent_dim)(x)
# Latent-space sampling function.
def sampling(args):
    """Sample a latent point from the encoder's output parameters.

    Args:
        args: A pair ``(z_mean, z_log_var)`` of tensors.

    Returns:
        ``z_mean + exp(0.5 * z_log_var) * epsilon``, where ``epsilon`` is
        drawn from a normal distribution with mean 0 and stddev 1 and has
        shape ``(K.shape(z_mean)[0], latent_dim)``.
    """
    z_mean, z_log_var = args
    # Fix: the backend module is imported as ``K``; the original lowercase
    # ``k`` was an undefined name and raised NameError when the layer ran.
    epsilon = K.random_normal(
        shape=(K.shape(z_mean)[0], latent_dim), mean=0., stddev=1.
    )
    return z_mean + K.exp(0.5 * z_log_var) * epsilon
# Draw the latent point z from (z_mean, z_log_var) via the sampling function.
z = layers.Lambda(sampling)([z_mean, z_log_var])

# VAE decoder network: maps a latent-space point back to an image.
decoder_input = layers.Input(shape=K.int_shape(z)[1:])  # z is fed in here

# Expand the latent vector to as many units as the encoder's pre-Flatten
# feature map holds.
x = layers.Dense(
    units=np.prod(shape_before_flattening[1:]), activation='relu'
)(decoder_input)

# Reshape into a feature map with the same shape the encoder had right
# before its Flatten layer.
x = layers.Reshape(target_shape=shape_before_flattening[1:])(x)

# Stride-2 transposed convolution followed by a single-channel sigmoid
# convolution, decoding z into a feature map the size of the original input.
x = layers.Conv2DTranspose(
    filters=32, kernel_size=3, padding='same', activation='relu', strides=(2, 2)
)(x)
x = layers.Conv2D(
    filters=1, kernel_size=3, padding='same', activation='sigmoid'
)(x)

# Instantiate the decoder model (decoder_input -> decoded image) ...
decoder = Model(inputs=decoder_input, outputs=x)
# ... and apply it to z to obtain the decoded z.
z_decoded = decoder(z)
class CustomVariationalLayer(keras.layers.Layer):
    """Pass-through layer that registers the VAE loss on the model.

    ``call`` returns its first input unchanged; the layer exists only to
    compute the loss from the (input, decoded) pair and attach it with
    ``add_loss``.
    """

    # Fix: this method was originally misspelled ``vea_loss`` while ``call``
    # invoked ``self.vae_loss``, which raised AttributeError.
    def vae_loss(self, x, z_decoded):
        """Return the mean of the cross-entropy term plus the scaled KL term.

        Args:
            x: The original input tensor.
            z_decoded: The decoder output for the same batch.

        Returns:
            A scalar tensor: ``mean(xent_loss + kl_loss)``.
        """
        x = K.flatten(x)
        z_decoded = K.flatten(z_decoded)
        xent_loss = keras.metrics.binary_crossentropy(x, z_decoded)
        # NOTE: reads the module-level ``z_mean`` / ``z_log_var`` tensors
        # rather than taking them as arguments.
        kl_loss = -5e-4 * K.mean(
            1 + z_log_var - K.square(z_mean) - K.exp(z_log_var), axis=1
        )
        return K.mean(xent_loss + kl_loss)

    def call(self, inputs):
        """Attach the VAE loss for ``inputs`` and return the first input.

        Args:
            inputs: A sequence ``[x, z_decoded]``.

        Returns:
            ``x`` unchanged.
        """
        x = inputs[0]
        z_decoded = inputs[1]
        loss = self.vae_loss(x, z_decoded)
        self.add_loss(loss, inputs=inputs)
        return x
# Call the custom layer on the input and the decoded output to obtain the
# final model output.
y = CustomVariationalLayer()([input_img, z_decoded])

# Train the VAE.
vae = Model(input_img, y)
# loss=None: the loss is attached inside CustomVariationalLayer via add_loss.
vae.compile(optimizer='rmsprop', loss=None)
vae.summary()

# Fixes: ``x-train`` was a SyntaxError (cannot assign to an expression) and
# ``minist`` was an undefined name; the imported dataset module is ``mnist``.
(x_train, _), (x_test, y_test) = mnist.load_data()

# Scale pixel values by 1/255 and append a trailing channel axis.
# Fix: the original used ``x_train.reshape + (1,)`` (a bound method plus a
# tuple, which raises TypeError); ``.shape`` is what was intended.
x_train = x_train.astype('float32') / 255.
x_train = x_train.reshape(x_train.shape + (1,))
x_test = x_test.astype('float32') / 255.
x_test = x_test.reshape(x_test.shape + (1,))

# No targets are passed (y=None); the model is fit on the images alone.
vae.fit(
    x=x_train,
    y=None,
    shuffle=True,
    epochs=10,
    batch_size=batch_size,
    validation_data=(x_test, None),
)
# Sample a grid of points from the 2-D latent space and decode each one
# into an image.
n = 15  # display a 15 x 15 grid of digits
digit_size = 28
figure = np.zeros((digit_size * n, digit_size * n))

# Map evenly spaced probabilities in [0.05, 0.95] through the standard
# normal's percent-point function to get the latent grid coordinates.
grid_x = norm.ppf(np.linspace(0.05, 0.95, n))
grid_y = norm.ppf(np.linspace(0.05, 0.95, n))

for i, yi in enumerate(grid_x):
    # Fix: the original inner ``for`` line was missing its trailing colon.
    for j, xi in enumerate(grid_y):
        z_sample = np.array([[xi, yi]])
        # Repeat the point so that it forms one complete batch.
        z_sample = np.tile(z_sample, batch_size).reshape(batch_size, 2)
        x_decoded = decoder.predict(z_sample, batch_size=batch_size)
        # Every row of the batch is the same point, so keep the first image.
        digit = x_decoded[0].reshape(digit_size, digit_size)
        # Fix: the row slice ended at ``(i+i)*digit_size``; for i == 0 that is
        # an empty slice and for i > 1 it has the wrong height. The tile for
        # row i spans ``i*digit_size`` to ``(i+1)*digit_size``.
        figure[
            i * digit_size:(i + 1) * digit_size,
            j * digit_size:(j + 1) * digit_size,
        ] = digit

plt.figure(figsize=(10, 10))
plt.imshow(figure, cmap='Greys_r')
plt.show()

DL方少

关注

0
点赞
踩
3

收藏

觉得还不错? 一键收藏
0
评论
变分自编码器（VAE）代码

#VAE编码器网络 import tensorflow as tf import keras from keras import layers from keras import backend as K from keras.models import Model import numpy as np from keras.datasets import mnist import matplotlib.pyplot as plt from scipy.stats import norm img_…
复制链接

扫一扫