【keras】图片压缩自建训练集

最新推荐文章于 2024-06-23 20:28:38 发布

Big Orange...

最新推荐文章于 2024-06-23 20:28:38 发布

阅读量230

点赞数

分类专栏：深度学习 keras 文章标签： keras 深度学习 pytorch

本文链接：https://blog.csdn.net/liuzhicheng1845/article/details/120032694

版权

深度学习同时被 2 个专栏收录

6 篇文章 0 订阅

订阅专栏

keras

4 篇文章 0 订阅

订阅专栏

prepare.py

import numpy as np
import cv2
def divide(img,K):  #每一块的大小
  col = K*K
  nrows,ncols = img.shape
  R = int(nrows/K)
  C = int(ncols/K)
  vec = np.ones((R*C,col))
  row = 0
  for i in range(R):
    for j in range(C):
      vec[row,0:col] = img[i*K:(i+1)*K,j*K:(j+1)*K].reshape(1,col)
      row += 1
  return vec

wh0=100
wh=50
import os
dir_path='../../img'
names=os.listdir(dir_path)
data=np.ones(  (len(names)*3*int(wh0/wh)*int(wh0/wh),wh*wh)  )
print(  len(names)*3*int(wh0/wh)*int(wh0/wh),wh*wh  )
index=0
for file in names:
    filepath=os.path.join(dir_path,file)
    print(filepath)
    image = cv2.imread(filepath)
    image= cv2.resize(image,dsize=(wh0,wh0))

    r=image[:,:,0]
    g=image[:,:,1]
    b=image[:,:,2]

    r2=divide(r,wh)
    g2=divide(g,wh)
    b2=divide(b,wh)

    for i in range(r2.shape[0]):
        data[index+3*i  ,:]=r2[i,:]
        data[index+3*i+1,:]=g2[i,:]
        data[index+3*i+2,:]=b2[i,:]
    index=index+3*int(wh0/wh)*int(wh0/wh)
print(data.shape)
x_train = data.astype('float32') / 255.
np.savez('x_train',x_train=x_train,wh=wh,l=image.shape[0]/wh)

train.py

import keras
from keras import layers
from keras.datasets import mnist
import numpy as np
import cv2
npzfile=np.load('x_train.npz')
x_train=npzfile['x_train']
wh=npzfile['wh']#int(npzfile['wh']/npzfile['partion'])
print(wh)

data_dim=wh*wh
encoding_dim = wh*25  #编码维度 # 32 floats -> compression of factor 24.5, assuming the input is 784 floats
print(wh)
input_img = keras.Input(shape=(data_dim,))#This is our input image

encoded = layers.Dense(encoding_dim, activation='relu')(input_img)#编码层 #"encoded" is the encoded representation of the input
decoded = layers.Dense(data_dim, activation='sigmoid')(encoded)#编码、解码 #"decoded" is the lossy reconstruction of the input

#解码模型
autoencoder = keras.Model(input_img, decoded)# This model maps an input to its reconstruction
autoencoder.compile(optimizer='adam', loss='binary_crossentropy')#每像素二元交叉熵损失和 Adam 优化器
print(x_train.shape)
autoencoder.fit(x_train, x_train,#拟合
                epochs=60,#将数据使用多少遍
                batch_size=1,#将7500个数据分成多少份
                shuffle=True,
                validation_data=(x_train, x_train))
encoded_input = keras.Input(shape=(encoding_dim,))# This is our encoded (32-dimensional) input
autoencoder.save( filepath="modelResult.h5", overwrite=True, include_optimizer=True )

predict.py

import keras
from keras import layers
from keras.datasets import mnist
import numpy as np
import cv2
#数据读取
npzfile=np.load('x_train.npz')
x_train=npzfile['x_train']
wh=npzfile['wh']#int(npzfile['wh']/npzfile['partion'])
print(wh)

#数据处理
x_train = x_train.astype('float32') / 255.
x_train = x_train.reshape((len(x_train), np.prod(x_train.shape[1:])))

data_dim=wh*wh
encoding_dim = wh*25  #编码维度 # 32 floats -> compression of factor 24.5, assuming the input is 784 floats

input_img = keras.Input(shape=(data_dim,))#This is our input image#解码模型
encoded_input = keras.Input(shape=(encoding_dim,))# This is our encoded (32-dimensional) input
m=keras.models.load_model( "modelResult.h5" ).layers
encoder= keras.Model(input_img, m[1](input_img))#编码模型  # input_img 似乎没有参数#784
decoder = keras.Model(encoded_input, m[2](encoded_input))# Create the decoder model

encoded_imgs = encoder.predict(x_train)#32# 进行编码/解码测试 #Encode and decode some digits
decoded_imgs = decoder.predict(encoded_imgs)#784# Note that we take them from the *test* set
#https://blog.csdn.net/zhw864680355/article/details/103405677
'''
rgb=decoded_imgs.reshape(3,wh, wh)
result=255.*rgb.transpose((1,2,0))#getImg(rgb,wh,wh)
cv2.imwrite('test2.jpg',result)
'''
#图片效果展示 # Use Matplotlib (don't ask)
import matplotlib.pyplot as plt
n = 8  # How many digits we will display
plt.figure(figsize=(20, 4))
for i in range(n):# Display original
    ax = plt.subplot(2, n, i + 1)
    plt.imshow(x_train[i].reshape(wh, wh))
    plt.gray()
    ax.get_xaxis().set_visible(False)
    ax.get_yaxis().set_visible(False)

    # Display reconstruction
    ax = plt.subplot(2, n, i + 1 + n)
    plt.imshow(decoded_imgs[i].reshape(wh, wh))
    plt.gray()
    ax.get_xaxis().set_visible(False)
    ax.get_yaxis().set_visible(False)
plt.show()

Big Orange...

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
0
评论
【keras】图片压缩自建训练集

prepare.pyimport numpy as npimport cv2def divide(img,K): #每一块的大小 col = K*K nrows,ncols = img.shape R = int(nrows/K) C = int(ncols/K) vec = np.ones((R*C,col)) row = 0 for i in range(R): for j in range(C): vec[row,0:col] = img[i*K
复制链接

扫一扫