数据集地址,这份数据集是猫的图片和狗的图片,是谷歌摘取了一部分Kaggle的猫狗分类图片集。这次我们并没有给出制作好的数据集,而是只有放在两个不同文件夹内的猫和狗的图片。
我们第一步先用PIL把图片格式统一一下,我们这里将像素改为(150*150)。
import os
from PIL import Image
base_dir = './dataset/cats_and_dogs_filtered'
train_dir = os.path.join(base_dir, 'train')
validation_dir = os.path.join(base_dir, 'validation')
train_cats_dir = os.path.join(train_dir, 'cats/')
train_dogs_dir = os.path.join(train_dir, 'dogs/')
validation_cats_dir = os.path.join(validation_dir, 'cats/')
validation_dogs_dir = os.path.join(validation_dir, 'dogs/')
train_cat_fnames = os.listdir(train_cats_dir)
train_dog_fnames = os.listdir(train_dogs_dir)
validation_cat_fnames = os.listdir(validation_cats_dir)
validation_dog_fnames = os.listdir(validation_dogs_dir)
os.mkdir(train_dir + '/resize_cats')
os.mkdir(train_dir + '/resize_dogs')
os.mkdir(validation_dir + '/resize_cats')
os.mkdir(validation_dir + '/resize_dogs')
for i in train_cat_fnames:
original_img = Image.open(train_cats_dir+i)
clipping_img = original_img.resize((150, 150), Image.ANTIALIAS)
clipping_img.save(train_dir+'/resize_cats/'+i)
for i in train_dog_fnames:
original_img = Image.open(train_dogs_dir + i)
clipping_img = original_img.resize((150, 150), Image.ANTIALIAS)
clipping_img.save(train_dir + '/resize_dogs/' + i)
for i in validation_cat_fnames:
original_img = Image.open(validation_cats_dir + i)
clipping_img = original_img.resize((150, 150), Image.ANTIALIAS)
clipping_img.save(validation_dir + '/resize_cats/' + i)
for i in validation_dog_fnames:
original_img = Image.open(validation_dogs_dir + i)
clipping_img = original_img.resize((150, 150), Image.ANTIALIAS)
clipping_img.save(validation_dir + '/resize_dogs/' + i)
下一步我们将猫狗图片制作成tfrecords格式的文件。
import os
import tensorflow as tf
from PIL import Image
cwd = './dataset/cats_and_dogs_filtered/train/'
classes = ('