dataset ==map()
dataset 是一个 iterator (列表引子)
tf.data.Dataset.from_tensor_slices 将样本集中每一个样本|按行拆分样本集
拆分为 一个一个的样本,放在列表中迭代器中
import tensorflow as tf
import os
AUTOTUNE = tf.data.experimental.AUTOTUNE
num_epochs = 10
batch_size = 32
learning_rate = 0.001
#设置数据集位置
data_dir = os.getcwd() + os.sep + 'minidata/minidata'
train_cats_dir = data_dir + '/train/cats'
train_dogs_dir = data_dir + '/train/dogs'
#借助文件名获取指定的图片,还要同时给出对应的标签信息
def get_image_by_filename(filename,label):
image_data = tf.io.read_file(filename)
image_jpg = tf.image.decode_jpeg(image_data)
image_resized = tf.image.resize(image_jpg, [256,256])
image_scale = image_resized/255.0
return image_scale, label
if __name__ == '__main__':
tf_train_cats_filenames = tf.constant([train_cats_dir + '/' + filename for filename in os.listdir(train_cats_dir)])
tf_train_dogs_filenames = tf.constant([train_dogs_dir + '/' + filename for filename in os.listdir(train_dogs_dir)])
#拼接
tf_train_feature_filenames = tf.concat([tf_train_cats_filenames,tf_train_dogs_filenames],axis = -1)
tf_cats_labels = tf.zeros(tf_train_cats_filenames.shape,dtype = tf.int32)
tf_dogs_labels = tf.ones(tf_train_dogs_filenames.shape,dtype = tf.int32)
tf_train_labels = tf.concat([tf_cats_labels,tf_dogs_labels],axis = -1)
train_dataset = tf.data.Dataset.from_tensor_slices((tf_train_feature_filenames,tf_train_labels))
#map
train_dataset = train_dataset.map(map_func=get_image_by_filename, num_parallel_calls=AUTOTUNE)
for f,l in train_dataset:
print(f.numpy(), l.numpy())