使用CNN训练人脸标签图片分类

最新推荐文章于 2024-06-03 13:31:43 发布

鸿运齐天蛊

最新推荐文章于 2024-06-03 13:31:43 发布

阅读量392

点赞数 18

文章标签： cnn 人工智能神经网络

本文链接：https://blog.csdn.net/jingshi123456/article/details/138705446

版权

数据集处理

1.新建一个文件夹

2.图片

把不同类型的图片放在对应的文件夹中，文件夹的命名就是图片的标签

1.导包

from tensorflow.keras.preprocessing.image import ImageDataGenerator
import pathlib
import matplotlib.pyplot as plt
import numpy as np
import tensorflow as tf
from tensorflow.keras import layers, models

2.定义超参数

# 定义超参数

#用于指定存储图像数据的位置
data_dir = "D:/lx/"
data_dir = pathlib.Path(data_dir)
image_count = len(list(data_dir.glob('*/*.jpg')))
print("图片总数为：", image_count)

#这是一个整数变量，表示在训练模型时每个批次的图像数量。批量大小是训练神经网络时一个重要的超参数，它影响了模型的收敛速度和稳定性。
batch_size = 32

#有的图像在训练之前将被统一调整为180x180像素的大小。
img_height = 180
img_width = 180

3.加载数据

# 使用image_dataset_from_directory()将数据加载到tf.data.Dataset中

#创建了一个训练数据集。函数的参数包括：
#data_dir：之前定义的图像数据目录路径。
#validation_split=0.2：指定从数据集中划分出20%作为验证集。
#subset="training"：指示这个数据集是用于训练的。
#seed=123：设置随机种子，以确保数据集划分的可重复性。
#image_size=(img_height, img_width)：指定图像的大小。
#batch_size=batch_size：指定每个批次的图像数量，这里使用之前定义的batch_size。

train_ds = tf.keras.preprocessing.image_dataset_from_directory(
    data_dir,
    validation_split=0.2,  # 验证集0.2
    subset="training",
    seed=123,
    image_size=(img_height, img_width),
    batch_size=batch_size)



#创建了一个验证数据集
val_ds = tf.keras.preprocessing.image_dataset_from_directory(
    data_dir,
    validation_split=0.2,
    subset="validation",
    seed=123,
    image_size=(img_height, img_width),
    batch_size=batch_size)

#从训练数据集中获取类别名称列表。这些类别名称是数据集中子目录的名称，每个子目录包含同一类别的图像。
class_names = train_ds.class_names

print(class_names)

4.可视化

plt.figure(figsize=(16, 8))
for images, labels in train_ds.take(1):
    for i in range(16):
        ax = plt.subplot(4, 4, i + 1)
        # plt.imshow(images[i], cmap=plt.cm.binary)
        plt.imshow(images[i].numpy().astype("uint8"))
        #为每个子图设置标题，标题是图像对应的类别名称。labels[i]是图像的标签（一个整数）
        plt.title(class_names[labels[i]])
        plt.axis("off")
plt.show()

5.构建图像增强生成器

# 再次检查数据
for image_batch, labels_batch in train_ds:
    print(image_batch.shape)
    print(labels_batch.shape)
    break

# 构建图像加强生成器
# -确保模型能很好地泛化，我建议您始终执行数据增强。
#它是一个图像数据增强工具。这个生成器可以随机变换图像，以增加训练数据的多样性，从而提高模型的泛化能力。
参数包括：
#Rotation_range=30：随机旋转图像的角度范围。
#width_shift_range=0.1：图像水平方向上随机平移的范围（相对于总宽度的比例）。
#height_shift_range=0.1：图像垂直方向上随机平移的范围（相对于总高度的比例）。
#shear_range=0.2：随机错切变换的范围。
#zoom_range=0.2：随机缩放图像的范围。
#horizontal_flip=True：随机水平翻转图像。
#fill_mode="nearest"：填充新创建像素的方法。
#x = aug.flow(image_batch, labels_batch)：使用aug生成器对第一个批次的图像和标签进行实时增强。flow()方法接受图像和标签，返回一个批量增强数据的Numpy数组。

aug = ImageDataGenerator(rotation_range=30, width_shift_range=0.1,
                         height_shift_range=0.1, shear_range=0.2, zoom_range=0.2,
                         horizontal_flip=True, fill_mode="nearest")
x = aug.flow(image_batch, labels_batch)

#这是一个TensorFlow推荐的用于优化数据管道的性能的参数。它可以自动调整内部缓冲区的大小，以最大化数据加载和处理的效率。
AUTOTUNE = tf.data.AUTOTUNE

6.缓存和优化数据集

# 将数据集缓存到内存中，加快速度
train_ds = train_ds.cache().shuffle(1000).prefetch(buffer_size=AUTOTUNE)
val_ds = val_ds.cache().prefetch(buffer_size=AUTOTUNE)

7.构建模型

# 为了增加模型的泛化能力，增加了Dropout层，并将最大池化层更新为平均池化层
num_classes = 3
model = models.Sequential([
    layers.experimental.preprocessing.Rescaling(1. / 255, input_shape=(img_height, img_width, 3)),
    layers.Conv2D(32, (3, 3), activation='relu'),
    layers.MaxPooling2D((2, 2)),
    layers.Conv2D(64, (3, 3), activation='relu'),
    layers.MaxPooling2D((2, 2)),
    layers.Conv2D(128, (3, 3), activation='relu'),
    layers.MaxPooling2D((2, 2)),
    layers.Conv2D(256, (3, 3), activation='relu'),
    layers.MaxPooling2D((2, 2)),
    layers.Flatten(),
    layers.Dense(512, activation='relu'),
    layers.Dense(num_classes)
])

8.编译训练模型

# 设置优化器
opt = tf.keras.optimizers.Adam(learning_rate=0.001)

model.compile(optimizer=opt,
              loss=tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True),
              metrics=['accuracy'])

EPOCHS = 100
BS = 5

# 训练网络
# model.fit 可同时处理训练和即时扩充的增强数据。
# 我们必须将训练数据作为第一个参数传递给生成器。生成器将根据我们先前进行的设置生成批量的增强训练数据。
for images_train, labels_train in train_ds:
    continue
for images_test, labels_test in val_ds:
    continue
history = model.fit(x=aug.flow(images_train,labels_train, batch_size=BS),
                    validation_data=(images_test, labels_test), steps_per_epoch=1,
                    epochs=EPOCHS)

9.评估模型

# 画出训练精确度和损失图
N = np.arange(0, EPOCHS)
plt.style.use("ggplot")
plt.figure()
plt.plot(N, history.history["loss"], label="train_loss")
plt.plot(N, history.history["val_loss"], label="val_loss")
plt.plot(N, history.history["accuracy"], label="train_acc")
plt.plot(N, history.history["val_accuracy"], label="val_acc")
plt.title("Aug Training Loss and Accuracy")
plt.xlabel("Epoch #")
plt.ylabel("Loss/Accuracy")
plt.legend(loc='upper right')  # legend显示位置
plt.show()

test_loss, test_acc = model.evaluate(val_ds, verbose=2)
print(test_loss, test_acc)

10.可视化结果

# 优化2 输出在验证集上的预测结果和真实值的对比
pre = model.predict(val_ds)
for images, labels in val_ds.take(1):
    for i in range(4):
        ax = plt.subplot(1, 4, i + 1)
        plt.imshow(images[i].numpy().astype("uint8"))
        plt.title(class_names[labels[i]])
        plt.xticks([])
        plt.yticks([])
        # plt.xlabel('pre: ' + class_names[np.argmax(pre[i])] + ' real: ' + class_names[labels[i]])
        plt.xlabel('pre: ' + class_names[np.argmax(pre[i])])
        print('pre: ' + str(class_names[np.argmax(pre[i])]) + ' real: ' + class_names[labels[i]])
plt.show()

print(labels_test)
print(labels)
print(pre)
print(class_names)

11.输出分类广告

from sklearn.metrics import classification_report
# 优化1 输出可视化报表
print(classification_report(labels_test,
                            pre.argmax(axis=1), target_names=class_names))

12.全部代码

from tensorflow.keras.preprocessing.image import ImageDataGenerator
import pathlib
import matplotlib.pyplot as plt
import numpy as np
import tensorflow as tf
from tensorflow.keras import layers, models

# 定义超参数
data_dir = "D:/lx/"
data_dir = pathlib.Path(data_dir)
image_count = len(list(data_dir.glob('*/*.jpg')))
print("图片总数为：", image_count)
batch_size = 32
img_height = 180
img_width = 180

# 使用image_dataset_from_directory()将数据加载到tf.data.Dataset中
train_ds = tf.keras.preprocessing.image_dataset_from_directory(
    data_dir,
    validation_split=0.2,  # 验证集0.2
    subset="training",
    seed=123,
    image_size=(img_height, img_width),
    batch_size=batch_size)

val_ds = tf.keras.preprocessing.image_dataset_from_directory(
    data_dir,
    validation_split=0.2,
    subset="validation",
    seed=123,
    image_size=(img_height, img_width),
    batch_size=batch_size)

class_names = train_ds.class_names
print(class_names)

# 可视化
plt.figure(figsize=(16, 8))
for images, labels in train_ds.take(1):
    for i in range(16):
        ax = plt.subplot(4, 4, i + 1)
        # plt.imshow(images[i], cmap=plt.cm.binary)
        plt.imshow(images[i].numpy().astype("uint8"))
        plt.title(class_names[labels[i]])
        plt.axis("off")
plt.show()

# 再次检查数据
for image_batch, labels_batch in train_ds:
    print(image_batch.shape)
    print(labels_batch.shape)
    break

# 构建图像加强生成器
# 图像增强使我们可以通过随机旋转，移动，剪切，缩放和翻转从现有的训练数据中构建“其他”训练数据。
# 数据扩充通常是以下关键步骤：
# -避免过度拟合
# -确保模型能很好地泛化  我建议您始终执行数据增强，除非您有明确的理由不这样做。
aug = ImageDataGenerator(rotation_range=30, width_shift_range=0.1,
                         height_shift_range=0.1, shear_range=0.2, zoom_range=0.2,
                         horizontal_flip=True, fill_mode="nearest")
x = aug.flow(image_batch, labels_batch)

AUTOTUNE = tf.data.AUTOTUNE

# 将数据集缓存到内存中，加快速度
train_ds = train_ds.cache().shuffle(1000).prefetch(buffer_size=AUTOTUNE)
val_ds = val_ds.cache().prefetch(buffer_size=AUTOTUNE)



# 为了增加模型的泛化能力，增加了Dropout层，并将最大池化层更新为平均池化层
num_classes = 3
model = models.Sequential([
    layers.experimental.preprocessing.Rescaling(1. / 255, input_shape=(img_height, img_width, 3)),
    layers.Conv2D(32, (3, 3), activation='relu'),
    layers.MaxPooling2D((2, 2)),
    layers.Conv2D(64, (3, 3), activation='relu'),
    layers.MaxPooling2D((2, 2)),
    layers.Conv2D(128, (3, 3), activation='relu'),
    layers.MaxPooling2D((2, 2)),
    layers.Conv2D(256, (3, 3), activation='relu'),
    layers.MaxPooling2D((2, 2)),
    layers.Flatten(),
    layers.Dense(512, activation='relu'),
    layers.Dense(num_classes)
])


model.summary()  # 打印网络结构

# 设置优化器
opt = tf.keras.optimizers.Adam(learning_rate=0.0001)

model.compile(optimizer=opt,
              loss=tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True),
              metrics=['accuracy'])

EPOCHS = 100
BS = 30

# 训练网络
# model.fit 可同时处理训练和即时扩充的增强数据。
# 我们必须将训练数据作为第一个参数传递给生成器。生成器将根据我们先前进行的设置生成批量的增强训练数据。
for images_train, labels_train in train_ds:
    continue
for images_test, labels_test in val_ds:
    continue
history = model.fit(x=aug.flow(images_train,labels_train, batch_size=BS),
                    validation_data=(images_test, labels_test), steps_per_epoch=1,
                    epochs=EPOCHS)

# 画出训练精确度和损失图
N = np.arange(0, EPOCHS)
plt.style.use("ggplot")
plt.figure()
plt.plot(N, history.history["loss"], label="train_loss")
plt.plot(N, history.history["val_loss"], label="val_loss")
plt.plot(N, history.history["accuracy"], label="train_acc")
plt.plot(N, history.history["val_accuracy"], label="val_acc")
plt.title("Aug Training Loss and Accuracy")
plt.xlabel("Epoch #")
plt.ylabel("Loss/Accuracy")
plt.legend(loc='upper right')  # legend显示位置
plt.show()

test_loss, test_acc = model.evaluate(val_ds, verbose=2)
print(test_loss, test_acc)

# 优化2 输出在验证集上的预测结果和真实值的对比
pre = model.predict(val_ds)
for images, labels in val_ds.take(1):
    for i in range(4):
        ax = plt.subplot(1, 4, i + 1)
        plt.imshow(images[i].numpy().astype("uint8"))
        plt.title(class_names[labels[i]])
        plt.xticks([])
        plt.yticks([])
        # plt.xlabel('pre: ' + class_names[np.argmax(pre[i])] + ' real: ' + class_names[labels[i]])
        plt.xlabel('pre: ' + class_names[np.argmax(pre[i])])
        print('pre: ' + str(class_names[np.argmax(pre[i])]) + ' real: ' + class_names[labels[i]])
plt.show()

print(labels_test)
print(labels)
print(pre)
print(class_names)
from sklearn.metrics import classification_report
# 优化1 输出可视化报表
print(classification_report(labels_test,
                            pre.argmax(axis=1), target_names=class_names))

代码实习效果：

图片标签展示

准确率和损失函数

预测和分类报告

鸿运齐天蛊

关注

18
点赞
踩
3

收藏

觉得还不错? 一键收藏
1
评论
使用CNN训练人脸标签图片分类

定义超参数#用于指定存储图像数据的位置print("图片总数为：", image_count)#这是一个整数变量，表示在训练模型时每个批次的图像数量。批量大小是训练神经网络时一个重要的超参数，它影响了模型的收敛速度和稳定性。#有的图像在训练之前将被统一调整为180x180像素的大小。
复制链接

扫一扫