python-keras图像多标签分类模型训练

AXingSong

已于 2022-10-10 15:32:28 修改

阅读量1.6k

点赞数

文章标签：深度学习 tensorflow 人工智能 keras

于 2022-10-09 15:57:50 首次发布

本文链接：https://blog.csdn.net/AXingSong/article/details/127222482

版权

CSDN话题挑战赛第2期
参赛话题：学习笔记

最近在学习给图像打标签训练，记录一下自己整个过程。

在 Python 中可以使用 TensorFlow 自带的 Keras 库进行模型训练

数据集可以是自己采集也可以下载网络上的数据集

1.将image和其对应的labels进行处理，写入excel表

2.获取所有图像进行读取，裁剪，转化为数组

# image_list: the images to load (each entry is passed to cv2.imread)
# data: list that collects the image arrays
# labels: list that collects the label list of each image
# NOTE(review): `writh` looks like a misspelling of `width`; the name is kept
# as-is because it is defined outside this snippet -- confirm and rename there.
for imagePath in image_list:
	image = cv2.imread(imagePath)
	# cv2.imread returns None instead of raising when the file cannot be
	# read, so fail here with the offending path rather than inside resize.
	if image is None:
		raise ValueError(f"could not read image: {imagePath}")
	image = cv2.resize(image, (writh, height))
	image = img_to_array(image)
	data.append(image)
	# image_dict maps an image path to a comma-separated label string.
	label = image_dict[imagePath].split(',')
	labels.append(label)

3.将data和labels列表转为数组

# Convert the image list to a float array and divide by 255
# (presumably 8-bit pixel data, which this maps into [0, 1] -- confirm).
data = np.array(data, dtype="float") / 255.0
# Images may carry different numbers of labels, so the label lists can be
# ragged. Without dtype=object recent NumPy versions refuse to build an array
# from ragged nested lists; an object array keeps one label list per image.
labels = np.array(labels, dtype=object)

4.对labels进行多标签二值化（multi-hot）编码

# Learn the set of distinct labels first, then encode every sample as a
# binary indicator row with one column per learned label.
mlb = MultiLabelBinarizer()
mlb.fit(labels)
labels = mlb.transform(labels)

5.随机划分训练集和测试集

# Hold out 20% of the samples for testing; the fixed random_state makes the
# split reproducible between runs.
trainX, testX, trainY, testY = train_test_split(
	data,
	labels,
	test_size=0.2,
	random_state=42,
)

6.构建多标签分类网络SmallerVGGNet，并编译、训练、保存模型

# Build the network with one output unit per label and a sigmoid final
# activation, paired with binary cross-entropy as the loss.
model = SmallerVGGNet.build(
	width=IMAGE_DIMS[1],
	height=IMAGE_DIMS[0],
	depth=IMAGE_DIMS[2],
	classes=len(mlb.classes_),
	finalAct="sigmoid",
)
model.compile(loss="binary_crossentropy", optimizer=opt, metrics=["accuracy"])

# Model.fit accepts generators directly; Model.fit_generator is deprecated
# and no longer available in newer Keras releases.
H = model.fit(
	aug.flow(trainX, trainY, batch_size=BS),
	validation_data=(testX, testY),
	steps_per_epoch=len(trainX) // BS,
	epochs=EPOCHS,
	verbose=1,
)

# Save the trained model to the path given by args["model"].
model.save(args["model"])

以上就是整体流程

smallervggnet.py文件

# import the necessary packages
from keras.models import Sequential
from keras.layers.normalization.batch_normalization_v1 import BatchNormalization
from keras.layers.convolutional import Conv2D
from keras.layers.convolutional import MaxPooling2D
from keras.layers.core import Activation
from keras.layers.core import Flatten
from keras.layers.core import Dropout
from keras.layers.core import Dense
from keras import backend as K

class SmallerVGGNet:
	"""Factory for a small VGG-style convolutional classifier."""

	@staticmethod
	def build(width, height, depth, classes, finalAct="softmax"):
		"""Assemble and return the (uncompiled) Sequential network.

		Args:
			width: input image width.
			height: input image height.
			depth: number of input channels.
			classes: number of units in the final Dense layer.
			finalAct: name of the activation applied after the final Dense
				layer; defaults to "softmax".

		Returns:
			The constructed Sequential model. It is not compiled here.
		"""
		net = Sequential()

		# Pick the input layout and the batch-norm axis from the backend's
		# image data format ("channels last" unless it reports otherwise).
		if K.image_data_format() == "channels_first":
			input_dims, bn_axis = (depth, height, width), 1
		else:
			input_dims, bn_axis = (height, width, depth), -1

		def conv_relu_bn(filters, **conv_kwargs):
			# CONV => RELU => BN; a generator, so each layer is only
			# created at the moment the consumer asks for it.
			yield Conv2D(filters, (3, 3), padding="same", **conv_kwargs)
			yield Activation("relu")
			yield BatchNormalization(axis=bn_axis)

		def layers():
			# CONV => RELU => POOL
			yield from conv_relu_bn(32, input_shape=input_dims)
			yield MaxPooling2D(pool_size=(3, 3))
			yield Dropout(0.25)

			# two stages of (CONV => RELU) * 2 => POOL, with 64 then 128 filters
			for filters in (64, 128):
				yield from conv_relu_bn(filters)
				yield from conv_relu_bn(filters)
				yield MaxPooling2D(pool_size=(2, 2))
				yield Dropout(0.25)

			# single fully connected FC => RELU stage
			yield Flatten()
			yield Dense(1024)
			yield Activation("relu")
			yield BatchNormalization()
			yield Dropout(0.5)

			# classifier head: activation is whatever finalAct names
			yield Dense(classes)
			yield Activation(finalAct)

		# Add each layer as soon as it is created, in the order listed above.
		for layer in layers():
			net.add(layer)

		return net

需要导入的包（除下面列出的之外，上面的代码还用到了 cv2 和 numpy，需要另外 import cv2、import numpy as np）

from keras.preprocessing.image import ImageDataGenerator
from keras.optimizers import adam_v2
from keras.preprocessing.image import img_to_array
from sklearn.preprocessing import MultiLabelBinarizer
from sklearn.model_selection import train_test_split
from pyimagesearch.smallervggnet import SmallerVGGNet
import matplotlib.pyplot as plt

文章参考：GitHub - MichaelCai311/keras-multi-label: Multi-label classification with Keras