前言
做图像分类标注时，可以先人工标注一部分数据，然后计算这些图像的特征信息（参见《【代码篇】图像预处理阶段：提取图像特征》），再利用这些特征信息及分类标签训练一个决策树模型，最后用该决策树模型对剩余的数据进行分类，从而减少人工标注的工作量。
训练决策树模型
import os
import pandas as pd
from sklearn import tree
import graphviz
import matplotlib.pyplot as plt
from sklearn.tree import DecisionTreeClassifier
from sklearn.externals import joblib
import utils
# Root directory path used by the script (presumably where the images
# live -- confirm against the rest of the file).
root_dir = "../Image-Downloader-master/download_images/gan/emoji_combine"

# Spreadsheet loaded into a DataFrame; its first column is used as the index.
excel_path = "img_combine_info_type.xls"
data = pd.read_excel(excel_path, index_col=0)

# Names iterated by the `for column in columns` loop that follows.
columns = ["size", "area", "gradient", "si", "niqe", "colorful"]

# Maps each type label to a colour name.
color = dict(lr="red", hr="blue", other="yellow")
for column in columns:
for type_now in color.k