# 数据集包含0到9共十个数字,每个数字有500张图片。datanumber文件夹下有10个子文件夹,分别对应数字0到9,每个子文件夹中存放对应数字的500张图片。
import numpy as np
from sklearn.neighbors import KNeighborsClassifier
# 读取图片
import matplotlib.image as mpimg
# 显示图片
import matplotlib.pyplot as plt
from matplotlib.colors import ListedColormap
import pandas as pd
# Root folder of the dataset; images live at <path>\<digit>\<digit>_<index>.bmp.
path = r"E:\study\data\datanumber"

# Digits to load. The previous loop used range(1, 9), which stops at 8 and
# silently dropped digit 9 even though the stated intent is to load 1 to 9.
# NOTE(review): digit 0 is still excluded, as in the original loop -- switch
# to range(10) if the folder for 0 should be loaded as well.
DIGITS = range(1, 10)

# Each digit folder holds images indexed 1..IMAGES_PER_DIGIT.
IMAGES_PER_DIGIT = 500

# Image indices strictly below the cutoff (1..479) are used for training;
# the remaining indices (480..500) are held out for testing.
TRAIN_CUTOFF = 480

X_train = []
Y_train = []
X_test = []
Y_test = []

for i in DIGITS:
    for j in range(1, IMAGES_PER_DIGIT + 1):
        # Read the bitmap once and flatten it into a 1-D feature vector.
        pixels = mpimg.imread(path + "\\%d\\%d_%d.bmp" % (i, i, j)).reshape(-1)
        if j < TRAIN_CUTOFF:
            X_train.append(pixels)
            Y_train.append(i)
        else:
            X_test.append(pixels)
            Y_test.append(i)

# Convert the accumulated Python lists into numpy arrays.
X_train = np.array(X_train)
Y_train = np.array(Y_train)
X_test = np.array(X_test)
Y_test = np.array(Y_test)