原文地址:https://www.cnblogs.com/ningskyer/articles/7606174.html
画出数字
from sklearn.datasets import load_digits
digits=load_digits()
fig=plt.figure(figsize=(6,6))
fig.subplots_adjust(left=0,right=1,bottom=0,top=1,hspace=0.05,wspace=0.05)
#绘制数字:每张图像8*8像素点
for i in range(64):
ax=fig.add_subplot(8,8,i+1,xticks=[],yticks=[])
ax.imshow(digits.images[i],cmap=plt.cm.binary,interpolation='nearest')
#用目标值标记图像
ax.text(0,7,str(digits.target[i]))
plt.show()
使用logisticRegression识别手写数字,使用load_digits()
%%writefile d:/python/shou_xie_shi_bie_by_logisticRegression.py
from sklearn.linear_model import LogisticRegression
from sklearn import datasets
from sklearn.cross_validation import train_test_split
from sklearn.metrics import confusion_matrix,accuracy_score
import numpy as np
import scipy
import cv2
from fractions import Fraction
import matplotlib.pyplot as plt
#中文字体显示
plt.rc('font', family='SimHei', size=13)
def image2Digit(image):
# 调整为8*8大小
im_resized = scipy.misc.imresize(image, (8,8))
# RGB(三维)转为灰度图(一维)
im_gray = cv2.cvtColor(im_resized, cv2.COLOR_BGR2GRAY)
# 调整为0-16之间(digits训练数据的特征规格)像素值——16/255
im_hex = Fraction(16,255) * im_gray
# 将图片数据反相(digits训练数据的特征规格——黑底白字)
im_reverse = 16 - im_hex
return im_reverse.astype(np.int)
# 加载数字数据
digits = datasets.load_digits()
# 划分训练集与验证集
Xtrain, Xtest, ytrain, ytest = train_test_split(digits.data, digits.target, random_state=2)
# 创建模型
clf = LogisticRegression(penalty='l2')
# 拟合数据训练
clf.fit(Xtrain, ytrain)
# 预测验证集
ypred = clf.predict(Xtest)
# 计算准确度
accuracy = accuracy_score(ytest, ypred)
print '识别准确度:',accuracy
# 读取单张自定义手写数字的图片
image = scipy.misc.imread("d:/python/4.png")
# 将图片转为digits训练数据的规格——即数据的表征方式要统一
im_reverse = image2Digit(image)
# 显示图片转换后的像素值
print(im_reverse)
# 8*8转为1*64(预测方法的参数要求)
reshaped = im_reverse.reshape(1,64)
# 预测
result = clf.predict(reshaped)
print(result)
测试图片如下: