def datingClassTest():
    """Run a hold-out evaluation of the classifier on the dating data set.

    Loads 'datingTestSet2.txt' through file2matrix, normalizes the feature
    matrix with autoNorm, and treats the first 10% of the rows as test
    samples. Each test sample is classified by classify0 against the
    remaining rows; every prediction is printed next to the true label,
    followed by the overall error rate. Nothing is returned.
    """
    hoRatio = 0.10  # fraction of the data set held out for testing

    # Load the text file into a feature matrix plus a label sequence,
    # then normalize the features.
    rawFeatures, labels = file2matrix('datingTestSet2.txt')
    scaled, _ranges, _minVals = autoNorm(rawFeatures)

    rowCount = scaled.shape[0]          # total number of samples
    testCount = int(rowCount * hoRatio)  # number of held-out test samples

    # Rows after the held-out prefix form the reference (training) set.
    trainFeatures = scaled[testCount:rowCount, :]
    trainLabels = labels[testCount:rowCount]

    mistakes = 0.0  # number of misclassified test samples
    for idx in range(testCount):
        # The final argument 3 is presumably the neighbour count k of
        # classify0 -- confirm against its definition.
        predicted = classify0(scaled[idx, :], trainFeatures, trainLabels, 3)
        expected = labels[idx]
        print("the classifier came back with: %d, the real answer is: %d"
              % (predicted, expected))
        if predicted != expected:
            # Prediction disagrees with the stored label: count an error.
            mistakes += 1.0

    errorRate = mistakes / float(testCount)
    print("the total error rate is : %f" % errorRate)
the classifier came back with: 3, the real answer is: 3
the classifier came back with: 2, the real answer is: 2
the classifier came back with: 1, the real answer is: 1
the classifier came back with: 3, the real answer is: 1
the total error rate is : 0.050000