from sklearn import datasets#自带的数据集
from sklearn.model_selection import train_test_split,cross_val_score
from sklearn.neighbors import KNeighborsClassifier
import matplotlib.pyplot as plt
# Choose K for a k-nearest-neighbours classifier on the iris dataset by
# comparing the mean cross-validated accuracy of each candidate K.

iris = datasets.load_iris()  # load the iris dataset bundled with scikit-learn
X = iris.data  # feature matrix
y = iris.target  # labels corresponding to the rows of X

# Hold out one third of the samples as a test set; the fixed random_state
# makes the split reproducible. Only the training part is used below.
train_X, test_X, train_y, test_y = train_test_split(
    X, y, test_size=1/3, random_state=3
)

k_range = range(1, 31)  # candidate values of K: 1..30
cv_scores = []  # mean cross-validation accuracy for each K, in k_range order

for n in k_range:
    # KNN model with n neighbours. Looping works here because there is a
    # single hyperparameter; with several hyperparameters, GridSearchCV
    # should be used instead.
    knn = KNeighborsClassifier(n_neighbors=n)
    # cv: number of folds; scoring='accuracy': the evaluation metric is
    # accuracy (may be omitted to use the default).
    scores = cross_val_score(knn, train_X, train_y, cv=10, scoring='accuracy')
    cv_scores.append(scores.mean())

# Plot mean accuracy against K so the best-performing K can be read off.
plt.plot(k_range, cv_scores)
plt.xlabel('K')
plt.ylabel('Accuracy')
plt.show()