https://www.cnblogs.com/wkslearner/p/9302044.html
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.neighbors import KNeighborsClassifier
#超参数网格搜索
from sklearn.model_selection import GridSearchCV
def knn_iris():
#1.获取数据集
iris = load_iris()
#print(iris)
#2.划分数据集
x_train,x_test,y_train,y_test = train_test_split(iris.data,iris.target,random_state=6)
#3.特征工程:标准化
transfor = StandardScaler()
x_train = transfor.fit_transform(x_train)
x_test = transfor.transform(x_test)
#KNN算法预估器
estimator = KNeighborsClassifier(n_neighbors=3)
estimator.fit(x_train,y_train)
#5.模型评估
#方法1:直接比对真实值和预估值
y_predict = estimator.predict(x_test)
print("y_predict:\n",y_predict)
print("直接对比真实值和预测值:\n",y_test == y_predict)
#方法2:计算准确率
score = estimator.score(x_test,y_test)
print("准确率为:\n",score)
return None
def knn_iris_gsch():
#1.获取数据集
iris = load_iris()
#print(iris)
#2.划分数据集
x_train,x_test,y_train,y_test = train_test_split(iris.data,iris.target,random_state=6)
#3.特征工程:标准化
transfor = StandardScaler()
x_train = transfor.fit_transform(x_train)
x_test = transfor.transform(x_test)
#KNN算法预估器
estimator = KNeighborsClassifier()
##超参数网格搜索
#参数准备
#para_dict = {'param_grid ':[1,3,5,7]}
param_dict=[1,2,3]
estimator = GridSearchCV(estimator,param_grid=param_dict,cv=10)
estimator.fit(x_train,y_train)
#5.模型评估
#方法1:直接比对真实值和预估值
y_predict = estimator.predict(x_test)
print("y_predict:\n",y_predict)
print("直接对比真实值和预测值:\n",y_test == y_predict)
#方法2:计算准确率
score = estimator.score(x_test,y_test)
print("准确率为:\n",score)
#最佳参数best_params
print("最佳参数:\n",estimator.best_params_)
# 最佳结果best_score
print("最佳结果:\n", estimator.best_score_)
#最佳估计器best_estimator_
print("最佳估计器:\n",estimator.best_estimator_)
return None
if name == ‘main’:
#代码1,用KNN算法对鸢尾花进行分类
#knn_iris()
#代码2,用KNN算法超参数网格搜索对鸢尾花进行分类
knn_iris_gsch()