交叉验证及网格搜索
0. 加载相关模块
import numpy as np
import matplotlib.pyplot as plt
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
%matplotlib inline
1. 数据加载
# Load the iris dataset and separate the feature matrix from the class labels.
iris = load_iris()
X, y = iris.data, iris.target

# Hold out a quarter of the samples for testing; random_state is fixed so the
# split is the same on every run.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.25,
    random_state=0,
)

# Report the total, training and test sample counts.
print(
    '数据集样本数:{},训练集样本数:{},测试集样本数:{}'.format(
        len(X), len(X_train), len(X_test)
    )
)
数据集样本数:150,训练集样本数:112,测试集样本数:38
2. 交叉验证
from sklearn.neighbors import KNeighborsClassifier
from sklearn.model_selection import cross_val_score
k_range = [1, 5, 9, 15]
cv_scores = []
for k in k_range:
knn = KNeighborsClassifier(n_neighbors<