# 通过 KNN 算法对乳腺癌数据集进行分类
from sklearn.datasets import load_breast_cancer
from sklearn.model_selection import train_test_split, GridSearchCV
from sklearn.neighbors import KNeighborsClassifier
from sklearn.pipeline import Pipeline
from sklearn.preprocessing import StandardScaler
# Train and evaluate a K-nearest-neighbours classifier on scikit-learn's
# breast cancer dataset, choosing n_neighbors by 5-fold cross-validation.

# Load the dataset
breast_cancer = load_breast_cancer()

# Hold out 20% of the samples as the test set (fixed seed for reproducibility)
x_train, x_test, y_train, y_test = train_test_split(
    breast_cancer.data, breast_cancer.target, test_size=0.2, random_state=22
)

# Preprocessing and model are bundled into one pipeline so that, during
# cross-validation, the scaler is fitted on each training fold only.
# Fitting the scaler on the full training set beforehand would leak the
# validation folds' statistics into the model-selection scores.
# x_train / x_test therefore stay unscaled; the pipeline scales internally.
estimator = Pipeline([
    ('scaler', StandardScaler()),
    ('knn', KNeighborsClassifier()),
])

# Hyper-parameter search; the 'knn__' prefix routes the value to the KNN step
param_grid = {'knn__n_neighbors': [3, 5, 7]}
grid_search = GridSearchCV(estimator, param_grid=param_grid, cv=5)
grid_search.fit(x_train, y_train)

# The best pipeline has been refitted on the whole training set (refit=True
# is the GridSearchCV default); score it on the untouched test set.
best_estimator = grid_search.best_estimator_
acc = best_estimator.score(x_test, y_test)
print('测试集准确率: %.2f' % acc)
# 结果如下: