# Iris数据集包含鸢尾花三个亚属(山鸢尾、变色鸢尾、维吉尼亚鸢尾)的分类信息。本例通过机器学习算法训练一个模型,将新数据自动分类到这三个亚属中的某一个。
#导入类库
import pandas as pd
from pandas.plotting import scatter_matrix
from sklearn import datasets
from sklearn.model_selection import KFold,train_test_split,cross_val_score
from sklearn.metrics import accuracy_score,confusion_matrix,classification_report
from sklearn.linear_model import LogisticRegression
from sklearn.discriminant_analysis import LinearDiscriminantAnalysis
from sklearn.neighbors import KNeighborsClassifier
from sklearn.tree import DecisionTreeClassifier
from sklearn.naive_bayes import GaussianNB
from sklearn.svm import SVC
# Load the Iris dataset bundled with scikit-learn and wrap it in pandas objects.
iris = datasets.load_iris()
# Feature table: one column per entry in the dataset's feature_names.
X = pd.DataFrame(data=iris.data, columns=iris.feature_names)
# Target labels as a single Series named 'class'.
Y = pd.Series(iris.target, name='class')

# Split off a validation set: 20% of the rows are held out, the rest is used
# for training. No random_state is passed, so the shuffle differs between runs.
validation_size = 0.2
X_train, X_validation, Y_train, Y_validation = train_test_split(
    X,
    Y,
    test_size=validation_size,
    shuffle=True,
)
#创建模型
model