1.导入模块
import numpy as np
import pandas as pd
from pandas import Series,DataFrame
import matplotlib.pyplot as plt
%matplotlib inline
# k-nearest neighbors classifier
from sklearn.neighbors import KNeighborsClassifier
# logistic regression classifier
from sklearn.linear_model import LogisticRegression
# decision tree classifier
from sklearn.tree import DecisionTreeClassifier
# naive Bayes with a Gaussian likelihood
from sklearn.naive_bayes import GaussianNB
# support vector machine classifier
from sklearn.svm import SVC
2.获取训练数据和预测数据
# Load the tab-separated seeds table. header=None makes pandas number the
# columns 0, 1, 2, ... instead of consuming the first row as column names.
data = pd.read_csv('../day13/data/seeds.csv', delimiter='\t', header=None)

# Columns 0-6 are used as features and column 7 as the class label.
features = data.iloc[:, :7]
labels = data.iloc[:, 7]

# Split by position: the first n_train rows train the models, the remaining
# rows are held out for scoring. Positional .iloc slices are half-open, so the
# two sets are disjoint; label-based .loc[:170] / .loc[170:] would include
# row 170 in BOTH sets and leak a training sample into the evaluation.
n_train = 170
X_train = features.iloc[:n_train]
Y_train = labels.iloc[:n_train]
x_test = features.iloc[n_train:]
y_true = labels.iloc[n_train:]
# NOTE(review): if the rows in the file are ordered by class label, a
# sequential split gives a test set that does not cover every class --
# confirm against the data and consider a shuffled/stratified split.
数据如下:
3.创建模型
# Build one unfitted estimator per algorithm being compared. Only the
# arguments shown are set explicitly; everything else keeps the library
# defaults.
knn, logistic, decision, gauss, svc = (
    KNeighborsClassifier(n_neighbors=3),
    LogisticRegression(),
    DecisionTreeClassifier(max_depth=5),
    GaussianNB(),
    SVC(kernel='rbf'),
)
4.训练数据
# Fit every estimator on the same training split, in the same order as they
# were created.
for estimator in (knn, logistic, decision, gauss, svc):
    estimator.fit(X_train, Y_train)
5.评分
# Score each fitted estimator on the held-out split and print the result.
# Bare `model.score(...)` expression statements discard their value when run
# as a script (and only the last one is echoed in a notebook cell), so the
# scores are printed explicitly with a label for side-by-side comparison.
for label, model in (
    ('knn', knn),
    ('logistic', logistic),
    ('decision', decision),
    ('gauss', gauss),
    ('svc', svc),
):
    print(f'{label}: {model.score(x_test, y_true):.4f}')