# Comparison of common scikit-learn classifiers (original page title: python 分类器有哪些_sklearn常见分类器的效果比较-CSDN博客)

import matplotlib.pyplot as plt
import numpy as np
from matplotlib.colors import ListedColormap
from sklearn.datasets import make_circles, make_classification, make_moons
from sklearn.discriminant_analysis import QuadraticDiscriminantAnalysis
from sklearn.ensemble import AdaBoostClassifier, RandomForestClassifier
from sklearn.naive_bayes import GaussianNB
from sklearn.neighbors import KNeighborsClassifier
from sklearn.neural_network import BernoulliRBM
from sklearn.preprocessing import StandardScaler
from sklearn.svm import SVC
from sklearn.tree import DecisionTreeClassifier

# `train_test_split` lives in `sklearn.model_selection` since scikit-learn
# 0.18; `sklearn.cross_validation` is the legacy location (removed in 0.20).
try:
    from sklearn.model_selection import train_test_split
except ImportError:
    from sklearn.cross_validation import train_test_split

# `GaussianProcess` was removed in scikit-learn 0.20. It is only referenced by
# a disabled classifier entry, so a missing class must not break the script.
try:
    from sklearn.gaussian_process import GaussianProcess
except ImportError:
    GaussianProcess = None

# Step size of the mesh grid.
h = 0.02

# Display labels for the classifiers being compared.
names = [
    "Nearest Neighbors",
    "Linear SVM",
    "RBF SVM",
    "Decision Tree",
    "Random Forest",
    "AdaBoost",
    "Naive Bayes",
    "QDA",
    "Gaussian Process",
    "Neural Net",
]

# Estimator instances to compare, in the same order as the labels in `names`.
# NOTE(review): `names` holds ten labels but only eight estimators are active
# here; the original listing had `GaussianProcess()` and `BernoulliRBM()`
# commented out, so the last two labels have no matching estimator.
classifiers = [
    KNeighborsClassifier(n_neighbors=3),
    SVC(C=0.025, kernel="linear"),
    SVC(C=1, gamma=2),
    DecisionTreeClassifier(max_depth=5),
    RandomForestClassifier(n_estimators=10, max_depth=5, max_features=1),
    AdaBoostClassifier(),
    GaussianNB(),
    QuadraticDiscriminantAnalysis(),
]

# Build a two-feature classification problem, then shift every sample by
# uniform noise drawn from a separately seeded generator.
X, y = make_classification(
    n_features=2,
    n_informative=2,
    n_redundant=0,
    n_clusters_per_class=1,
    random_state=1,
)
rng = np.random.RandomState(2)
X += 2 * rng.uniform(size=X.shape)
linearly_separable = (X, y)

# The three (features, labels) pairs every classifier is evaluated on.
datasets = [
    make_moons(noise=0.3, random_state=0),
    make_circles(noise=0.2, factor=0.5, random_state=1),
    linearly_separable,
]

figure = plt.figure(figsize=(27, 9))

# Running 1-based subplot index; advanced once per panel drawn.
i = 1

# Iterate over datasets: one subplot row per dataset.
for ds_cnt, ds in enumerate(datasets):
    # Preprocess the dataset and split it into training and test parts.
    X, y = ds
    X = StandardScaler().fit_transform(X)
    X_train, X_test, y_train, y_test = train_test_split(
        X, y, test_size=0.4, random_state=42
    )

    # Mesh over the feature plane, padded by 0.5 on every side and sampled
    # with step `h`.
    x_min, x_max = X[:, 0].min() - 0.5, X[:, 0].max() + 0.5
    y_min, y_max = X[:, 1].min() - 0.5, X[:, 1].max() + 0.5
    xx, yy = np.meshgrid(
        np.arange(x_min, x_max, h),
        np.arange(y_min, y_max, h),
    )

    # Just plot the dataset first.
    cm = plt.cm.RdBu
    cm_bright = ListedColormap(['#FF0000', '#0000FF'])
    # Each row reserves one leading column for the raw data, hence the
    # `len(classifiers) + 1` columns.
    ax = plt.subplot(len(datasets), len(classifiers) + 1, i)
    if ds_cnt == 0:
        # Only the first row carries the column title.
        ax.set_title("Input data")
    # Plot the training points ...
    ax.scatter(X_train[:, 0], X_train[:, 1], c=y_train, cmap=cm_bright)
    # ... and the testing points, drawn semi-transparent.
    ax.scatter(X_test[:, 0], X_test[:, 1], c=y_test, cmap=cm_bright, alpha=0.6)
    ax.set_xlim(xx.min(), xx.max())
    ax.set_ylim(yy.min(), yy.max())
    # Hide the tick marks on both axes.
    ax.set_xticks(())
    ax.set_yticks(())
    i += 1