# Coarse sweep: try n_estimators = 50, 60, ..., 290 and record the mean
# 10-fold cross-validated accuracy of a random forest for each setting.
# NOTE(review): n_estimators_score is presumably a list created earlier in
# the file (not visible in this section) -- confirm it is empty at this point,
# otherwise the plot below will have mismatched x/y lengths.
n_estimators_grid = np.arange(50, 300, 10)
for n in n_estimators_grid:
    RF_clf = RandomForestClassifier(n_estimators=n)
    # scoring='accuracy' -> score each fold by classification accuracy
    cv_score = model_selection.cross_val_score(
        RF_clf, xtrain, ytrain, scoring='accuracy', cv=10
    )
    n_estimators_score.append(cv_score.mean())

# Plot mean cross-validated accuracy against the number of trees.
plt.figure()
plt.plot(n_estimators_grid, n_estimators_score)
plt.show()
输出
我们可以看到此时score在0.7825-0.801波动
在70左右取得较高的值
所以我们进一步让n_estimators从60取到80，看看具体哪一个值最好
这次我们直接用GridSearchCV
# Fine-grained search around the best region found by the coarse sweep:
# GridSearchCV fits a random forest for every candidate n_estimators using
# 5-fold cross-validation.
# NOTE(review): range(60, 80, 1) covers 60..79 -- the stop value 80 itself is
# excluded. Use range(60, 81) if 80 is meant to be a candidate.
param_grid = {'n_estimators': range(60, 80, 1)}
rfc1 = model_selection.GridSearchCV(
    RandomForestClassifier(), param_grid=param_grid, cv=5
)
rfc1.fit(xtrain, ytrain)
pri