from sklearn.datasets import load_boston
boston = load_boston()
from sklearn.cross_validation import train_test_split
import numpy as np;
X = boston.data
y = boston.target
X_train, X_test, y_train, y_test = train_test_split(X, y, random_state = 33, test_size = 0.25)
print 'The max target value is: ', np.max(boston.target)
print 'The min target value is: ', np.min(boston.target)
print 'The average terget value is: ', np.mean(boston.target)
from sklearn.preprocessing import StandardScaler
ss_X = StandardScaler()
ss_y = StandardScaler()
X_train = ss_X.fit_transform(X_train)
X_test = ss_X.transform(X_test)
y_train = ss_y.fit_transform(y_train)
y_test = ss_y.transform(y_test)
from sklearn.ensemble import RandomForestRegressor, ExtraTreesRegressor, GradientBoostingRegressor
rfr = RandomForestRegressor()
rfr.fit(X_test, y_test)
rfr_y_predict = rfr.predict(X_test)
etr
python实现集成回归算法,包括随机森林,极端随机森林,梯度boosting算法
最新推荐文章于 2024-08-22 09:38:43 发布
该博客通过Python展示了如何使用sklearn库实现集成学习中的随机森林、极端随机森林和梯度提升回归算法。首先,加载波士顿房价数据集,然后进行数据预处理,包括训练集和测试集划分以及标准化操作。接着分别训练三种回归模型,并计算它们的R-squared分数、均方误差和平均绝对误差,以评估模型性能。
摘要由CSDN通过智能技术生成