基于XGBoost的数据回归预测

导入包

from sklearn.model_selection import train_test_split
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.model_selection import GridSearchCV #网格搜索
import matplotlib.pyplot as plt#可视化
from sklearn.model_selection import KFold
from sklearn.metrics import r2_score
from sklearn.metrics import mean_squared_error
from scipy.stats import gaussian_kde
import xgboost as xgb
from sklearn.metrics import mean_absolute_error
from sklearn.preprocessing import MinMaxScaler
import pickle

import warnings
warnings.filterwarnings("ignore")

 导入数据

dataset = pd.read_excel('../dataset.xlsx')
dataset = dataset.drop('Unnamed: 0',axis=1)
dataset = dataset.dropna(axis=0)

十折交叉验证

# 十折交叉验证封装方法
def kfold_val(dataset,n_estimators,max_depth,learning_rate,min_child_weight):
    kf = KFold(n_splits=10,shuffle=True,random_state=True)
    for train_i,test_i in kf.split(dataset):
        x_train = dataset.iloc[train_i,5:]
        y_train=dataset.iloc[train_i,4]
        x_test=dataset.iloc[test_i,5:]
        y_test = dataset.iloc[test_i,4]
        model=xgb.XGBRegressor(n_estimators=n_estimators,max_depth =max_depth,learning_rate=learning_rate,min_child_weight=min_child_weight)  
        model.fit(x_train,y_train)
        y_pred = model.predict(x_test)
        mse=mse + mean_squared_error(y_pred,y_test)
        r2 =r2 + r2_score(y_pred,y_test)
    r2 = r2/10
    rmse = np.sqrt(mse)
    print('r2',r2)
    print('rmse',rmse)
kfold_val(dataset,1600,10,0.1,14)

可以确定好大范围后进行网格调参,最后进行画图

网格调参代码

parameters = {'n_estimators':[......],
              'max_depth': [......],
              'learning_rate':[.......],
              'min_child_weight':[......]
             }
model = xgb.XGBRegressor()
gsearch = GridSearchCV(model, param_grid=parameters, cv=2)
gsearch = gsearch.fit(x_train,y_train)
print("Best score: %0.3f" % gsearch.best_score_)
print("Best parameters set:")
best_parameters = gsearch.best_estimator_.get_params()
for param_name in sorted(parameters.keys()):
    print("\t%s: %r" % (param_name, best_parameters[param_name]))

评论 1
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值