第1关:GBDT

from sklearn.ensemble import GradientBoostingClassifier
from sklearn.linear_model import SGDRegressor
from sklearn.pipeline import make_pipeline
from sklearn.preprocessing import StandardScaler
from xgboost import XGBClassifier
from xgboost import XGBRegressor
from sklearn.metrics import accuracy_score
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error
import xgboost as xgb

def gbc_t():
    """Fit a gradient-boosting classifier on the iris CSV and score it.

    The CSV at the fixed workspace path is loaded; the columns at
    positions 1-3 are used as features and the column at position 4 as
    the label. Rows are split 80/20 with a fixed seed before fitting.

    Returns:
        A ``(train_accuracy, test_accuracy)`` tuple.
    """
    frame = pd.read_csv("/data/workspace/myshixun/home/iris_train.csv")
    # NOTE(review): position 0 is skipped -- presumably an id/index column;
    # confirm against the CSV.
    features, labels = frame.iloc[:, 1:4], frame.iloc[:, 4]
    X_train, X_test, y_train, y_test = train_test_split(
        features, labels, test_size=0.2, random_state=0
    )

    # Classification model: 100 estimators, learning rate 1.0,
    # max depth 1, random seed 0.
    model = GradientBoostingClassifier(
        n_estimators=100, learning_rate=1.0, max_depth=1, random_state=0
    )
    model.fit(X_train, y_train)

    train_accuracy = accuracy_score(y_train, model.predict(X_train))
    test_accuracy = accuracy_score(y_test, model.predict(X_test))
    return train_accuracy, test_accuracy

def make_p():
    """Fit a StandardScaler + SGDRegressor pipeline and return validation MSE.

    Loads ``train.csv`` from the fixed workspace path, drops the
    ``Name``, ``Sex``, ``Ticket``, ``Embarked`` and ``Cabin`` columns and
    replaces missing ``Age`` values with 0. Of the remaining columns, the
    first six are the features and the seventh is the regression target.

    NOTE(review): with the usual Titanic column order this would make
    ``Fare`` the target and leave ``PassengerId``/``Survived`` among the
    features -- confirm against the actual file.

    Returns:
        Mean squared error of the pipeline on the 20% validation split.
        ``SGDRegressor`` is built without a ``random_state``, so the value
        is not pinned to a seed.
    """
    frame = pd.read_csv('/data/workspace/myshixun/home/train.csv')
    frame.drop(columns=['Name', 'Sex', 'Ticket', 'Embarked', 'Cabin'], inplace=True)
    frame['Age'] = frame['Age'].fillna(0)

    # Cast to float before splitting so both splits share one dtype.
    features = frame.iloc[:, 0:6].astype(float)
    target = frame.iloc[:, 6].astype(float)
    X_train, X_val, y_train, y_val = train_test_split(
        features, target, test_size=0.2, random_state=42
    )

    # Regression pipeline; both steps use their default parameters.
    pipeline = make_pipeline(StandardScaler(), SGDRegressor())
    pipeline.fit(X_train, y_train)
    predictions = pipeline.predict(X_val)
    return mean_squared_error(y_val, predictions)

def XGB_t():
    """Fit a default ``XGBClassifier`` on the iris CSV and score it.

    Uses the columns at positions 1-3 of the CSV as features and the
    column at position 4 as the label, with an 80/20 split (seed 0).

    Returns:
        A ``(train_accuracy, test_accuracy)`` tuple.
    """
    frame = pd.read_csv("/data/workspace/myshixun/home/iris_train.csv")
    features = frame.iloc[:, 1:4]
    labels = frame.iloc[:, 4]
    X_train, X_test, y_train, y_test = train_test_split(
        features, labels, test_size=0.2, random_state=0
    )

    # XGBoost classifier with all-default hyperparameters.
    model = XGBClassifier()
    model.fit(X_train, y_train)

    # Score the training split first, then the held-out split.
    scores = [
        accuracy_score(truth, model.predict(inputs))
        for inputs, truth in ((X_train, y_train), (X_test, y_test))
    ]
    return scores[0], scores[1]

def xbg_r():
    """Fit an ``XGBRegressor`` on ``train.csv`` and return validation MSE.

    Loads the CSV from the fixed workspace path, drops the ``Name``,
    ``Sex``, ``Ticket``, ``Embarked`` and ``Cabin`` columns and replaces
    missing ``Age`` values with 0. Of the remaining columns, the first six
    are the features and the seventh is the regression target.

    NOTE(review): with the usual Titanic column order this would make
    ``Fare`` the target -- confirm against the actual file.

    Returns:
        Mean squared error of the model on the 20% validation split
        (split seed 42).
    """
    train_csv = '/data/workspace/myshixun/home/train.csv'
    train_data = pd.read_csv(train_csv)

    train_data.drop(['Name', 'Sex', 'Ticket', 'Embarked', 'Cabin'], axis=1, inplace=True)
    train_data['Age'] = train_data['Age'].fillna(0)
    X = train_data.iloc[:, 0:6]
    y = train_data.iloc[:, 6]
    X_train, X_val, y_train, y_val = train_test_split(X, y, test_size=0.2, random_state=42)

    # 'reg:squarederror' is the current name of the squared-error objective.
    # The former spelling 'reg:linear' is deprecated: depending on the
    # installed XGBoost version it triggers a warning or is not accepted.
    reg = XGBRegressor(
        max_depth=5,
        learning_rate=0.1,
        n_estimators=160,
        objective='reg:squarederror',
    )
    reg.fit(X_train, y_train)
    y_val_pre = reg.predict(X_val)

    return mean_squared_error(y_val, y_val_pre)


  • 1
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 打赏
    打赏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包

打赏作者

YLTommi

你的鼓励将是我创作的最大动力

¥1 ¥2 ¥4 ¥6 ¥10 ¥20
扫码支付:¥1
获取中
扫码支付

您的余额不足,请更换扫码支付或充值

打赏作者

实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值