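# The code comes from instructor Zou Bo's teaching courseware, with some of my own understanding and comments added.
# Comparing the model built with a pipeline against the random forest model shows that the latter predicts more accurately.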
#!/usr/bin/python
# -*- coding:utf-8 -*-
import numpy as np
import matplotlib as mpl
import matplotlib.pyplot as plt
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import ElasticNetCV
import sklearn.datasets
from pprint import pprint
from sklearn.preprocessing import PolynomialFeatures, StandardScaler
from sklearn.pipeline import Pipeline
from sklearn.metrics import mean_squared_error
from sklearn.ensemble import RandomForestRegressor
import warnings
def not_empty(s):
    """Tell whether ``s`` differs from the empty string.

    Args:
        s: Value to test; it is compared against ``''`` using ``!=``.

    Returns:
        The result of ``s != ''``: ``False`` for the empty string and
        ``True`` for any non-empty string.
    """
    # NOTE(review): presumably used as a filter predicate to drop empty
    # tokens when parsing the data file -- confirm against the caller.
    return s != ''
if __name__ == "__main__":
warnings.filterwarnings(action='ignore') #忽略警告信息
np.set_printoptio