# Fit a cubic polynomial regression of Salary on YearsExperience and plot
# the fitted curve on top of the raw data points.

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import sklearn.linear_model as lm
import sklearn.pipeline as pl  # data pipeline
import sklearn.preprocessing as sp  # data preprocessing

# The CSV must provide the 'YearsExperience' and 'Salary' columns read below.
data = pd.read_csv('../data_test/Salary_Data.csv')
x = data['YearsExperience']
y = data['Salary']

# The estimator is given a 2-D feature table, so wrap the single feature
# column in a DataFrame; the target stays a 1-D Series.
train_x = pd.DataFrame(x)
train_y = y

# Expand the feature into polynomial terms up to degree 3, then fit an
# ordinary least-squares linear model on the expanded features.
model = pl.make_pipeline(sp.PolynomialFeatures(3), lm.LinearRegression())
model.fit(train_x, train_y)
pred_y = model.predict(train_x)

plt.scatter(x, y, s=50, color='dodgerblue')

# Draw the fitted curve in ascending-x order. plt.plot connects points in the
# order given, so rows that are not sorted by x would otherwise produce a
# zigzag line instead of a smooth curve.
order = np.argsort(x.to_numpy())
plt.plot(x.iloc[order], pred_y[order], color='orangered')

# Exercise: hold out part of the data, evaluate the model on it, and find
# the best maximum polynomial degree.