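# A packaged, reusable polynomial-regression helper.
# It can visualize the fitted curve together with the data.
# It reports r2 scores (the first is the training score, the second is the
# test score; the closer to 1, the better).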
from sklearn.preprocessing import PolynomialFeatures
from matplotlib import pyplot as plt
from sklearn.linear_model import LinearRegression
import numpy as np
from sklearn.metrics import r2_score
import pandas as pd
# degree is the order of the polynomial used for the feature expansion.
# The caller must prepare and pass in x_train, y_train, x_test and y_test.
def polydemo(degree, x_train, y_train, x_test, y_test, plot_range=(40, 90)):
    """Fit a polynomial regression, print its r2 scores and plot the fit.

    The inputs are reshaped into a single feature column, expanded with
    ``PolynomialFeatures(degree=degree)`` and fed to a ``LinearRegression``.
    The r2 score on the training data is printed first, then the r2 score
    on the test data (the closer to 1, the better). Finally the fitted
    curve is drawn over ``plot_range`` together with scatter plots of the
    training and test points.

    Args:
        degree: Order of the polynomial feature expansion.
        x_train: Training inputs; converted with ``np.array`` and reshaped
            to one column.
        y_train: Training targets, aligned with ``x_train``.
        x_test: Test inputs; converted and reshaped like ``x_train``.
        y_test: Test targets, aligned with ``x_test``.
        plot_range: ``(low, high)`` interval of x values over which the
            fitted curve is drawn. Defaults to ``(40, 90)``, the interval
            that used to be hard-coded.

    Returns:
        None. The scores are printed and the figure is shown with
        ``plt.show()``.
    """
    polyn = PolynomialFeatures(degree=degree)
    x_train = np.array(x_train).reshape(-1, 1)
    x_test = np.array(x_test).reshape(-1, 1)

    # Fit the feature expansion on the training data only; the test data
    # (and the plotting grid below) reuse that fitted transformer instead
    # of refitting it.
    x_n_train = polyn.fit_transform(x_train)
    x_n_test = polyn.transform(x_test)

    lr = LinearRegression()
    lr.fit(x_n_train, y_train)

    r2_n_train = r2_score(y_train, lr.predict(x_n_train))
    r2_n_test = r2_score(y_test, lr.predict(x_n_test))
    print('training r2:', r2_n_train)
    print('test r2:', r2_n_test)

    # Visualization: evaluate the model on an evenly spaced grid so the
    # fitted curve is drawn smoothly, independent of where the samples lie.
    low, high = plot_range
    x_range = np.linspace(low, high, 300).reshape(-1, 1)
    y_range_predict = lr.predict(polyn.transform(x_range))

    plt.figure(figsize=(5, 5))
    plt.plot(x_range, y_range_predict)
    plt.scatter(x_train, y_train)
    plt.scatter(x_test, y_test)
    plt.title('prediction data')
    plt.xlabel('temperature')
    plt.ylabel('rate')
    plt.show()
# Driver script: load the training and test splits from CSV, pull out the
# 'T' column as the input and the 'rate' column as the target, then fit and
# plot a 6th-order polynomial model.
data_train = pd.read_csv('T-R-train.csv')
x_train, y_train = data_train['T'], data_train['rate']

data_test = pd.read_csv('T-R-test.csv')
x_test, y_test = data_test['T'], data_test['rate']

polydemo(
    degree=6,
    x_train=x_train,
    y_train=y_train,
    x_test=x_test,
    y_test=y_test,
)