机器学习002:简单线性回归
1、导入需要的库
import numpy as py
import pandas as pd
import matplotlib.pyplot as plt
2、数据预处理
from sklearn.model_selection import train_test_split

# Load the CSV; column 0 is used as the single feature, column 1 as the target.
dataset = pd.read_csv('studentscores.csv')
X = dataset.iloc[:, :1].values  # column slice -> 2-D array (n_samples, 1)
Y = dataset.iloc[:, 1].values   # scalar column index -> 1-D array (n_samples,)

# Hold out 25% of the rows for testing; the fixed seed keeps the split reproducible.
X_train, X_test, Y_train, Y_test = train_test_split(
    X,
    Y,
    test_size=0.25,
    random_state=0,
)
3、模型训练
from sklearn.linear_model import LinearRegression

# fit() hands back the fitted estimator, so construction and training
# can be chained into a single assignment.
regressor = LinearRegression().fit(X_train, Y_train)
4、结果预测
# Predict the target values for the test features with the fitted model.
Y_pred = regressor.predict(X_test)
# A bare `Y_pred` expression is only echoed by an interactive shell/notebook;
# print it explicitly so the predictions are also shown when run as a script.
print(Y_pred)
5、可视化
5.1 训练集结果可视化
# Training set: red points are the observed samples, the blue line is the
# model's prediction for those same inputs.
train_fit = regressor.predict(X_train)
plt.scatter(X_train, Y_train, color='red')
plt.plot(X_train, train_fit, color='blue')
plt.show()
5.2 测试集结果可视化
# Test set: red points are the held-out samples, the blue line is the
# model's prediction for those same inputs.
test_fit = regressor.predict(X_test)
plt.scatter(X_test, Y_test, c='r')
plt.plot(X_test, test_fit, c='b')
plt.show()
5.3 查看系数
# Show the coefficient(s) learned by the fitted linear model.
coefficients = regressor.coef_
print('Coefficients: \n', coefficients)