代码
import numpy as np
from sklearn.model_selection import train_test_split
from numpy.linalg import inv
import matplotlib.pyplot as plt
# Load the numeric table from CSV; the first row is skipped as a header.
# NOTE(review): presumably an air-quality (AQI) dataset, judging by the file
# name only -- confirm against the data source.
data = np.loadtxt("D:/机器学习/data/aqi2.csv", delimiter=",", skiprows=1, dtype=float)

# Append a column of ones so that the last fitted weight acts as the intercept.
bias_column = np.ones((data.shape[0], 1))
data = np.hstack((data, bias_column))

# Column 0 is used as the regression target; every remaining column
# (including the appended bias column) is used as a feature.
y = data[:, 0]
x = data[:, 1:]

# Fixed random_state keeps the train/test split reproducible between runs.
X_train, X_test, y_train, y_test = train_test_split(
    x, y, test_size=0.33, random_state=42)

# Ordinary least squares fit. lstsq solves the same problem as the normal
# equations inv(X.T @ X) @ X.T @ y, but without forming an explicit inverse:
# it is better conditioned and still returns a (minimum-norm) solution when
# X.T @ X is singular, where inv() would raise LinAlgError.
weight, *_ = np.linalg.lstsq(X_train, y_train, rcond=None)
print(weight)

# Predict the held-out targets with the fitted weights.
y_predict = X_test @ weight

# Compare ground truth (red points) with predictions (black line),
# both plotted against the test-sample position.
sample_positions = range(len(y_test))
plt.scatter(sample_positions, y_test, c='red')
plt.plot(sample_positions, y_predict, c='black')
plt.show()
真实值与预测值图形的拟合结果: