# The theory behind this script is already written up in my notes, so it is not retyped here.
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from itertools import islice
from sklearn import linear_model
#-----------------------------------#
def getdata(path="D:/python_text/data_sets.txt"):
    """Load (x, y) sample pairs from a whitespace-delimited text file.

    The first line of the file is treated as a header and skipped. On every
    remaining non-blank line, the first two whitespace-separated fields are
    parsed as floats: the first is the predictor, the second the response.

    Args:
        path: File to read. Defaults to the location this script originally
            hard-coded, so existing ``getdata()`` calls keep working.

    Returns:
        A ``(data_sets, response_sets)`` tuple. ``data_sets`` is a list of
        single-element lists (``[[x0], [x1], ...]``) and ``response_sets``
        is a flat list of floats, in file order.

    Raises:
        OSError: If the file cannot be opened.
        ValueError: If one of the first two fields is not a valid float.
        IndexError: If a non-blank line has fewer than two fields.
    """
    data_sets = []
    response_sets = []
    # The context manager closes the file even if parsing a line fails.
    with open(path, 'r') as handle:
        for line in islice(handle, 1, None):  # start at the second line (skip header)
            fields = line.split()
            if not fields:
                # Blank lines (e.g. a trailing newline at EOF) carry no sample.
                continue
            # For regression the x values must be a 2-D structure (one row per
            # sample), so each predictor is wrapped in its own list.
            data_sets.append([float(fields[0])])
            response_sets.append(float(fields[1]))
    return data_sets, response_sets
def linear_mode_main(x_P, y_P):
    """Fit a scikit-learn ``LinearRegression`` and return its parameters.

    Args:
        x_P: Predictor samples, passed straight to ``LinearRegression.fit``
            (presumably a 2-D list such as ``[[150.0], [200.0]]`` -- confirm
            against the caller).
        y_P: Response values, passed straight to ``LinearRegression.fit``.

    Returns:
        A dict with two entries: ``'intercept'`` holds the fitted model's
        ``intercept_`` and ``'coefficient'`` holds its ``coef_``.
    """
    # ``fit`` returns the estimator itself, so construction and fitting chain.
    fitted = linear_model.LinearRegression().fit(x_P, y_P)
    return {
        'intercept': fitted.intercept_,
        'coefficient': fitted.coef_,
    }
# Script body: load the samples, fit the regression, then report the fitted
# intercept and coefficient on stdout.
X, Y = getdata()
result = linear_mode_main(X, Y)
for _label, _key in (
    ("Intercept value ", 'intercept'),
    ("coefficient value ", 'coefficient'),
):
    print(_label, result[_key])