import pandas as pd
from sklearn.preprocessing import OneHotEncoder
from sklearn.preprocessing import PolynomialFeatures
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.linear_model import Ridge
# Load the CSV; any '?' entry is read as a missing value (NaN).
path = "hour.csv"
data = pd.read_csv(path, na_values='?')

# Drop the columns that are not needed.
data.drop(["casual", "registered", "dteday"], axis=1, inplace=True)
data.head()  # preview of the first rows; the result is not stored

# Columns that get one-hot encoded: season, mnth, hr, weekday.
data_trans = data[["season", "mnth", "hr", "weekday"]]

# One-hot encode the selected columns.
# The encoder's `sparse=False` keyword was deprecated in scikit-learn 1.2 and
# removed in 1.4 (renamed to `sparse_output`). To stay compatible with both
# old and new releases, keep the default sparse result and densify it
# explicitly with `.toarray()`; the resulting dense array is the same.
hotCoder = OneHotEncoder(handle_unknown='ignore')
hot = hotCoder.fit_transform(data_trans).toarray()
data_trans_hot = pd.DataFrame(hot)

# Drop the original columns that have now been one-hot encoded.
data.drop(["season","mnth","hr","weekday"],axis
LinearRegression 预测
最新推荐文章于 2024-07-11 17:53:22 发布
本文深入探讨了线性回归模型在预测分析中的使用。通过解释线性回归的基本原理,包括最小二乘法和预测变量之间的关系,展示了如何构建和评估线性回归模型。此外,还讨论了线性回归在实际问题中解决预测挑战的有效性,并提供了一个实例来说明其在预测任务中的应用。
摘要由CSDN通过智能技术生成