待定:是否需要数据标准化、异常值处理、模型单一
#TODO:
(1)修改开题报告(1.14前完成)☑️
(2)将数据集完善为2010-2020期间(1.20前完成)☑️
(3)控制变量较少、单一控制变量实验
(4)稳健性检验
python文件:/实证/OLS_test.py
import numpy as np
import pandas as pd
import statsmodels.api as sm
from sklearn import preprocessing
dataset = pd.read_excel('2010_test.xlsx')
x = dataset.iloc[:,3:]
# x[np.isnan(x)]=0
# x[np.isinf(x)]=0
x_scaled = preprocessing.MinMaxScaler().fit_transform(x)
# print(x_scaled)
VC = dataset.iloc[:,3]
y_esg = dataset.iloc[:,2]
lm = sm.OLS(y_esg, VC)
# lm = sm.OLS(y_esg, x)
model = lm.fit()
print(model.summary())