先使用随机逻辑回归模型筛选出得分较高的几个特征,再用这些特征训练逻辑回归模型,最后用训练好的模型预测未来贷款人的违约可能性。
数据:
待测数据:
测试代码:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.linear_model import LogisticRegression as LR
from sklearn.linear_model import RandomizedLogisticRegression as RLR
from sklearn.model_selection import train_test_split as tts
from pandas import DataFrame as df
def get_data(pathname='bankloan.xls'):
    """Load the loan data set stored at ``pathname``.

    The file is first read as an Excel workbook. If that read fails for any
    ordinary reason (wrong format, missing Excel engine, ...), the same path
    is read as CSV instead.

    Args:
        pathname: Path of the file to load. Defaults to ``'bankloan.xls'``.

    Returns:
        When the file is readable as Excel: a tuple ``(x, y)`` where ``x`` is
        the first eight columns and ``y`` is the ninth column (presumably the
        features and the label -- confirm against the data file).
        When the CSV fallback is used: the whole DataFrame, unsplit.

    Raises:
        IndexError: If the Excel sheet has fewer than nine columns.
        Exception: Whatever ``pd.read_csv`` raises when the fallback also
            fails (e.g. ``FileNotFoundError`` for a missing file).
    """
    # Only the Excel read is guarded: a failure while slicing columns is a
    # data problem and must not be mistaken for "this is not an Excel file".
    try:
        bank_data = pd.read_excel(pathname)
    except Exception:
        # ``except Exception`` rather than a bare ``except`` so that
        # KeyboardInterrupt / SystemExit still propagate to the caller.
        return pd.read_csv(pathname)

    x = bank_data.iloc[:, :8]
    y = bank_data.iloc[:, 8]
    return x, y
# 筛选特征值