# 尝试用 toad 建评分卡 (Trying out toad to build a credit scorecard)
import pandas as pd
import numpy as np
import toad
from toad.plot import bin_plot
from toad.plot import badrate_plot
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LogisticRegression
from toad.metrics import KS, AUC, F1
from sklearn.metrics import roc_auc_score,roc_curve,auc
from toad.scorecard import ScoreCard
from matplotlib import pyplot as plt
# 1. 导入数据, 观察好坏比 (Load the data and inspect the good/bad ratio)
# Load the raw sample from the Excel workbook (path is relative to the
# current working directory).
data = pd.read_excel(r'l.xlsx')
print('Shape:', data.shape)

# Report the class balance. `is_bad` is summed to get the bad count, so it is
# presumably a 0/1 flag -- TODO confirm against the data dictionary.
# The good count uses a boolean mask instead of `value_counts()[0]`: the
# latter is a label lookup that raises KeyError when no row is labelled 0.
print('bad:', data['is_bad'].sum(), 'good:', (data['is_bad'] == 0).sum())
# 2. 数据 EDA (Exploratory data analysis)
# Run toad's detect() over the full frame (original note: "data analysis").
# This happens before any rows are dropped; the result is kept in `info`.
info = toad.detect(data)

# Missing-value handling: drop, in place, every row that contains at least
# one missing value.
data.dropna(axis=0, how='any', inplace=True)

# Columns to be cast to string dtype -- presumably so that later steps treat
# them as categorical rather than numeric; TODO confirm.
# The names `t` and `i` are kept as-is in case later code refers to them.
t = [
    'MD002', 'MD001', 'MD004', 'Z0009',
    'BLK01', 'BLK02', 'BLK03', 'BLK04', 'BLK05',
]
for i in t:
    # The loop body must be indented; without it the script fails to parse.
    data[i] = data[i].astype('str', copy=False)
# 3. 划分数据集 (Split the dataset)
data = data.iloc[:,1:] # keep all rows, drop the first column by position (the ID column, per the original note)
data_train,data_test = train_test_split(data,test_size=0.2