import numpy as np
import pandas as pd
path = "breast-cancer-wisconsin.data"
names = [
    'id',
    'Clump Thickness',
    'Uniformity of Cell Size',
    'Uniformity of Cell Shape',
    'Marginal Adhesion',
    'Single Epithelial Cell Size',
    'Bare Nuclei',
    'Bland Chromatin',
    'Normal Nucleoli',
    'Mitoses',
    'Class',
]
## Load the data
# '?' entries are parsed as NaN so they can be dropped later.
# header=None keeps the first line of the file as a data row. Reading with the
# default header and then overwriting `data.columns` (as was done before)
# consumed that first line as column labels and silently lost one sample.
# NOTE(review): assumes the file has no header row — confirm against the file.
data = pd.read_csv(path, header=None, names=names, na_values='?')
## Drop rows that contain missing values
data = data.dropna()
## Oversample to balance the classes
# Show the class distribution before oversampling.
print(data['Class'].value_counts())
# Duplicate every Class == 4 row except the last 35 and add the copies to the
# data set. The original row index is kept, so duplicated rows share labels.
appden_data = data[data['Class'] == 4][:-35]
# DataFrame.append was removed in pandas 2.0; pd.concat is the equivalent call.
data = pd.concat([data, appden_data])
## Split into features X and target Y
# NOTE(review): X keeps every column except 'Class', which includes 'id';
# confirm that the identifier is really meant to be used as a feature.
X = data.drop(columns=['Class'])
Y = data['Class']
## Standardise the features
from sklearn.preprocessing import StandardScaler
# Fit the scaler on X, then apply it; the fitted scaler stays in `ssCoder`.
ssCoder = StandardScaler()
ssCoder.fit(X)
X_ss = ssCoder.transform(X)
X = pd.DataFrame
LogisticRegression 预测分类
最新推荐文章于 2023-12-24 18:56:06 发布
本文探讨了如何在完成Logistic Regression训练后,将模型进行保存,并在后续使用中有效地加载,以便进行分类预测。内容涉及模型持久化的重要性和具体实现步骤。
摘要由CSDN通过智能技术生成