算法篇
导包合集
**有监督学习算法**
朴素贝叶斯算法
伯努利朴素贝叶斯
from sklearn.naive_bayes import BernoulliNB
高斯朴素贝叶斯
from sklearn.naive_bayes import GaussianNB
from sklearn.datasets import make_blobs
# **datasets**:意为数据集,make_blobs:随机生成各向同性的高斯分布样本簇(常用于聚类/分类演示)
from sklearn.model_selection import train_test_split
# **model_selection**:意为模型选择, train_test_split:数据集拆分
多项式朴素贝叶斯
import joblib # 保存模型
import jieba # 结巴分词
from sklearn.naive_bayes import MultinomialNB
from sklearn.datasets import load_breast_cancer # 乳腺癌数据集(二分类)
from sklearn.feature_extraction.text import CountVectorizer # 词频向量化
from sklearn.feature_extraction.text import TfidfVectorizer # tfidf词频向量化
# **feature_extraction**:意为特征提取
逻辑回归算法
from sklearn.linear_model import LogisticRegression # 逻辑回归
from sklearn.preprocessing import StandardScaler # 标准差标准化
from sklearn.preprocessing import MaxAbsScaler # 最大绝对值标准化(按各特征的最大绝对值缩放到[-1, 1])
from sklearn.preprocessing import MinMaxScaler # 离差标准化
# **preprocessing**:意为数据预处理
KNN算法
from sklearn.neighbors import KNeighborsClassifier # knn分类算法
from sklearn.neighbors import KNeighborsRegressor # knn回归算法
from sklearn.model_selection import cross_val_score # 交叉验证得分
from sklearn.model_selection import GridSearchCV # 网格搜索
from sklearn.model_selection import LeaveOneOut # 留一法
决策树算法
from sklearn.tree import DecisionTreeClassifier # 分类树
from sklearn.tree import DecisionTreeRegressor # 回归树
from sklearn.tree import export_graphviz # 导出树
随机森林算法
from sklearn.ensemble import RandomForestClassifier # 随机森林分类树
from sklearn.ensemble import RandomForestRegressor # 随机森林回归树
xgboost算法
# 安装 pip install xgboost
from xgboost import XGBClassifier # xgboost分类树
from xgboost import XGBRegressor # xgboost回归树
from xgboost import plot_tree # 绘制树结构(xgboost自带的绘图函数)
from xgboost import to_graphviz # 导出dot文件
分类算法评估指标
from sklearn.metrics import confusion_matrix
# **metrics**:意为度量;confusion_matrix 返回混淆矩阵(二分类时包含 TN、FP、FN、TP 四个值),查全率和查准率需要根据这四个值自己计算
from sklearn.metrics import precision_score # 查准率/精准率
from sklearn.metrics import recall_score # 查全率/召回率
from sklearn.metrics import f1_score # f1-score
from sklearn.metrics import classification_report # 分类报告
from sklearn.metrics import plot_precision_recall_curve # PR曲线(scikit-learn 1.2 起已移除,新版本请改用 PrecisionRecallDisplay)
from sklearn.metrics import plot_roc_curve # ROC曲线(scikit-learn 1.2 起已移除,新版本请改用 RocCurveDisplay)
线性回归算法
from sklearn.linear_model import LinearRegression # 正规方程法
from sklearn.linear_model import SGDRegressor # 随机梯度下降法
**无监督学习算法**
K-means算法
from sklearn.cluster import KMeans
from sklearn.metrics import silhouette_score # 轮廓系数
如有不全,欢迎补充!!