import re
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.ensemble import RandomForestRegressor
from sklearn.pipeline import make_pipeline
from sklearn.ensemble import RandomForestClassifier
from sklearn.feature_selection import SelectKBest
import warnings
warnings.filterwarnings('ignore')%matplotlib inline
import pandas as pd
# Examine the relationship between each of these features and survival.
# NOTE(review): `train` is not defined in this cell; it is assumed to be a
# pandas DataFrame holding these columns plus "Survived" -- confirm upstream.
features = ['Sex', 'Pclass', 'SibSp', 'Parch', 'Embarked']

# One subplot per feature, side by side; each panel is 6 x 6 inches.
fig, saxis = plt.subplots(1, len(features), figsize=(len(features) * 6, 6))

for ind, x in enumerate(features):
    print('Survival Correlation by:', x)
    # Mean of "Survived" within each distinct value of the current feature.
    print(train[[x, "Survived"]].groupby(x, as_index=False).mean())
    print('-' * 10, '\n')
    # Draw a bar plot of survival by the current feature on its own axis.
    # `x` is passed by keyword: on seaborn >= 0.12 the first positional
    # parameter is `data`, so a positional column name would collide with
    # `data=train` and raise a TypeError.
    sns.barplot(x=x, y="Survived", data=train, ax=saxis[ind])
Survival Correlation by: Sex
      Sex  Survived
0  female  0.742038
1    male  0.188908
----------
Survival Correlation by: Pclass
   Pclass  Survived
0       1  0.629630
1       2  0.472826
2       3  0.242363
----------
Survival Correlation by: SibSp
   SibSp  Survived
0      0  0.345395
1      1  0.535885
2      2  0.464286
3      3  0.250000
4      4  0.166667
5