# Preview the Age column for the first five passengers.
# The printed index header below shows the frame is indexed by Name here.
df['Age'][:5]
# Output (kept as comments: a string literal placed directly after an
# expression is a SyntaxError):
# Name
# Braund, Mr. Owen Harris                                22.0
# Cumings, Mrs. John Bradley (Florence Briggs Thayer)    38.0
# Heikkinen, Miss. Laina                                 26.0
# Futrelle, Mrs. Jacques Heath (Lily May Peel)           35.0
# Allen, Mr. William Henry                               35.0
# Name: Age, dtype: float64
# Pull the Age column out as a Series and look one passenger up by label.
age = df['Age']
age['Braund, Mr. Owen Harris']  # 22.0
# Element-wise arithmetic builds a new Series; `age` is rebound to it and
# the column stored in df is left untouched.
age = age + 5
age[:5]
# Output (kept as comments: a string literal placed directly after an
# expression is a SyntaxError):
# Name
# Braund, Mr. Owen Harris                                27.0
# Cumings, Mrs. John Bradley (Florence Briggs Thayer)    43.0
# Heikkinen, Miss. Laina                                 31.0
# Futrelle, Mrs. Jacques Heath (Lily May Peel)           40.0
# Allen, Mr. William Henry                               40.0
# Name: Age, dtype: float64
age.mean()  # 34.69911764705882
age.std()  # 14.526497332334042; age.max() and age.min() are also available
# A more comprehensive and direct way: summary statistics in a single call.
df.describe()
# Pandas index structure
import pandas as pd
# Load the Titanic passenger table; .head() returns the first few rows.
df = pd.read_csv('data/titanic.csv')
df.head(n=6)
# Pick two columns by name, then keep only the first five rows.
df[['Age', 'Fare']].head(5)
# loc: select by label
# iloc: select by position
# iloc: take five rows (positions 0:5) but restrict the result to two
# columns (positions 1:3).
df.iloc[:5, 1:3]
# Index the frame by passenger name so rows can be selected by label.
df1 = df.set_index('Name')
# A single label returns that passenger's row as a Series.
df1.loc['Braund, Mr. Owen Harris']
# Output (kept as comments: a string literal placed directly after an
# expression is a SyntaxError):
# PessengerId is the first field of the row printed below.
# PassengerId            1
# Survived               0
# Pclass                 3
# Sex                 male
# Age                   22
# SibSp                  1
# Parch                  0
# Ticket         A/5 21171
# Fare                7.25
# Cabin                NaN
# Embarked               S
# Name: Braund, Mr. Owen Harris, dtype: object

# A label slice with .loc includes both endpoints; ':' keeps every column.
df1.loc['Braund, Mr. Owen Harris':'Allen, Mr. William Henry', :]
# Assignment: write a single cell addressed by (row label, column label).
df1 = df.set_index(keys='Name')
df1.loc['Braund, Mr. Owen Harris', 'Fare'] = 1000
df1.head(5)
# Boolean indexing.
# NOTE: this rebinds df to the Name-indexed frame, so 'Name' stops being a
# regular column from here on.
df = df.set_index('Name')
# Comparing a column with a scalar yields a boolean Series, one flag per row.
df['Fare'] > 40
# Output (kept as comments: a string literal placed directly after an
# expression is a SyntaxError):
# Name
# Braund, Mr. Owen Harris                                False
# Cumings, Mrs. John Bradley (Florence Briggs Thayer)     True
# Heikkinen, Miss. Laina                                 False
# Futrelle, Mrs. Jacques Heath (Lily May Peel)            True
# Allen, Mr. William Henry                               False
#                                                        ...
# Montvila, Rev. Juozas                                  False
# Graham, Miss. Margaret Edith                           False
# Johnston, Miss. Catherine Helen "Carrie"               False
# Behr, Mr. Karl Howell                                  False
# Dooley, Mr. Patrick                                    False
# Name: Fare, Length: 891, dtype: bool

# Passing the boolean Series back to df keeps only the rows flagged True.
df[df['Fare'] > 40]  # see figure 1
df[df['Sex'] == 'male']  # see figure 2