import pandas as pd
# Build a small five-row student table used by every example below.
df = pd.DataFrame(
    {
        "学号": [1001, 1002, 1003, 1004, 1005],
        "name": ["A", "B", "C", "D", "E"],
        "生日": [
            "1990/01/02",
            "1992/02/05",
            "1990/05/06",
            "1991/05/30",
            "1992/05/03",
        ],
        "性别": ["boy", "girl", "girl", "boy", "girl"],
        "数学": [56, 67, 47, 87, 47],
    }
)
# Parse the birthday strings into timestamps, then promote that column to
# the row index so the frame ends up with a DatetimeIndex named "生日".
df["生日"] = pd.to_datetime(df["生日"])
df = df.set_index("生日")
df
Out[1]:
In [2]:
# Prepend "x" to every column label (returns a new frame).
df.add_prefix(prefix="x")
Out[2]:
In [3]:
# Append "x" to every column label (returns a new frame).
df.add_suffix(suffix="x")
Out[3]:
In [4]:
# Align df with a copy of itself that lacks the row for the latest date;
# the result is a pair of frames sharing the same labels.
df.align(other=df.drop(index=df.index.max()))
Out[4]:
In [5]:
# Remove the row whose index label is the latest date.
df.drop(index=df.index.max())
Out[5]:
In [6]:
# Drop rows that repeat an earlier row, keeping the first occurrence.
df.drop_duplicates(keep="first")
Out[6]:
In [7]:
# Test whether two frames hold the same data; the other frame is df minus
# the row for the latest date, so the comparison is against a shorter frame.
df.equals(other=df.drop(index=df.index.max()))
Out[7]:
In [8]:
# Keep only the listed column labels, producing a sub-frame.
df.filter(items=["name"], axis="columns")
Out[8]:
In [ ]:
# DataFrame.first(offset) selects the initial period of a time series, but
# it needs an offset argument and a sorted DatetimeIndex, and it has been
# deprecated since pandas 2.1.  The equivalent below sorts by date and
# slices from the start up to one year after the earliest date.
df.sort_index().loc[: df.index.min() + pd.DateOffset(years=1)]
In [10]:
# Show the first two rows.
df.head(n=2)
Out[10]:
In [ ]:
# idxmax returns, per column, the index label of the row holding the
# maximum value.  It is only meaningful for numeric data, so the string
# columns are excluded first to avoid a TypeError.
df.select_dtypes(include="number").idxmax()
In [ ]:
# idxmin returns, per column, the index label of the row holding the
# minimum value (the first such row on ties).  String columns are excluded
# first to avoid a TypeError.
df.select_dtypes(include="number").idxmin()
In [ ]:
# DataFrame.last(offset) selects the final period of a time series, but it
# needs an offset argument and a sorted DatetimeIndex, and it has been
# deprecated since pandas 2.1.  The equivalent below sorts by date and
# slices from one year before the latest date through the end.
df.sort_index().loc[df.index.max() - pd.DateOffset(years=1) :]
In [11]:
# Drop the latest-date row, then conform the result back to the original
# index; the label that was removed reappears as a row of missing values.
df.drop(index=df.index.max()).reindex(index=df.index)
Out[11]:
In [12]:
# reindex_axis was deprecated in pandas 0.21 and removed in 1.0; the
# supported spelling is reindex(labels, axis=...).  Here the row axis is
# conformed back to the original index after dropping the latest-date row.
df.drop(index=df.index.max()).reindex(df.index, axis="index")
Out[12]:
In [13]:
# Conform one frame to the labels of another: the caller lacks the
# latest-date row, the template lacks the earliest-date row.
df.drop(index=df.index.max()).reindex_like(other=df.drop(index=df.index.min()))
Out[13]:
In [14]:
# Rename a column label via an old-name -> new-name mapping.
df.rename(mapper={"name": "Name"}, axis="columns")
Out[14]:
In [15]:
# Change the name of the row index itself (not the row labels).
df.rename_axis("name", axis="index")
Out[15]:
In [16]:
# Move the current index back into an ordinary column and replace it with
# the default integer index.
df.reset_index(drop=False)
Out[16]:
In [17]:
# Draw two rows at random.
df.sample(n=2)
Out[17]:
In [ ]:
# DataFrame.select(crit) picked the labels for which a predicate was true;
# it required the predicate argument and was removed in pandas 1.0.  The
# supported replacement is a boolean mask over the labels passed to .loc,
# shown here by keeping only the rows dated in 1992.
df.loc[df.index.year == 1992]
In [18]:
# Use an existing column as the row index (returns a new frame).
df.set_index(keys="性别")
Out[18]:
In [19]:
# Show the last three rows.
df.tail(n=3)
Out[19]:
In [20]:
# Pick rows by integer position (0-based), regardless of index labels.
df.take(indices=[1, 2], axis=0)
Out[20]:
In [21]:
# truncate keeps only the rows whose label lies between `before` and
# `after` (both inclusive).  It requires a sorted index, which this frame
# does not have, so sort by date first and pass explicit bounds.
df.sort_index().truncate(before="1990-05-01", after="1992-03-01")
Out[21]:
In [22]:
# Order the rows by their index labels, ascending.
df.sort_index(axis=0, ascending=True)
Out[22]: