Series对象
可以理解为带索引标签的一维数组
从数组创建
import numpy as np
import pandas as pd
# Build a Series from a 1-D NumPy array. With no explicit index, pandas
# labels the entries with the default integers 0..n-1.
a = np.arange(5)
data = pd.Series(a)
print(data)

# Same values again, this time labelled with a custom string index.
data = pd.Series(a, index=list('abcde'))
print(data)

# Entries can then be looked up by label.
print(data['a'])
'''
运行结果
0 0
1 1
2 2
3 3
4 4
dtype: int32
a 0
b 1
c 2
d 3
e 4
dtype: int32
0
'''
从字典创建
# Build a Series from a dict: the keys become the index labels and the
# values become the data.
a = dict(zip('abcde', range(5)))
data = pd.Series(a)
print(data)
'''
运行结果
a 0
b 1
c 2
d 3
e 4
dtype: int64
'''
其他创建方式
# Constant fill: a scalar value is repeated for every label in the index.
data = pd.Series(data=5, index=[0, 1, 2])
print(data)

# Explicit selection: when both a dict and an index are given, only the
# entries whose keys are listed in the index are kept.
a = dict(zip('abcde', range(5)))
data = pd.Series(data=a, index=['b', 'd'])
print(data)
'''
运行结果
0 5
1 5
2 5
dtype: int64
b 1
d 3
dtype: int64
'''
属性
# A Series exposes its data and its labels as two separate attributes:
# `.values` is the underlying array, `.index` is the label object.
data = pd.Series(data=5, index=[0, 1, 2])
print(data.values, data.index, sep='\n')
'''
运行结果
[5 5 5]
Int64Index([0, 1, 2], dtype='int64')
'''
DataFrame对象
可以看作一种带有行索引和列名的二维数组，也可以看作一种特殊的字典。
从数组创建
# Build a DataFrame from a 2-D array: each array row becomes a DataFrame
# row (labelled by `index`), each array column a DataFrame column
# (labelled by `columns`).
a = np.array([
    [90, 92, 93],
    [60, 75, 87],
])
data = pd.DataFrame(
    data=a,
    index=['Zhangfei', 'Guanyu'],
    columns=['English', 'Chinese', 'Math'],
)
print(data)
'''
运行结果
English Chinese Math
Zhangfei 90 92 93
Guanyu 60 75 87
'''
从Series创建
# Build DataFrames from Series objects. Each Series holds one subject's
# scores, keyed by student name.
a1 = pd.Series(dict(Zhangfei=90, Guanyu=60))
a2 = pd.Series(dict(Zhangfei=92, Guanyu=75))
a3 = pd.Series(dict(Zhangfei=93, Guanyu=87))

# A single Series becomes a one-column DataFrame.
data = pd.DataFrame(a1)
print(data)

# A dict of Series becomes a multi-column DataFrame: the dict keys are the
# column names and the Series are aligned on their shared index.
data = pd.DataFrame(dict(English=a1, Chinese=a2, Math=a3))
print(data)
'''
运行结果
0
Zhangfei 90
Guanyu 60
English Chinese Math
Zhangfei 90 92 93
Guanyu 60 75 87
'''
从字典创建
# Build a DataFrame from a plain dict: each key is a column name and each
# value is that column's data, one entry per row label in `index`.
a = dict(
    English=(90, 60),
    Chinese=(92, 75),
    Math=(93, 87),
)
data = pd.DataFrame(data=a, index=('Zhangfei', 'Guanyu'))
print(data)
'''
运行结果
English Chinese Math
Zhangfei 90 92 93
Guanyu 60 75 87
'''
从Numpy结构化数组创建
# Build a DataFrame from a NumPy structured array: the dtype's field names
# become the column names.
# NOTE(review): the field order here is (chinese, english, math), while the
# other examples in this file use English/Chinese/Math for the same numbers
# -- confirm which ordering is intended.
datatype = np.dtype([
    ('chinese', 'i4'),
    ('english', 'i4'),
    ('math', 'i4'),
])
a = np.array(
    [
        (90, 92, 93),
        (60, 75, 87),
    ],
    dtype=datatype,
)
data = pd.DataFrame(data=a, index=['Zhangfei', 'Guanyu'])
print(data)
'''
运行结果
chinese english math
Zhangfei 90 92 93
Guanyu 60 75 87
'''
属性
# Inspect the three building blocks of a DataFrame.
a = dict(
    English=(90, 60),
    Chinese=(92, 75),
    Math=(93, 87),
)
data = pd.DataFrame(data=a, index=('Zhangfei', 'Guanyu'))
print(data)

print(data.values)   # the cell values as a 2-D array
print(data.index)    # the row labels
print(data.columns)  # the column labels
'''
运行结果
English Chinese Math
Zhangfei 90 92 93
Guanyu 60 75 87
[[90 92 93]
[60 75 87]]
Index(['Zhangfei', 'Guanyu'], dtype='object')
Index(['English', 'Chinese', 'Math'], dtype='object')
'''
从文件导入
import pandas as pd
from pandas import Series, DataFrame
# Load a spreadsheet into a DataFrame, write it back out under a new name,
# and show it. `pd.read_excel` already returns a DataFrame for a single
# sheet, so no extra `DataFrame(...)` wrapper is needed.
score = pd.read_excel('data.xlsx')

# With the default arguments, `to_excel` also writes the row index as the
# first column of the output file.
score.to_excel('data1.xlsx')

# `print` is a function in Python 3; the statement form `print score` is a
# SyntaxError and was inconsistent with the rest of this file.
print(score)