Pandas常用函数
一、导入数据
导入Pandas包和打印版本号
# Import pandas under its conventional alias.
import pandas as pd
# Evaluate the installed pandas version string (displayed when run interactively).
pd.__version__
从列表创建Series
# Build a Series from a plain Python list; no index is given, so pandas
# assigns the default positional index.
s = pd.Series(data=[0, 1, 2, 3, 4])
s
从字典创建Series
# Build a Series from a mapping: the keys become the index labels and the
# values become the data.
s = pd.Series(dict(a=1, b=2, c=3, d=4, e=5))
s
从Numpy数组创建DataFrame
import numpy as np

# Build a 3x4 DataFrame of standard-normal random values, indexed by three
# consecutive daily timestamps starting from 'today', with columns A-D.
s = pd.DataFrame(
    data=np.random.randn(3, 4),
    index=pd.date_range(start='today', periods=3),
    columns=list('ABCD'),
)
s
传入索引
# Build a Series with explicit index labels 1..4 instead of the default
# zero-based positional index.
s = pd.Series(data=list('abcd'), index=[1, 2, 3, 4])
s
指定行列索引
# Build a DataFrame from a list of rows, giving both the row labels (index)
# and the column labels explicitly.
s = pd.DataFrame(
    data=[['a', 'A'], ['b', 'B'], ['c', 'C'], ['d', 'D']],
    index=["一", "二", "三", "四"],
    columns=["列一", "列二"],
)
s
pd.read_excel、pd.read_csv、pd.read_table导入文件数据
# Each line below is an independent example of one loading option; every
# call rebinds df, so only the last one executed determines its value.

# Excel: select the worksheet by name.
df = pd.read_excel(r"excel.xlsx", sheet_name="Sheet1")
# Excel: select the worksheet by zero-based position.
df = pd.read_excel(r"excel.xlsx", sheet_name=0)
# Excel: use the first column as the row index.
df = pd.read_excel(r"excel.xlsx", index_col=0)
# Excel: use the first row as the column header.
df = pd.read_excel(r"excel.xlsx", header=0)
# Excel: load only the columns at positions 0 and 3. usecols must be a list
# of integers or strings; the previous value [0.3] was a single float
# (comma typed as a dot), which pandas rejects.
df = pd.read_excel(r"excel.xlsx", usecols=[0, 3])
# CSV: fields separated by a single space.
df = pd.read_csv(r"csv.csv", sep=' ')
# CSV: read only the first 30 data rows.
df = pd.read_csv(r"csv.csv", sep=' ', nrows=30)
# CSV: decode the file as GBK.
df = pd.read_csv(r"csv.csv", sep=' ', encoding='gbk')
# Delimited text file, space-separated.
# NOTE(review): "txt.txy" looks like a typo for "txt.txt" - confirm the
# intended file name before changing it.
df = pd.read_table(r"txt.txy", sep=" ")
head(10)查看前10行数据(head()不传参数时默认返回前5行)
# Show the first 10 rows of df (head() returns 5 rows when n is omitted).
df.head(n=10)
info()查看数据类型、缺失值
# Print a summary of df: column dtypes and non-null counts, which reveals
# missing values. Assumes df is the DataFrame loaded earlier in these notes.
df.info()
describe()查看数据分布
# Compute descriptive statistics for df to inspect how the data is
# distributed. Assumes df is the DataFrame loaded earlier in these notes.
df.describe()
columns查看列名称
# Column labels of df (an attribute, not a method call).
df.columns
index查看索引