实例一:餐厅订单数据分析
#先进行设置
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
plt.rcParams['font.sans-serif'] = ['Arial Unicode MS']#设置字体
%matplotlib inline
2. 加载同一个 Excel 文件中的三个工作表,将其合并,并删除含有缺失值的列
# Step 1: load the three order-detail sheets from the workbook.
# Passing a list to `sheet_name` opens the workbook once and returns a
# {sheet name: DataFrame} dict, instead of re-reading the file per sheet.
sheet_names = ['meal_order_detail1', 'meal_order_detail2', 'meal_order_detail3']
sheets = pd.read_excel('meal_order_detail.xlsx', sheet_name=sheet_names)
data1, data2, data3 = (sheets[name] for name in sheet_names)

# Step 2: stack the three tables on top of each other (axis=0 appends rows).
# Each sheet keeps its own row labels, so index values repeat across sheets.
data = pd.concat([data1, data2, data3], axis=0)
# Optional: preview the first rows with data.head(5).

# Drop every column that contains at least one missing value
# (axis=1 selects columns; inplace=True modifies `data` directly).
data.dropna(axis=1, inplace=True)

# Print a summary of the remaining columns, non-null counts and dtypes.
data.info()
输出:
<class 'pandas.core.frame.DataFrame'> Int64Index: 10037 entries, 0 to 3610 Data columns (total 11 columns): # Column Non-Null Count Dtype --- ------ -------------- ----- 0 detail_id 10037 non-null int64 1 order_id 10037 non-null int64 2 dishes_id 10037 non-null int64 3 dishes_name 10037 non-null object 4 itemis_add 10037 non-null int64 5 counts 10037 non-null int64 6 amounts 10037 non-null int64 7 place_order_time 10037 non-null datetime64[ns] 8 add_inprice 10037 non-null int64 9 picture_file 10037 non-null object 10 emp_id