# Three ways of building pandas datetime objects, each yielding a different type.
# A start date plus a number of periods gives a DatetimeIndex of consecutive days.
dt1 = pd.date_range(start='20190101', periods=3)
# A single date string is parsed into a scalar Timestamp.
dt2 = pd.to_datetime('01/01/2019')
# A list of date strings (even of length one) is parsed into a DatetimeIndex.
dt3 = pd.to_datetime(['01/01/2019'])
dt1, dt2, dt3的数据类型分别是:
DatetimeIndex, Timestamp, DatetimeIndex
第四课 Pandas时序型数据分析
第二节 时间戳索引
import pandas as pd
date_range
# Daily DatetimeIndex from 2019-01-01 through 2019-02-01, both endpoints included.
# The daily frequency is written out explicitly; it is what pandas uses here by default.
pd.date_range(start='2019-01-01', end='2019-02-01', freq='D')
DatetimeIndex(['2019-01-01', '2019-01-02', '2019-01-03', '2019-01-04',
'2019-01-05', '2019-01-06', '2019-01-07', '2019-01-08',
'2019-01-09', '2019-01-10', '2019-01-11', '2019-01-12',
'2019-01-13', '2019-01-14', '2019-01-15', '2019-01-16',
'2019-01-17', '2019-01-18', '2019-01-19', '2019-01-20',
'2019-01-21', '2019-01-22', '2019-01-23', '2019-01-24',
'2019-01-25', '2019-01-26', '2019-01-27', '2019-01-28',
'2019-01-29', '2019-01-30', '2019-01-31', '2019-02-01'],
dtype='datetime64[ns]', freq='D')
# Load the Beijing PM2.5 dataset from the local CSV file into a DataFrame,
# then preview its first five rows.
data_df = pd.read_csv(
    filepath_or_buffer='./datasets/BeijingPM20100101_20151231.csv',
)
data_df.head(n=5)
No year month day hour season PM_Dongsi PM_Dongsihuan PM_Nongzhanguan PM_US Post DEWP HUMI PRES TEMP cbwd Iws precipitation Iprec
0 1 2010 1 1 0 4 NaN NaN NaN NaN -21.0 43.0 1021.0 -11.0 NW 1.79 0.0 0.0
1 2 2010 1 1 1 4 NaN NaN NaN NaN -21.0 47.0 1020.0 -12.0 NW 4.92 0.0 0.0
2 3 2010 1 1 2 4 NaN NaN NaN NaN -21.0 43.0 1019.0 -11.0 NW 6.71 0.0 0.0
3 4 2010 1 1 3 4 NaN NaN NaN NaN -21.0 55.0 1019.0 -14.0 NW 9.84 0.0 0.0
4 5 2010 1 1 4 4 NaN NaN NaN NaN -20.0 51.0 1018.0 -12.0 NW 12.97 0.0 0.0
# Use timestamps as the row index. The timestamp is assembled from the
# year/month/day columns only; 'hour' is not included, so rows recorded on the
# same day share one index value.
data_df.index = pd.to_datetime(data_df.loc[:, ['year', 'month', 'day']])
data_df.head(n=5)
No year month day hour season PM_Dongsi PM_Dongsihuan PM_Nongzhanguan PM_US Post DEWP HUMI PRES TEMP cbwd Iws precipitation Iprec
2010-01-01 1 2010 1 1 0 4 NaN NaN NaN NaN -21.0 43.0 1021.0 -11.0 NW 1.79 0.0 0.0
2010-01-01 2 2010 1 1 1 4 NaN NaN NaN NaN -21.0 47.0 1020.0 -12.0 NW 4.92 0.0 0.0
2010-01-01 3 2010 1 1 2 4 NaN NaN NaN NaN -21.0 43.0 1019.0 -11.0 NW 6.71 0.0 0.0
2010-01-01 4 2010 1 1 3 4 NaN NaN NaN NaN -21.0 55.0 1019.0 -14.0 NW 9.84 0.0 0.0
2010-01-01 5 2010 1 1 4 4 NaN NaN NaN NaN -20.0 51.0 1018.0 -12.0 NW 12.97 0.0 0.0
# Inspect the index that was just assigned: it is displayed as a DatetimeIndex,
# and the same date repeats across consecutive rows.
data_df.index
DatetimeIndex(['2010-01-01', '2010-01-01', '2010-01-01', '