数据初识

import pandas as pd
# Load the station table and preview its first rows.
stations = pd.read_csv('stations.csv', encoding='utf-8')
print(stations.head())
# Recorded sample output:
#     id     name   lat  long  docks        city
# 0  1.0  '#SAN#'  37.3  -121   27.0  'San Jose'
# 1  1.0  '#SAN#'  37.3  -121   27.0  'San Jose'
# 2  1.0  '#SAN#'  37.3  -121   27.0  'San Jose'
# 3  1.0  '#SAN#'  37.3  -121   27.0  'San Jose'
# 4  1.0  '#SAN#'  37.3  -121   27.0  'San Jose'

# Load the three trip files, reporting the shape of each one as it is read.
trips1 = pd.read_csv('trips1.csv', encoding='utf-8')
print(trips1.shape)
# Recorded sample output: (6, 5)

trips2 = pd.read_csv('trips2.csv', encoding='utf-8')
print(trips2.shape)  # was trips1.shape (copy-paste slip)

trips3 = pd.read_csv('trips3.csv', encoding='utf-8')
print(trips3.shape)  # was trips1.shape (copy-paste slip)

# Stack trips1, trips2 and trips3 into a single DataFrame named trips.
# Each frame keeps its own row labels, so index values repeat in the result.
trips = pd.concat([trips1, trips2, trips3])
# Recorded sample shape of the combined frame: (18, 5)

# Prefix every station column name with 'start_' so that the station id
# column becomes 'start_id', the key used for the merge below.
stations = stations.add_prefix('start_')
# NOTE(review): the original write-up also mentions making start_id the
# index (stations.set_index(['start_id'], inplace=True)); that step was
# left disabled, so start_id stays an ordinary column here.
print('stations----')
print(stations)


print('-----trips-----')
print(trips)
# Join trips with stations on the starting-station id. An inner join keeps
# only the rows whose start_id is present in both frames.
print('----合并后----')
trips_stations = trips.merge(stations, on='start_id', how='inner')
print(trips_stations)

# Export the merged result to 'trips_stations.csv'.

trips_stations.to_csv('trips_stations.csv')

 

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值