python-数据处理-合并表

# Workflow:
#   1. Read the data.
#   2. Merge the tables.
#   3. Find the relationship between user_id and aisle.
import pandas as pd

# All four CSV files live in the same folder; keeping the folder in one place
# means the location only has to be edited once.
DATA_DIR = "C:/Users/18578/Desktop/instacart"

# 1. Load the data.
order_products = pd.read_csv(f"{DATA_DIR}/order_products__prior.csv")
products = pd.read_csv(f"{DATA_DIR}/products.csv")
orders = pd.read_csv(f"{DATA_DIR}/orders.csv")
aisles = pd.read_csv(f"{DATA_DIR}/aisles.csv")

# 2. Merge the tables step by step. Each join names its key column exactly
# once, and pd.merge's default inner join is used throughout.
# aisles + products, matched on aisle_id.
tab1 = pd.merge(aisles, products, on="aisle_id")

# ... + order_products, matched on product_id.
tab2 = pd.merge(tab1, order_products, on="product_id")

# ... + orders, matched on order_id; tab3 is the fully merged table.
tab3 = pd.merge(tab2, orders, on="order_id")
# Bare expression: displays the merged table when run as a notebook cell.
tab3
aisle_idaisleproduct_idproduct_namedepartment_idorder_idadd_to_cart_orderreordereduser_ideval_setorder_numberorder_doworder_hour_of_daydays_since_prior_order
01prepared soups salads209Italian Pasta Salad209424650114082prior260201.0
11prepared soups salads22853Pesto Pasta Salad209424640114082prior260201.0
24instant foods12087Chicken Flavor Ramen Noodle Soup994246150114082prior260201.0
34instant foods47570Original Flavor Macaroni & Cheese Dinner994246141114082prior260201.0
413prepared meals10089Dolmas2094246250114082prior260201.0
.............................................
32434484134specialty wines champagnes47713Sparkling Rose530148721063218prior1114NaN
32434485134specialty wines champagnes49562Blanc De Noirs Sparkling Wine5345701137901prior133913.0
32434486134specialty wines champagnes49562Blanc De Noirs Sparkling Wine52509231126431prior2751110.0
32434487134specialty wines champagnes49562Blanc De Noirs Sparkling Wine513194021126431prior342147.0
32434488134specialty wines champagnes49562Blanc De Noirs Sparkling Wine522989861037901prior921113.0

32434489 rows × 14 columns

from sklearn.decomposition import PCA

# Cross-tabulate the merged table: one row per user_id, one column per aisle,
# each cell holding how many rows of tab3 have that (user_id, aisle) pair.
table = pd.crosstab(index=tab3['user_id'], columns=tab3['aisle'])
# Work on the first 1000 rows only.
data = table.head(1000)

# PCA dimensionality reduction.
# 1) Instantiate the transformer; n_components=0.95 is passed as a fraction
#    rather than a component count.
transfer = PCA(n_components=0.95)
# 2) Call fit_transform to fit on `data` and return the reduced array.
data_new = transfer.fit_transform(data)
# Bare expression: displays the reduced shape when run as a notebook cell.
data_new.shape

(1000, 35)
  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值