# Pipeline: load the order and product tables, join them, build a
# user-by-aisle frequency table, then reduce its dimensionality with PCA.
#
# NOTE(review): `pd` and `PCA` are not imported in the visible lines --
# presumably pandas and sklearn.decomposition.PCA; confirm they are imported
# before this point.

# 1. Read the tables
prior = pd.read_csv("./data/prior.csv")
products = pd.read_csv("./data/products.csv")

# 2. Merge the tables on their shared `product_id` column
#    (pd.merge performs an inner join by default).
_mg = pd.merge(prior, products, on='product_id')

# 3. Cross-tabulation (a special kind of grouped table): one row per
#    `user_id`, one column per `aisle`, each cell counting how often that
#    pair occurs in the merged table.
# NOTE(review): assumes the merged table has `user_id` and `aisle` columns --
# verify against the CSV schemas.
cross = pd.crosstab(_mg['user_id'], _mg['aisle'])

# 4. Run principal component analysis
# NOTE(review): if PCA is scikit-learn's, a float n_components in (0, 1)
# keeps just enough components to explain that fraction (here 90%) of the
# variance -- confirm.
pca = PCA(n_components=0.9)
data = pca.fit_transform(cross)