# Inspect the data frequency/distribution: the number of items each user has interacted with
import numpy as np
import pylab as pl
# Plot a histogram of the per-user interaction counts.
#
# `itemlen` must already be defined before this point, e.g.
#   itemlen = [number of items each user interacted with]
data = np.array(itemlen)

# 50 evenly spaced edges over the observed range, i.e. 49 equal-width bins.
# ndarray.min()/max() reduce in native code rather than iterating the array
# element by element like the builtin min()/max(); the values are the same.
bins = np.linspace(data.min(), data.max(), 50)

pl.hist(data, bins)
# The '×××' markers are placeholders for the quantity being counted.
pl.xlabel('Number of ×××')
pl.ylabel('Number of occurrences')
pl.title('Frequency distribution of number of ×××s')
pl.show()