输入数据格式
25 52 164 240 274 328 368 448 538 561 630 687 730 775 825 834
39 120 124 205 401 581 704 814 825 834
35 249 674 712 733 759 854 950
39 422 449 704 825 857 895 937 954 964
15 229 262 283 294 352 381 708 738 766 853 883 966 978
具体函数解释
1. createC1(dataSet)
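创建候选1项集:遍历数据集,统计每个 item 的出现次数(support 计数,保存在字典 C1_dict 中),并按首次出现的顺序返回由单元素列表组成的候选集 C1(例如 [[25], [52], ...])。注意:函数只返回 C1,字典中的计数不会返回。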
def createC1(dataSet):
    """Build the candidate 1-itemsets (C1) from a collection of transactions.

    Args:
        dataSet: An iterable of transactions, each an iterable of hashable
            items (the items are used as dictionary keys).

    Returns:
        A list of single-element lists, one per distinct item, in the order
        each item is first encountered, e.g. ``[[25], [52], [164]]``.
        An empty ``dataSet`` yields ``[]``.

    Side effects:
        Prints the resulting candidate list to stdout.
    """
    # Occurrence count per item. Only the keys (and their insertion order)
    # feed the return value; the counts themselves are not returned.
    support_counts = {}
    for transaction in dataSet:
        for item in transaction:
            support_counts[item] = support_counts.get(item, 0) + 1

    # Wrap every distinct item in its own list so each entry is a 1-itemset.
    C1 = [[item] for item in support_counts]
    print("C1: ", C1)
    return C1
# C1 = createC1(dataSet)
# print("C1:",C1) # C1: [[25], [52], [164], [240], [274]]
2. selectLk(dataSet,Ck,minSupport)
寻找k-频繁