/* Implementation of an association-rule mining example */
/* Load the association data: each column is one item of the item set and each row is one
   record (transaction). A 0 in a column means the record does not contain that item,
   a 1 means it does. */
data test;
    /* List input: the blank-separated fields map, in order, to id and class1..class7. */
    input id class1-class7;
    datalines;
1 0 0 1 1 0 1 0
2 1 0 0 1 0 1 1
3 0 1 1 0 1 1 0
4 1 1 0 1 0 1 1
5 0 1 1 1 0 1 0
6 0 0 0 1 0 1 1
;
run;
/* Reshape the wide 0/1 matrix in TEST into transactional (tid, item) rows:
   one output row per item that a record actually contains.
     tid  - transaction id, taken from the row number of TEST
     item - name of the item column (class1..class7) whose flag is 1
   Assigning the numeric flag itself to ITEM would store the flag value rather than the
   item's identity, so every transaction would consist only of the pseudo-items "0" and "1";
   the item name is emitted instead, and only when the record contains the item. */
data items2;
    set test;
    length tid 8 item $8;
    array flags{*} class1-class7;
    tid = _n_;
    do _i = 1 to dim(flags);
        /* A flag of 1 marks the item as present in this record; 0 rows are skipped. */
        if flags{_i} = 1 then do;
            item = vname(flags{_i});
            output;
        end;
    end;
    /* Only the transactional pair is kept; the flag columns and loop index are dropped. */
    keep tid item;
run;
/* Declare ITEM in ITEMS2 as an 8-character column. */
proc sql;
    alter table items2
        modify item char(8);
quit;
/* Association analysis */

/* Build the DMDB catalog DBCAT that the ASSOC and RULEGEN steps below reference through
   their dmdbcat= option; TID and ITEM are both declared as class variables. */
proc dmdb dmdbcat=dbcat data=items2;
    class tid item;
run;
quit;

/* Find item sets, grouping rows by TID with ITEM as the target; results go to FREQUENTITEMS.
   NOTE(review): pctsup=0.5 is presumably the minimum-support threshold - confirm its units
   against the PROC ASSOC documentation. */
proc assoc dmdbcat=dbcat data=items2 out=frequentItems pctsup=0.5;
    id tid;
    target item;
run;

/* Generate rules from FREQUENTITEMS into RULES.
   NOTE(review): minconf=80 is presumably a minimum confidence in percent - confirm. */
proc rulegen dmdbcat=dbcat in=frequentItems out=rules minconf=80;
run;
/* Order RULES in place so the rows with the largest CONF come first. */
proc sort data=rules;
    by descending conf;
run;
/* Keep only the association rules whose result involves the survival variable:
   rules with more than one item (set_size > 1) whose right-hand side is 'Yes' or 'No'.
   String literals must be delimited by plain ASCII quotes; typographic quotes are not
   valid SAS string delimiters and make the WHERE clause fail to parse. */
/* NOTE(review): the sample data read earlier in this program contains no 'Yes'/'No' item
   values, so this filter looks carried over from a different dataset and is likely to
   select no rows here - confirm the intended right-hand-side values. */
data surviverules;
    set rules(where=(set_size > 1 and _rhand in ('Yes', 'No')));
run;
/* List the confidence, support, lift and rule text of each retained rule. */
proc print data=surviverules;
    var conf support lift rule;
run;
/* SAS association rules */
/* (Source-page footer: "Latest recommended article, published 2022-03-02 11:25:18") */