#将DTdata.csv中的数据带入play_decision变量中,有header,分隔符为,
>
play_decision <- read.table(
  file = "DTdata.csv",
  header = TRUE, # the first line of the file supplies the column names
  sep = ","      # fields are comma-separated
)
#查看数据
>
play_decision # bare name at the prompt: the console auto-prints the data frame
   Play  Outlook Temperature Humidity  Wind
1   yes    rainy        cool   normal FALSE
2    no    rainy        cool   normal  TRUE
3   yes overcast         hot     high FALSE
4    no    sunny        mild     high FALSE
5   yes    rainy        cool   normal FALSE
6   yes    sunny        cool   normal FALSE
7   yes    rainy        cool   normal FALSE
8   yes    sunny         hot   normal FALSE
9   yes overcast        mild     high  TRUE
10   no    sunny        mild     high  TRUE
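# Build a decision-tree model with rpart() that predicts Play from the four
# attributes. method = "class" builds a classification tree, data names the
# data frame that holds the attributes, and control governs tree growth:
# minsplit = 1 requires a node to contain at least one observation before a
# split is attempted.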
>
fit <-
rpart(
Play
~
Outlook +
Temperature +
Humidity +
Wind ,
method =
"class" ,
data =
play_decision ,
control =
rpart.control(
minsplit =
1) ,
parms =
list(
split=
"information"</