from sklearn.feature_extraction import DictVectorizer
import csv
from sklearn import preprocessing
from sklearn import tree
from sklearn.externals.six import StringIO
# Read the CSV file: collect one feature dict per row plus the class label.
# NOTE(review): column 0 is skipped (presumably a row-id column) and the
# last column is treated as the class label -- confirm against buy_computer.csv.
featureList = []
labelList = []
with open(r'C:\Users\Administrator\Desktop\buy_computer.csv', 'r') as allElectronicsData:
    reader = csv.reader(allElectronicsData)
    headers = next(reader)  # Python 3: next(reader); reader.next() was Python 2 only
    print(headers)
    for row in reader:
        labelList.append(row[-1])  # last column is the class label
        # Map header name -> categorical value for the feature columns.
        rowDict = {headers[i]: row[i] for i in range(1, len(row) - 1)}
        featureList.append(rowDict)
print(featureList)

# Vectorize the categorical features into one-hot numeric columns.
vec = DictVectorizer()
dummyX = vec.fit_transform(featureList).toarray()
print("dummyX:" + str(dummyX))
# NOTE(review): on scikit-learn >= 1.0 this is get_feature_names_out()
print(vec.get_feature_names())
print("labellist: " + str(labelList))

# Vectorize the class labels into 0/1.
lb = preprocessing.LabelBinarizer()
dummyY = lb.fit_transform(labelList)
print("labelList: " + str(labelList))
print("dummyY: " + str(dummyY))

# Train a decision tree using the information-gain (entropy) criterion.
clf = tree.DecisionTreeClassifier(criterion='entropy')
clf = clf.fit(dummyX, dummyY)
print("clf: " + str(clf))

# Visualise the model: export the tree to a Graphviz .dot file.
with open("allElectronicInformationGainOri.dot", 'w') as f:
    # export_graphviz writes into f and returns None when out_file is given,
    # so do not rebind f to its result.
    tree.export_graphviz(clf, feature_names=vec.get_feature_names(), out_file=f)

# Predict on a modified copy of the first training row.
oneRowX = dummyX[0, :]
print("oneRowX: " + str(oneRowX))
# Copy before editing: plain assignment would alias row 0 of dummyX and
# mutate the training matrix in place.
newRowX = oneRowX.copy()
newRowX[0] = 1
newRowX[2] = 0
print("newRowX: " + str(newRowX))  # was mislabeled "predictedY" in the original
# predict() expects a 2-D array of shape (n_samples, n_features).
predictedY = clf.predict(newRowX.reshape(1, -1))
print("predictedY: " + str(predictedY))
# NOTE(review): the lines removed here were an exact byte-for-byte duplicate
# of the entire script above (imports, CSV parsing, vectorization, training,
# Graphviz export, and prediction). Executing it a second time only repeated
# the same work and rewrote the same output file, so the duplicate block was
# deleted. No other code referenced anything defined only in the copy.