2018.1.8
# Train an entropy-criterion decision tree, capped at depth 4, on the full
# feature matrix; fit() returns the estimator itself, so the call is chained.
clf = tree.DecisionTreeClassifier(criterion="entropy", max_depth=4).fit(
    first_set, labels
)
# Evaluate the same tree configuration with 10-fold cross-validation (cv=10)
# and show the per-fold scores.
scores = cross_val_score(clf, first_set, labels, cv=10)
print(scores)
# Visualize the fitted tree: export it as Graphviz DOT text, then render it.
feature_name = ['balance', 'duration']
firstTree_dot = tree.export_graphviz(
    clf,
    out_file=None,  # no output file here; the returned value is fed to graphviz below
    feature_names=feature_name,
    class_names=['not_buy', 'buy'],
)
graph = graphviz.Source(firstTree_dot)
# Output path is relative to the current working directory.
graph.render("../output/TreeForBalanceAndDuration")