|
@@ -4,7 +4,7 @@
|
4
|
4
|
from sklearn import tree
|
5
|
5
|
from sklearn.datasets import load_wine
|
6
|
6
|
from sklearn.model_selection import train_test_split
|
7
|
|
-
|
|
7
|
+import numpy
|
8
|
8
|
import graphviz
|
9
|
9
|
|
10
|
10
|
wine = load_wine()
|
|
@@ -18,12 +18,16 @@ print(wine.feature_names)
|
18
|
18
|
print(wine.target_names)
|
19
|
19
|
|
20
|
20
|
Xtrain, Xtest, Ytrain, Ytest = train_test_split(wine.data,wine.target,test_size=0.3)
|
21
|
|
-clf = tree.DecisionTreeClassifier(criterion="entropy")#实例化,criterion不写的话默认是基尼系数
|
|
21
|
+numpy.savetxt("foo.csv", Xtrain, delimiter=",")
|
|
22
|
+
|
|
23
|
+clf = tree.DecisionTreeClassifier(criterion="entropy", max_features=1, max_depth=5)#实例化,criterion不写的话默认是基尼系数
|
|
24
|
+# clf.n_features_ = 2
|
22
|
25
|
clf = clf.fit(Xtrain, Ytrain)
|
23
|
26
|
score = clf.score(Xtest, Ytest) #返回预测的准确度
|
24
|
27
|
print("score:", score)
|
25
|
28
|
|
26
|
|
-feature_name = ['酒精', '苹果酸', '灰', '灰的碱性', '镁', '总酚', '类黄酮', '非黄烷类酚类', '花青素', '颜色强度', '色调', 'od280/od315稀释葡萄酒', '脯氨酸']
|
|
29
|
+feature_name = ['酒精', '苹果酸', '灰', '灰的碱性', '镁', '总酚', '类黄酮',
|
|
30
|
+ '非黄烷类酚类', '花青素', '颜色强度', '色调', 'od280/od315稀释葡萄酒', '脯氨酸']
|
27
|
31
|
|
28
|
32
|
|
29
|
33
|
dot_data = tree.export_graphviz(clf
|
|
@@ -35,6 +39,6 @@ dot_data = tree.export_graphviz(clf
|
35
|
39
|
)
|
36
|
40
|
dot_data = dot_data.replace('helvetica', '"Microsoft YaHei"')
|
37
|
41
|
graph = graphviz.Source(dot_data)
|
38
|
|
-graph.render("Tree")
|
|
42
|
+graph.render("Tree1")
|
39
|
43
|
graph # graph.view()
|
40
|
44
|
|