forked from dodgy719/Decisions_with_ML
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdtree.dot
217 lines (217 loc) · 14.9 KB
/
dtree.dot
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
// Binary decision tree for an income classifier (classes "Over $50k" and
// "Less than $50k"), expressed as a Graphviz digraph with 107 nodes (0-106).
//
// NOTE(review): the layout matches scikit-learn's export_graphviz output, so
// this file is presumably generated -- if so, fix issues in the generating
// script and re-export rather than hand-editing here.
//
// Node labels are HTML-like labels (<...> with <br/> line breaks) holding:
//   - the split test (internal nodes only; leaves omit it)
//   - gini    : impurity of the node
//   - samples : number of samples reaching the node
//   - value   : pair of per-class totals; the entries are fractional while
//               samples are integers -- presumably class-weighted counts,
//               TODO confirm against the training code
//   - class   : label of the class with the larger value entry
// fillcolor encodes the majority class (orange / blue hues) and gets paler as
// the two value entries get closer (#ffffff at the 375.0 / 375.0 root).
//
// Pure leaves are written as "gini = 0.0"; a "-0.0" there is only a
// floating-point sign artifact, since Gini impurity cannot be negative.
//
// NOTE(review): the first value entry is the one labelled "Over $50k" (see
// node 1). Assuming the first-listed child is always the True branch, node 6
// (not married, no bachelor's degree, age <= 24.5) is 74 samples that are all
// "Over $50k", which looks implausible. The class names passed to the exporter
// may be in the wrong order -- verify in the generating script.
digraph Tree {
// Defaults applied to every node and edge.
node [shape=box, style="filled, rounded", color="black", fontname=helvetica] ;
edge [fontname=helvetica] ;
// Root split. Only the two edges leaving the root carry True/False head labels.
0 [label=<marital_status_Married ≤ 0.5<br/>gini = 0.5<br/>samples = 750<br/>value = [375.0, 375.0]<br/>class = Less than $50k>, fillcolor="#ffffff"] ;
// ---- True branch of the root (marital_status_Married <= 0.5): nodes 1-53 ----
1 [label=<education_Bachelors ≤ 0.5<br/>gini = 0.27<br/>samples = 299<br/>value = [246.429, 47.26]<br/>class = Over $50k>, fillcolor="#ea995f"] ;
0 -> 1 [labeldistance=2.5, labelangle=45, headlabel="True"] ;
2 [label=<hours_per_week ≤ 49.0<br/>gini = 0.195<br/>samples = 258<br/>value = [225.0, 27.74]<br/>class = Over $50k>, fillcolor="#e89151"] ;
1 -> 2 ;
3 [label=<occupation_Professional ≤ 0.5<br/>gini = 0.119<br/>samples = 215<br/>value = [196.753, 13.356]<br/>class = Over $50k>, fillcolor="#e78a46"] ;
2 -> 3 ;
4 [label=<age ≤ 53.5<br/>gini = 0.081<br/>samples = 199<br/>value = [186.039, 8.219]<br/>class = Over $50k>, fillcolor="#e68742"] ;
3 -> 4 ;
5 [label=<age ≤ 24.5<br/>gini = 0.056<br/>samples = 181<br/>value = [171.429, 5.137]<br/>class = Over $50k>, fillcolor="#e6853f"] ;
4 -> 5 ;
6 [label=<gini = 0.0<br/>samples = 74<br/>value = [72.078, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
5 -> 6 ;
7 [label=<age ≤ 26.5<br/>gini = 0.093<br/>samples = 107<br/>value = [99.351, 5.137]<br/>class = Over $50k>, fillcolor="#e68843"] ;
5 -> 7 ;
8 [label=<gini = 0.288<br/>samples = 12<br/>value = [9.74, 2.055]<br/>class = Over $50k>, fillcolor="#ea9c63"] ;
7 -> 8 ;
9 [label=<gini = 0.064<br/>samples = 95<br/>value = [89.61, 3.082]<br/>class = Over $50k>, fillcolor="#e68540"] ;
7 -> 9 ;
10 [label=<education_Masters ≤ 0.5<br/>gini = 0.288<br/>samples = 18<br/>value = [14.61, 3.082]<br/>class = Over $50k>, fillcolor="#ea9c63"] ;
4 -> 10 ;
11 [label=<occupation_Sales ≤ 0.5<br/>gini = 0.216<br/>samples = 17<br/>value = [14.61, 2.055]<br/>class = Over $50k>, fillcolor="#e99355"] ;
10 -> 11 ;
12 [label=<gini = 0.13<br/>samples = 15<br/>value = [13.636, 1.027]<br/>class = Over $50k>, fillcolor="#e78a48"] ;
11 -> 12 ;
13 [label=<gini = 0.5<br/>samples = 2<br/>value = [0.974, 1.027]<br/>class = Less than $50k>, fillcolor="#f5fafe"] ;
11 -> 13 ;
14 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.0, 1.027]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
10 -> 14 ;
15 [label=<hours_per_week ≤ 33.5<br/>gini = 0.438<br/>samples = 16<br/>value = [10.714, 5.137]<br/>class = Over $50k>, fillcolor="#f1bd98"] ;
3 -> 15 ;
16 [label=<gini = 0.0<br/>samples = 4<br/>value = [3.896, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
15 -> 16 ;
17 [label=<hours_per_week ≤ 38.0<br/>gini = 0.49<br/>samples = 12<br/>value = [6.818, 5.137]<br/>class = Over $50k>, fillcolor="#f9e0ce"] ;
15 -> 17 ;
18 [label=<gini = 0.0<br/>samples = 2<br/>value = [0.0, 2.055]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
17 -> 18 ;
19 [label=<age ≤ 53.5<br/>gini = 0.429<br/>samples = 10<br/>value = [6.818, 3.082]<br/>class = Over $50k>, fillcolor="#f1ba93"] ;
17 -> 19 ;
20 [label=<gini = 0.254<br/>samples = 7<br/>value = [5.844, 1.027]<br/>class = Over $50k>, fillcolor="#ea975c"] ;
19 -> 20 ;
21 [label=<gini = 0.436<br/>samples = 3<br/>value = [0.974, 2.055]<br/>class = Less than $50k>, fillcolor="#97cbf1"] ;
19 -> 21 ;
22 [label=<age ≤ 57.5<br/>gini = 0.447<br/>samples = 43<br/>value = [28.247, 14.384]<br/>class = Over $50k>, fillcolor="#f2c19e"] ;
2 -> 22 ;
23 [label=<education_Doctorate ≤ 0.5<br/>gini = 0.423<br/>samples = 41<br/>value = [28.247, 12.329]<br/>class = Over $50k>, fillcolor="#f0b88f"] ;
22 -> 23 ;
24 [label=<marital_status_Single ≤ 0.5<br/>gini = 0.378<br/>samples = 37<br/>value = [27.273, 9.247]<br/>class = Over $50k>, fillcolor="#eeac7c"] ;
23 -> 24 ;
25 [label=<age ≤ 40.5<br/>gini = 0.493<br/>samples = 14<br/>value = [7.792, 6.164]<br/>class = Over $50k>, fillcolor="#fae5d6"] ;
24 -> 25 ;
26 [label=<gini = 0.228<br/>samples = 8<br/>value = [6.818, 1.027]<br/>class = Over $50k>, fillcolor="#e99457"] ;
25 -> 26 ;
27 [label=<gini = 0.268<br/>samples = 6<br/>value = [0.974, 5.137]<br/>class = Less than $50k>, fillcolor="#5fb0ea"] ;
25 -> 27 ;
28 [label=<education_Masters ≤ 0.5<br/>gini = 0.236<br/>samples = 23<br/>value = [19.481, 3.082]<br/>class = Over $50k>, fillcolor="#e99558"] ;
24 -> 28 ;
29 [label=<gini = 0.11<br/>samples = 18<br/>value = [16.558, 1.027]<br/>class = Over $50k>, fillcolor="#e78945"] ;
28 -> 29 ;
30 [label=<gini = 0.485<br/>samples = 5<br/>value = [2.922, 2.055]<br/>class = Over $50k>, fillcolor="#f7dac4"] ;
28 -> 30 ;
31 [label=<workclass_Private ≤ 0.5<br/>gini = 0.365<br/>samples = 4<br/>value = [0.974, 3.082]<br/>class = Less than $50k>, fillcolor="#78bced"] ;
23 -> 31 ;
32 [label=<age ≤ 34.5<br/>gini = 0.5<br/>samples = 2<br/>value = [0.974, 1.027]<br/>class = Less than $50k>, fillcolor="#f5fafe"] ;
31 -> 32 ;
33 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.974, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
32 -> 33 ;
34 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.0, 1.027]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
32 -> 34 ;
35 [label=<gini = 0.0<br/>samples = 2<br/>value = [0.0, 2.055]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
31 -> 35 ;
36 [label=<gini = 0.0<br/>samples = 2<br/>value = [0.0, 2.055]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
22 -> 36 ;
37 [label=<hours_per_week ≤ 46.5<br/>gini = 0.499<br/>samples = 41<br/>value = [21.429, 19.521]<br/>class = Over $50k>, fillcolor="#fdf4ed"] ;
1 -> 37 ;
38 [label=<occupation_Service ≤ 0.5<br/>gini = 0.452<br/>samples = 30<br/>value = [19.481, 10.274]<br/>class = Over $50k>, fillcolor="#f3c3a1"] ;
37 -> 38 ;
39 [label=<hours_per_week ≤ 32.5<br/>gini = 0.466<br/>samples = 28<br/>value = [17.532, 10.274]<br/>class = Over $50k>, fillcolor="#f4cbad"] ;
38 -> 39 ;
40 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.974, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
39 -> 40 ;
41 [label=<age ≤ 22.5<br/>gini = 0.473<br/>samples = 27<br/>value = [16.558, 10.274]<br/>class = Over $50k>, fillcolor="#f5cfb4"] ;
39 -> 41 ;
42 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.0, 1.027]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
41 -> 42 ;
43 [label=<occupation_Professional ≤ 0.5<br/>gini = 0.46<br/>samples = 26<br/>value = [16.558, 9.247]<br/>class = Over $50k>, fillcolor="#f4c7a8"] ;
41 -> 43 ;
44 [label=<gini = 0.491<br/>samples = 19<br/>value = [10.714, 8.219]<br/>class = Over $50k>, fillcolor="#f9e2d1"] ;
43 -> 44 ;
45 [label=<gini = 0.254<br/>samples = 7<br/>value = [5.844, 1.027]<br/>class = Over $50k>, fillcolor="#ea975c"] ;
43 -> 45 ;
46 [label=<gini = 0.0<br/>samples = 2<br/>value = [1.948, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
38 -> 46 ;
47 [label=<age ≤ 26.0<br/>gini = 0.287<br/>samples = 11<br/>value = [1.948, 9.247]<br/>class = Less than $50k>, fillcolor="#63b2ea"] ;
37 -> 47 ;
48 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.974, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
47 -> 48 ;
49 [label=<hours_per_week ≤ 57.5<br/>gini = 0.172<br/>samples = 10<br/>value = [0.974, 9.247]<br/>class = Less than $50k>, fillcolor="#4ea7e8"] ;
47 -> 49 ;
50 [label=<gini = 0.0<br/>samples = 6<br/>value = [0.0, 6.164]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
49 -> 50 ;
51 [label=<occupation_Professional ≤ 0.5<br/>gini = 0.365<br/>samples = 4<br/>value = [0.974, 3.082]<br/>class = Less than $50k>, fillcolor="#78bced"] ;
49 -> 51 ;
52 [label=<gini = 0.0<br/>samples = 3<br/>value = [0.0, 3.082]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
51 -> 52 ;
53 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.974, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
51 -> 53 ;
// ---- False branch of the root (marital_status_Married > 0.5): nodes 54-106 ----
54 [label=<education_School ≤ 0.5<br/>gini = 0.405<br/>samples = 451<br/>value = [128.571, 327.74]<br/>class = Less than $50k>, fillcolor="#87c3ef"] ;
0 -> 54 [labeldistance=2.5, labelangle=-45, headlabel="False"] ;
55 [label=<occupation_White-Collar ≤ 0.5<br/>gini = 0.367<br/>samples = 417<br/>value = [102.273, 320.548]<br/>class = Less than $50k>, fillcolor="#78bced"] ;
54 -> 55 ;
56 [label=<education_HS-grad ≤ 0.5<br/>gini = 0.432<br/>samples = 290<br/>value = [92.532, 200.342]<br/>class = Less than $50k>, fillcolor="#94caf1"] ;
55 -> 56 ;
57 [label=<hours_per_week ≤ 33.5<br/>gini = 0.352<br/>samples = 185<br/>value = [42.857, 144.863]<br/>class = Less than $50k>, fillcolor="#74baed"] ;
56 -> 57 ;
58 [label=<age ≤ 78.0<br/>gini = 0.452<br/>samples = 15<br/>value = [9.74, 5.137]<br/>class = Over $50k>, fillcolor="#f3c3a1"] ;
57 -> 58 ;
59 [label=<occupation_Sales ≤ 0.5<br/>gini = 0.365<br/>samples = 13<br/>value = [9.74, 3.082]<br/>class = Over $50k>, fillcolor="#eda978"] ;
58 -> 59 ;
60 [label=<gini = 0.288<br/>samples = 12<br/>value = [9.74, 2.055]<br/>class = Over $50k>, fillcolor="#ea9c63"] ;
59 -> 60 ;
61 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.0, 1.027]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
59 -> 61 ;
62 [label=<gini = 0.0<br/>samples = 2<br/>value = [0.0, 2.055]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
58 -> 62 ;
63 [label=<age ≤ 24.5<br/>gini = 0.31<br/>samples = 170<br/>value = [33.117, 139.726]<br/>class = Less than $50k>, fillcolor="#68b4eb"] ;
57 -> 63 ;
64 [label=<gini = 0.0<br/>samples = 2<br/>value = [1.948, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
63 -> 64 ;
65 [label=<age ≤ 37.5<br/>gini = 0.298<br/>samples = 168<br/>value = [31.169, 139.726]<br/>class = Less than $50k>, fillcolor="#65b3eb"] ;
63 -> 65 ;
66 [label=<gini = 0.409<br/>samples = 57<br/>value = [16.558, 41.096]<br/>class = Less than $50k>, fillcolor="#89c4ef"] ;
65 -> 66 ;
67 [label=<gini = 0.225<br/>samples = 111<br/>value = [14.61, 98.63]<br/>class = Less than $50k>, fillcolor="#56ace9"] ;
65 -> 67 ;
68 [label=<age ≤ 60.5<br/>gini = 0.498<br/>samples = 105<br/>value = [49.675, 55.479]<br/>class = Less than $50k>, fillcolor="#eaf5fc"] ;
56 -> 68 ;
69 [label=<age ≤ 43.5<br/>gini = 0.491<br/>samples = 92<br/>value = [39.935, 52.397]<br/>class = Less than $50k>, fillcolor="#d0e8f9"] ;
68 -> 69 ;
70 [label=<age ≤ 31.5<br/>gini = 0.494<br/>samples = 53<br/>value = [29.221, 23.63]<br/>class = Over $50k>, fillcolor="#fae7d9"] ;
69 -> 70 ;
71 [label=<gini = 0.436<br/>samples = 15<br/>value = [4.87, 10.274]<br/>class = Less than $50k>, fillcolor="#97cbf1"] ;
70 -> 71 ;
72 [label=<gini = 0.457<br/>samples = 38<br/>value = [24.351, 13.356]<br/>class = Over $50k>, fillcolor="#f3c6a6"] ;
70 -> 72 ;
73 [label=<hours_per_week ≤ 75.0<br/>gini = 0.395<br/>samples = 39<br/>value = [10.714, 28.767]<br/>class = Less than $50k>, fillcolor="#83c2ef"] ;
69 -> 73 ;
74 [label=<gini = 0.378<br/>samples = 38<br/>value = [9.74, 28.767]<br/>class = Less than $50k>, fillcolor="#7cbeee"] ;
73 -> 74 ;
75 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.974, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
73 -> 75 ;
76 [label=<hours_per_week ≤ 62.5<br/>gini = 0.365<br/>samples = 13<br/>value = [9.74, 3.082]<br/>class = Over $50k>, fillcolor="#eda978"] ;
68 -> 76 ;
77 [label=<age ≤ 66.5<br/>gini = 0.288<br/>samples = 12<br/>value = [9.74, 2.055]<br/>class = Over $50k>, fillcolor="#ea9c63"] ;
76 -> 77 ;
78 [label=<gini = 0.188<br/>samples = 10<br/>value = [8.766, 1.027]<br/>class = Over $50k>, fillcolor="#e89050"] ;
77 -> 78 ;
79 [label=<gini = 0.5<br/>samples = 2<br/>value = [0.974, 1.027]<br/>class = Less than $50k>, fillcolor="#f5fafe"] ;
77 -> 79 ;
80 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.0, 1.027]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
76 -> 80 ;
81 [label=<age ≤ 29.0<br/>gini = 0.139<br/>samples = 127<br/>value = [9.74, 120.205]<br/>class = Less than $50k>, fillcolor="#49a5e7"] ;
55 -> 81 ;
82 [label=<hours_per_week ≤ 55.0<br/>gini = 0.452<br/>samples = 6<br/>value = [3.896, 2.055]<br/>class = Over $50k>, fillcolor="#f3c3a1"] ;
81 -> 82 ;
83 [label=<gini = 0.0<br/>samples = 3<br/>value = [2.922, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
82 -> 83 ;
84 [label=<workclass_Private ≤ 0.5<br/>gini = 0.436<br/>samples = 3<br/>value = [0.974, 2.055]<br/>class = Less than $50k>, fillcolor="#97cbf1"] ;
82 -> 84 ;
85 [label=<gini = 0.0<br/>samples = 2<br/>value = [0.0, 2.055]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
84 -> 85 ;
86 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.974, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
84 -> 86 ;
87 [label=<hours_per_week ≤ 63.0<br/>gini = 0.09<br/>samples = 121<br/>value = [5.844, 118.151]<br/>class = Less than $50k>, fillcolor="#43a2e6"] ;
81 -> 87 ;
88 [label=<hours_per_week ≤ 27.5<br/>gini = 0.076<br/>samples = 120<br/>value = [4.87, 118.151]<br/>class = Less than $50k>, fillcolor="#41a1e6"] ;
87 -> 88 ;
89 [label=<hours_per_week ≤ 22.5<br/>gini = 0.436<br/>samples = 3<br/>value = [0.974, 2.055]<br/>class = Less than $50k>, fillcolor="#97cbf1"] ;
88 -> 89 ;
90 [label=<gini = 0.0<br/>samples = 2<br/>value = [0.0, 2.055]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
89 -> 90 ;
91 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.974, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
89 -> 91 ;
92 [label=<education_Some-college ≤ 0.5<br/>gini = 0.063<br/>samples = 117<br/>value = [3.896, 116.096]<br/>class = Less than $50k>, fillcolor="#40a0e6"] ;
88 -> 92 ;
93 [label=<gini = 0.04<br/>samples = 94<br/>value = [1.948, 94.521]<br/>class = Less than $50k>, fillcolor="#3d9fe6"] ;
92 -> 93 ;
94 [label=<gini = 0.152<br/>samples = 23<br/>value = [1.948, 21.575]<br/>class = Less than $50k>, fillcolor="#4ba6e7"] ;
92 -> 94 ;
95 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.974, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
87 -> 95 ;
96 [label=<hours_per_week ≤ 97.5<br/>gini = 0.337<br/>samples = 34<br/>value = [26.299, 7.192]<br/>class = Over $50k>, fillcolor="#eca36f"] ;
54 -> 96 ;
97 [label=<age ≤ 59.0<br/>gini = 0.308<br/>samples = 33<br/>value = [26.299, 6.164]<br/>class = Over $50k>, fillcolor="#eb9f67"] ;
96 -> 97 ;
98 [label=<age ≤ 50.0<br/>gini = 0.395<br/>samples = 23<br/>value = [16.558, 6.164]<br/>class = Over $50k>, fillcolor="#efb083"] ;
97 -> 98 ;
99 [label=<hours_per_week ≤ 42.5<br/>gini = 0.319<br/>samples = 21<br/>value = [16.558, 4.11]<br/>class = Over $50k>, fillcolor="#eba06a"] ;
98 -> 99 ;
100 [label=<age ≤ 31.0<br/>gini = 0.401<br/>samples = 15<br/>value = [10.714, 4.11]<br/>class = Over $50k>, fillcolor="#efb185"] ;
99 -> 100 ;
101 [label=<gini = 0.254<br/>samples = 7<br/>value = [5.844, 1.027]<br/>class = Over $50k>, fillcolor="#ea975c"] ;
100 -> 101 ;
102 [label=<gini = 0.475<br/>samples = 8<br/>value = [4.87, 3.082]<br/>class = Over $50k>, fillcolor="#f5d1b6"] ;
100 -> 102 ;
103 [label=<gini = 0.0<br/>samples = 6<br/>value = [5.844, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
99 -> 103 ;
104 [label=<gini = 0.0<br/>samples = 2<br/>value = [0.0, 2.055]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
98 -> 104 ;
105 [label=<gini = 0.0<br/>samples = 10<br/>value = [9.74, 0.0]<br/>class = Over $50k>, fillcolor="#e58139"] ;
97 -> 105 ;
106 [label=<gini = 0.0<br/>samples = 1<br/>value = [0.0, 1.027]<br/>class = Less than $50k>, fillcolor="#399de5"] ;
96 -> 106 ;
}