# Model specification: `income` is the response and the eleven columns on the
# right-hand side are the predictors. Written as a formula literal rather than
# a string handed to as.formula(), so the terms are validated by the parser
# and the expression can be wrapped to a readable width.
form <- income ~ age + workclass + education + marital.status + occupation +
  relationship + race + sex + capital.gain + capital.loss + hours.per.week

# Fit a tree with rpart() on `train` (defined outside this section), leaving
# every other rpart() argument at its default.
mod_tree <- rpart(form, data = train)

# Auto-print the fitted tree; the recorded output follows.
mod_tree
## n= 26049
##
## node), split, n, loss, yval, (yprob)
## * denotes terminal node
##
## 1) root 26049 6317 <=50K (0.75749549 0.24250451)
## 2) relationship=Not-in-family,Other-relative,Own-child,Unmarried 14196 947 <=50K (0.93329107 0.06670893)
## 4) capital.gain< 7073.5 13946 706 <=50K (0.94937617 0.05062383) *
## 5) capital.gain>=7073.5 250 9 >50K (0.03600000 0.96400000) *
## 3) relationship=Husband,Wife 11853 5370 <=50K (0.54695014 0.45304986)
## 6) education=10th,11th,12th,1st-4th,5th-6th,7th-8th,9th,Assoc-acdm,Assoc-voc,HS-grad,Preschool,Some-college 8280 2769 <=50K (0.66557971 0.33442029)
## 12) capital.gain< 5095.5 7857 2355 <=50K (0.70026728 0.29973272) *
## 13) capital.gain>=5095.5 423 9 >50K (0.02127660 0.97872340) *
## 7) education=Bachelors,Doctorate,Masters,Prof-school 3573 972 >50K (0.27204030 0.72795970) *