# Regression-tree analysis of LPGA 2008 data: models lnprz as a function of
# dist, fairway, green, putts and sandsv with rpart, compares two pruned
# versions of the tree by R-squared, and fits the same model by OLS.

# install.packages("rpart")
library(rpart)

# Data ----

lpga <- read.csv(
  "http://www.stat.ufl.edu/~winner/sta4210/mydata/lpga2008.csv",
  header = TRUE
)
# Columns are referenced explicitly through `lpga` below instead of attach(),
# so nothing in this script depends on the state of the search path.
names(lpga)

# Helpers ----

# Draw an rpart tree with the layout settings used throughout this script and
# label its nodes.
plot_tree <- function(tree) {
  plot(tree, compress = TRUE, uniform = TRUE, branch = 0.4, margin = 0.10)
  text(tree)
  invisible(tree)
}

# R-squared of a fitted model against the observed response `y`:
# 1 - (residual sum of squares) / (total sum of squares about the mean).
r_squared <- function(fit, y) {
  1 - sum(residuals(fit)^2) / sum((y - mean(y))^2)
}

# Full tree ----

lpgatree1 <- rpart(
  lnprz ~ dist + fairway + green + putts + sandsv,
  data = lpga,
  method = "anova"
)
lpgatree1
plot_tree(lpgatree1)
printcp(lpgatree1)

# Pruned trees ----

# Complexity-parameter thresholds used for pruning.
# NOTE(review): presumably read off the printcp() table above; confirm they
# still match if the data or the model formula changes.
cp_tree2 <- 0.010561
cp_tree3 <- 0.027677

lpgatree2 <- prune(lpgatree1, cp = cp_tree2)
plot_tree(lpgatree2)
r_squared(lpgatree2, lpga$lnprz)

lpgatree3 <- prune(lpgatree1, cp = cp_tree3)
plot_tree(lpgatree3)
r_squared(lpgatree3, lpga$lnprz)

# OLS comparison ----

lpgaols1 <- lm(lnprz ~ dist + fairway + green + putts + sandsv, data = lpga)
summary(lpgaols1)