rm(list=ls())
We first use classification trees to analyze the Carseats data set. The main goal is to predict the sales of car seats and to find the important features that influence sales.
library (ISLR)
library(plotly)
A data frame with 400 observations on the following 11 variables.
Sales - Unit sales (in thousands) at each location
CompPrice - Price charged by competitor at each location
Income - Community income level (in thousands of dollars)
Advertising - Local advertising budget for company at each location (in thousands of dollars)
Population - Population size in region (in thousands)
Price - Price company charges for car seats at each site
ShelveLoc - A factor with levels Bad, Good and Medium indicating the quality of the shelving location for the car seats at each site
Age - Average age of the local population
Education - Education level at each location
Urban - A factor with levels No and Yes to indicate whether the store is in an urban or rural location
US - A factor with levels No and Yes to indicate whether the store is in the US or not
head(Carseats)
sum(is.na(Carseats))
summary(Carseats)
In these data, Sales is a continuous variable, and so we begin by recoding it as a binary variable. We use the ifelse() function to create a variable, called High, which takes on a value of Yes if the Sales variable exceeds 8, and takes on a value of No otherwise.
attach(Carseats)
# recode Sales as a binary factor: High = "Yes" if Sales > 8, "No" otherwise
Carseats$High <- factor(ifelse(Sales <= 8, "No", "Yes"))
Finally, we use the data.frame()
function to merge High with the rest of
the Carseats
data.
head(Carseats)
plot(Carseats$Price,Carseats$Advertising,col=c("red","blue")[Carseats$High])
plot(Advertising, ShelveLoc, col = c("red", "blue")[Carseats$High])
plot_ly(Carseats, x = ~Price, y = ~Advertising, z = ~ShelveLoc, color = ~High, colors = c('#BF382A', '#0C4B8E')) %>%
add_markers() %>%
layout(scene = list(xaxis = list(title = ''),
yaxis = list(title = ''),
zaxis = list(title = '')))
l <- glm(High~. -Sales, data = Carseats, family=binomial)
summary(l)
exp(0.295)
1-exp(-0.383)
This fitted model says that, holding the other predictors fixed, we expect a $34\%$ increase in the odds of high sales for a one-unit increase in Advertising, since $\exp(0.295) = 1.34$. Similarly, holding the rest at fixed values, the odds of high sales for stores in urban areas (UrbanYes = 1) relative to the odds for non-urban stores are $\exp(-0.383) = 0.68$. In terms of percent change, the odds of high sales for urban stores are about $32\%$ lower than the odds for non-urban stores.
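As a quick check, the odds ratios for every coefficient can be computed directly from the fitted object rather than typed in by hand. The snippet below is only a small sketch using the model l fitted above; confint.default() gives Wald-type intervals, so the intervals are approximate.
exp(coef(l))                # odds ratios for all predictors
exp(confint.default(l))     # approximate 95% Wald confidence intervals on the odds-ratio scale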
set.seed(33)
test.index <- sample(1:nrow(Carseats), size = 150, replace = F)
test <- Carseats[test.index,]
train <- Carseats[-test.index,]
l <- glm(High~. -Sales, data = train, family=binomial)
l.pred <- predict(l, train, type = "response")
l.pred1 <- as.numeric(l.pred > 0.5)
l.table<-table(l.pred1 ,train$High )
l.table
sum(l.pred1)
(139+82)/250
summary.pred <- function(x)
{
  # x is a confusion matrix from table(predicted, actual):
  # rows = predicted class (negative first, positive second), columns = actual class
  FPR <- x[1,2]/sum(x[1,])   # share of predicted-negative cases that are actually positive
  TPR <- x[2,2]/sum(x[2,])   # share of predicted-positive cases that are actually positive
  PPR <- x[2,2]/sum(x[,2])   # share of actual positives that are predicted positive
  NPR <- x[1,1]/sum(x[,1])   # share of actual negatives that are predicted negative
  output <- list("FPR" = round(FPR,2), "TPR" = round(TPR,2),
                 "PPR" = round(PPR,2), "NPR" = round(NPR,2))
  return(output)
}
l.pred.summary<-summary.pred(l.table)
l.pred.summary
l.pred <- predict(l, test, type = "response")
l.pred1 <- as.numeric(l.pred > 0.5)
l.table.test<-table(l.pred1 ,test$High )
l.table.test
(80+56)/150
l.test.pred.summary <- summary.pred(l.table.test)
l.test.pred.summary
We now use the tree() function to fit a classification tree in order to predict High using all variables but Sales. The syntax of the tree() function is quite similar to that of the lm() function.
library(tree)
tree.carseats = tree(High ~ . - Sales, data = Carseats)
summary(tree.carseats)
We see that the training error rate is 9%. For classification trees, the deviance reported in the output of summary() is given by
$$-2 \sum_m \sum_k n_{mk}\log \hat p_{mk}$$
where $n_{mk}$ is the number of observations in the $m$th terminal node that belong to the $k$th class. A small deviance indicates a tree that provides a good fit to the (training) data. The residual mean deviance reported is simply the deviance divided by $n - |T_0|$, which in this case is $400 - 27 = 373$.
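To see where these numbers come from, the deviance can be recomputed by hand from the fitted class probabilities. This is only a sketch, assuming the tree.carseats object fitted on the full Carseats data above; predict() with type="vector" returns the $\hat p_{mk}$ for each observation.
probs <- predict(tree.carseats, Carseats, type = "vector")        # per-observation class probabilities p_mk
obs.class <- as.integer(Carseats$High)                            # column index of each observation's class
dev <- -2 * sum(log(probs[cbind(1:nrow(Carseats), obs.class)]))   # -2 * sum_m sum_k n_mk log p_mk
n.leaves <- sum(tree.carseats$frame$var == "<leaf>")              # number of terminal nodes |T_0|
dev / (nrow(Carseats) - n.leaves)                                 # residual mean deviance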
One of the most attractive properties of trees is that they can be
graphically displayed. We use the plot()
function to display the tree structure,
and the text()
function to display the node labels. The argument
pretty=0
instructs R
to include the category names for any qualitative predictors,
rather than simply displaying a letter for each category.
plot(tree.carseats)
text(tree.carseats, pretty = 0)
The most important indicator of Sales
appears to be shelving location,
since the first branch differentiates Good
locations from Bad
and Medium
locations.
If we just type the name of the tree object, R
prints output corresponding
to each branch of the tree. R
displays the split criterion (e.g. $Price<92.5$), the
number of observations in that branch, the deviance, the overall prediction
for the branch (Yes
or No
), and the fraction of observations in that branch
that take on values of Yes
and No
. Branches that lead to terminal nodes are
indicated using asterisks.
tree.carseats
In order to properly evaluate the performance of a classification tree on
these data, we must estimate the test error rather than simply computing
the training error. We split the observations into a training set and a test
set, build the tree using the training set, and evaluate its performance on
the test data. The predict()
function can be used for this purpose. In the
case of a classification tree, the argument type="class"
instructs R
to return
the actual class prediction. This approach leads to correct predictions for
around $80\%$ of the locations in the test data set.
tree.carseats = tree(High ~ . - Sales, data = train)
tree.pred = predict(tree.carseats, test, type = "class")
t.table <- table(tree.pred, test$High)
t.table
sum(diag(t.table))/sum(t.table)   # overall accuracy on the 150 test observations
t.test.pred.summary<-summary.pred(t.table)
t.test.pred.summary
Next, we consider whether pruning the tree might lead to improved results. The function cv.tree() performs cross-validation in order to determine the optimal level of tree complexity; cost-complexity pruning is used in order to select a sequence of trees for consideration. We use the argument FUN=prune.misclass in order to indicate that we want the classification error rate to guide the cross-validation and pruning process, rather than the default for the cv.tree() function, which is deviance. The cv.tree() function reports the number of terminal nodes of each tree considered (size) as well as the corresponding error rate and the value of the cost-complexity parameter used (k, which corresponds to $\alpha$; see the formula in the lecture notes).
set.seed(3)
cv.carseats = cv.tree(tree.carseats, FUN = prune.misclass)
names(cv.carseats )
cv.carseats
Note that, despite the name, dev
corresponds to the cross-validation error
rate in this instance. The tree with $9$ terminal nodes results in the lowest
cross-validation error rate, with $50$ cross-validation errors. We plot the error rate as a function of both size and $k$.
par(mfrow =c(1,2))
plot(cv.carseats$size ,cv.carseats$dev ,type="b")
plot(cv.carseats$k ,cv.carseats$dev ,type="b")
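Rather than reading the best size off the plot, it can also be extracted programmatically. This is a small optional sketch using only the cv.carseats object computed above.
best.size <- cv.carseats$size[which.min(cv.carseats$dev)]   # tree size with the fewest CV misclassifications
best.size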
We now apply the prune.misclass() function in order to prune the tree; below we request the best subtree with five terminal nodes (best = 5).
prune.carseats = prune.misclass(tree.carseats, best = 5)
plot(prune.carseats)
text(prune.carseats, pretty = 0)
How well does this pruned tree perform on the test data set? Once again,
we apply the predict()
function.
tree.pred = predict(prune.carseats, test, type = "class")
t.table <- table(tree.pred, test$High)
t.table
(64+49)/150
t.test.pred.summary<-summary.pred(t.table)
t.test.pred.summary
Now $75\%$ of the test observations are correctly classified: the pruning process has produced a much smaller and more interpretable tree, with test classification accuracy comparable to that of the full tree.
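Because the name t.table is reused above for both the unpruned and the pruned tree, a quick way to compare the two on the same footing is to recompute both test accuracies in one step. This is only an optional sketch reusing objects defined earlier (tree.carseats fitted on train, prune.carseats, and test).
unpruned.acc <- mean(predict(tree.carseats, test, type = "class") == test$High)
pruned.acc <- mean(predict(prune.carseats, test, type = "class") == test$High)
c(unpruned = unpruned.acc, pruned = pruned.acc)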
dim(train)
Finally, we apply bagging and random forests to these data, using the randomForest package. Recall that bagging is simply a special case of a random forest in which mtry equals the number of predictors; excluding Sales, there are 10 predictors here.
library(randomForest)
set.seed(1)
bag.model = randomForest(High ~ . - Sales, data = train,
                         mtry = 10, importance = TRUE)
bag.model
bag.pred = predict(bag.model, newdata = test)
b.table <- table(bag.pred, test$High)
b.table
sum(diag(b.table))/sum(b.table)   # overall test accuracy for bagging
b.test.pred.summary<-summary.pred(b.table)
b.test.pred.summary
For a random forest we consider only a subset of the predictors at each split; here we use mtry = 4.
set.seed(1)
rf.model = randomForest(High ~ . - Sales, data = train,
                        mtry = 4, importance = TRUE)
rf.model
pred.rf = predict(rf.model, newdata = test)
rf.table <- table(pred.rf, test$High)
rf.table
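Since the stated goal is also to find the important features that influence sales, we can inspect the variable-importance measures computed because importance = TRUE was set. The closing snippet below is only a sketch that follows the same pattern as the earlier models; importance() and varImpPlot() are standard randomForest functions.
sum(diag(rf.table))/sum(rf.table)                # overall test accuracy for the random forest
rf.test.pred.summary <- summary.pred(rf.table)   # same summary measures as for the earlier models
rf.test.pred.summary
importance(rf.model)    # mean decrease in accuracy and in Gini index for each predictor
varImpPlot(rf.model)    # plot the two importance measures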