Reading the file

setwd("E:/Great Lakes/Data Mining/Assignment")
ploan <- read.csv("PL_XSELL.csv",header=TRUE)

converting to factor data type

ploan$FLG_HAS_ANY_CHGS <- as.factor(ploan$FLG_HAS_ANY_CHGS)
ploan$FLG_HAS_CC <- as.factor(ploan$FLG_HAS_CC)
ploan$FLG_HAS_NOMINEE <- as.factor(ploan$FLG_HAS_NOMINEE)
ploan$FLG_HAS_OLD_LOAN <- as.factor(ploan$FLG_HAS_OLD_LOAN)
ploan$ACC_OP_DATE <- as.Date(ploan$ACC_OP_DATE, format = "%m/%d/%Y")

checking for missing values

library(VIM)
## Warning: package 'VIM' was built under R version 3.4.3
## Loading required package: colorspace
## Loading required package: grid
## Loading required package: data.table
## Warning: package 'data.table' was built under R version 3.4.3
## VIM is ready to use. 
##  Since version 4.0.0 the GUI is in its own package VIMGUI.
## 
##           Please use the package to use the new (and old) GUI.
## Suggestions and bug-reports can be submitted at: https://github.com/alexkowa/VIM/issues
## 
## Attaching package: 'VIM'
## The following object is masked from 'package:datasets':
## 
##     sleep
aggr(ploan,prop = F,cex.axis = 0.4,numbers=T)

feature engineering

quantile(ploan$BALANCE)
##         0%        25%        50%        75%       100% 
##       0.00   64754.03  231675.85  653876.85 8360430.57
ploan$LOW_BAL <- ifelse(ploan$BALANCE < 231676 ,0,1)
lowbal<- ifelse (ploan$LOW_BAL == 0 & ploan$TARGET == 1,1,0)
totbal <- sum(lowbal)
prebal <- (totbal/2512)*100
quantile(ploan$HOLDING_PERIOD)
##   0%  25%  50%  75% 100% 
##    1    7   15   22   31
ploan$LOW_BAL <- as.factor(ploan$LOW_BAL)

ploan$LOW_HOLD <- ifelse(ploan$HOLDING_PERIOD < 15 ,0,1)
lowhold <- ifelse (ploan$LOW_HOLD == 0 & ploan$TARGET == 1,1,0)
tothold <- sum(lowhold)
prehold <- (tothold/2512)*100
ploan$LOW_HOLD <- as.factor(ploan$LOW_HOLD)

response rate

resprate <- (sum(ploan$TARGET)/nrow(ploan))* 100
resprate
## [1] 12.56

descriptive stastics

summary(ploan)
##     CUST_ID          TARGET            AGE        GENDER   
##  C1     :    1   Min.   :0.0000   Min.   :21.00   F: 5433  
##  C10    :    1   1st Qu.:0.0000   1st Qu.:30.00   M:14376  
##  C100   :    1   Median :0.0000   Median :38.00   O:  191  
##  C1000  :    1   Mean   :0.1256   Mean   :38.42            
##  C10000 :    1   3rd Qu.:0.0000   3rd Qu.:46.00            
##  C10001 :    1   Max.   :1.0000   Max.   :55.00            
##  (Other):19994                                             
##     BALANCE           OCCUPATION    AGE_BKT          SCR       
##  Min.   :      0   PROF    :5417   <25  :1753   Min.   :100.0  
##  1st Qu.:  64754   SAL     :5855   >50  :3035   1st Qu.:227.0  
##  Median : 231676   SELF-EMP:3568   26-30:3434   Median :364.0  
##  Mean   : 511362   SENP    :5160   31-35:3404   Mean   :440.2  
##  3rd Qu.: 653877                   36-40:2814   3rd Qu.:644.0  
##  Max.   :8360431                   41-45:3067   Max.   :999.0  
##                                    46-50:2493                  
##  HOLDING_PERIOD  ACC_TYPE    ACC_OP_DATE         LEN_OF_RLTN_IN_MNTH
##  Min.   : 1.00   CA: 4241   Min.   :1999-01-02   Min.   : 29.0      
##  1st Qu.: 7.00   SA:15759   1st Qu.:2003-01-26   1st Qu.: 79.0      
##  Median :15.00              Median :2006-12-23   Median :125.0      
##  Mean   :14.96              Mean   :2006-12-25   Mean   :125.2      
##  3rd Qu.:22.00              3rd Qu.:2010-11-16   3rd Qu.:172.0      
##  Max.   :31.00              Max.   :2015-01-01   Max.   :221.0      
##                                                                     
##  NO_OF_L_CR_TXNS NO_OF_L_DR_TXNS  TOT_NO_OF_L_TXNS
##  Min.   : 0.00   Min.   : 0.000   Min.   :  0.00  
##  1st Qu.: 6.00   1st Qu.: 2.000   1st Qu.:  9.00  
##  Median :10.00   Median : 5.000   Median : 14.00  
##  Mean   :12.35   Mean   : 6.634   Mean   : 18.98  
##  3rd Qu.:14.00   3rd Qu.: 7.000   3rd Qu.: 21.00  
##  Max.   :75.00   Max.   :74.000   Max.   :149.00  
##                                                   
##  NO_OF_BR_CSH_WDL_DR_TXNS NO_OF_ATM_DR_TXNS NO_OF_NET_DR_TXNS
##  Min.   : 0.000           Min.   : 0.000    Min.   : 0.000   
##  1st Qu.: 1.000           1st Qu.: 0.000    1st Qu.: 0.000   
##  Median : 1.000           Median : 1.000    Median : 0.000   
##  Mean   : 1.883           Mean   : 1.029    Mean   : 1.172   
##  3rd Qu.: 2.000           3rd Qu.: 1.000    3rd Qu.: 1.000   
##  Max.   :15.000           Max.   :25.000    Max.   :22.000   
##                                                              
##  NO_OF_MOB_DR_TXNS NO_OF_CHQ_DR_TXNS FLG_HAS_CC   AMT_ATM_DR    
##  Min.   : 0.0000   Min.   : 0.000    0:13892    Min.   :     0  
##  1st Qu.: 0.0000   1st Qu.: 0.000    1: 6108    1st Qu.:     0  
##  Median : 0.0000   Median : 2.000               Median :  6900  
##  Mean   : 0.4118   Mean   : 2.138               Mean   : 10990  
##  3rd Qu.: 0.0000   3rd Qu.: 4.000               3rd Qu.: 15800  
##  Max.   :25.0000   Max.   :15.000               Max.   :199300  
##                                                                 
##  AMT_BR_CSH_WDL_DR   AMT_CHQ_DR        AMT_NET_DR       AMT_MOB_DR    
##  Min.   :     0    Min.   :      0   Min.   :     0   Min.   :     0  
##  1st Qu.:  2990    1st Qu.:      0   1st Qu.:     0   1st Qu.:     0  
##  Median :340150    Median :  23840   Median :     0   Median :     0  
##  Mean   :378475    Mean   : 124520   Mean   :237308   Mean   : 22425  
##  3rd Qu.:674675    3rd Qu.:  72470   3rd Qu.:473971   3rd Qu.:     0  
##  Max.   :999930    Max.   :4928640   Max.   :999854   Max.   :199667  
##                                                                       
##     AMT_L_DR       FLG_HAS_ANY_CHGS AMT_OTH_BK_ATM_USG_CHGS
##  Min.   :      0   0:17788          Min.   :  0.000        
##  1st Qu.: 237936   1: 2212          1st Qu.:  0.000        
##  Median : 695115                    Median :  0.000        
##  Mean   : 773717                    Mean   :  1.099        
##  3rd Qu.:1078927                    3rd Qu.:  0.000        
##  Max.   :6514921                    Max.   :250.000        
##                                                            
##  AMT_MIN_BAL_NMC_CHGS NO_OF_IW_CHQ_BNC_TXNS NO_OF_OW_CHQ_BNC_TXNS
##  Min.   :  0.000      Min.   :0.00000       Min.   :0.0000       
##  1st Qu.:  0.000      1st Qu.:0.00000       1st Qu.:0.0000       
##  Median :  0.000      Median :0.00000       Median :0.0000       
##  Mean   :  1.292      Mean   :0.04275       Mean   :0.0444       
##  3rd Qu.:  0.000      3rd Qu.:0.00000       3rd Qu.:0.0000       
##  Max.   :170.000      Max.   :2.00000       Max.   :2.0000       
##                                                                  
##  AVG_AMT_PER_ATM_TXN AVG_AMT_PER_CSH_WDL_TXN AVG_AMT_PER_CHQ_TXN
##  Min.   :    0       Min.   :     0          Min.   :     0     
##  1st Qu.:    0       1st Qu.:  1266          1st Qu.:     0     
##  Median : 6000       Median :147095          Median :  8645     
##  Mean   : 7409       Mean   :242237          Mean   : 25093     
##  3rd Qu.:13500       3rd Qu.:385000          3rd Qu.: 28605     
##  Max.   :25000       Max.   :999640          Max.   :537842     
##                                                                 
##  AVG_AMT_PER_NET_TXN AVG_AMT_PER_MOB_TXN FLG_HAS_NOMINEE FLG_HAS_OLD_LOAN
##  Min.   :     0      Min.   :     0      0: 1977         0:10141         
##  1st Qu.:     0      1st Qu.:     0      1:18023         1: 9859         
##  Median :     0      Median :     0                                      
##  Mean   :179059      Mean   : 20304                                      
##  3rd Qu.:257699      3rd Qu.:     0                                      
##  Max.   :999854      Max.   :199667                                      
##                                                                          
##      random          LOW_BAL   LOW_HOLD 
##  Min.   :0.0000114   0:10000   0: 9726  
##  1st Qu.:0.2481866   1:10000   1:10274  
##  Median :0.5061214                      
##  Mean   :0.5019330                      
##  3rd Qu.:0.7535712                      
##  Max.   :0.9999471                      
## 
str(ploan)
## 'data.frame':    20000 obs. of  42 variables:
##  $ CUST_ID                 : Factor w/ 20000 levels "C1","C10","C100",..: 17699 16532 11027 17984 2363 11747 18115 15556 15216 12494 ...
##  $ TARGET                  : int  0 0 0 0 0 0 0 0 0 0 ...
##  $ AGE                     : int  27 47 40 53 36 42 30 53 42 30 ...
##  $ GENDER                  : Factor w/ 3 levels "F","M","O": 2 2 2 2 2 1 2 1 1 2 ...
##  $ BALANCE                 : num  3384 287489 18217 71720 1671623 ...
##  $ OCCUPATION              : Factor w/ 4 levels "PROF","SAL","SELF-EMP",..: 3 2 3 2 1 1 1 2 3 1 ...
##  $ AGE_BKT                 : Factor w/ 7 levels "<25",">50","26-30",..: 3 7 5 2 5 6 3 2 6 3 ...
##  $ SCR                     : int  776 324 603 196 167 493 479 562 105 170 ...
##  $ HOLDING_PERIOD          : int  30 28 2 13 24 26 14 25 15 13 ...
##  $ ACC_TYPE                : Factor w/ 2 levels "CA","SA": 2 2 2 1 2 2 2 1 2 2 ...
##  $ ACC_OP_DATE             : Date, format: "2005-03-23" "2008-10-11" ...
##  $ LEN_OF_RLTN_IN_MNTH     : int  146 104 61 107 185 192 177 99 88 111 ...
##  $ NO_OF_L_CR_TXNS         : int  7 8 10 36 20 5 6 14 18 14 ...
##  $ NO_OF_L_DR_TXNS         : int  3 2 5 14 1 2 6 3 14 8 ...
##  $ TOT_NO_OF_L_TXNS        : int  10 10 15 50 21 7 12 17 32 22 ...
##  $ NO_OF_BR_CSH_WDL_DR_TXNS: int  0 0 1 4 1 1 0 3 6 3 ...
##  $ NO_OF_ATM_DR_TXNS       : int  1 1 1 2 0 1 1 0 2 1 ...
##  $ NO_OF_NET_DR_TXNS       : int  2 1 1 3 0 0 1 0 4 0 ...
##  $ NO_OF_MOB_DR_TXNS       : int  0 0 0 1 0 0 0 0 1 0 ...
##  $ NO_OF_CHQ_DR_TXNS       : int  0 0 2 4 0 0 4 0 1 4 ...
##  $ FLG_HAS_CC              : Factor w/ 2 levels "0","1": 1 1 1 1 1 2 1 1 2 1 ...
##  $ AMT_ATM_DR              : int  13100 6600 11200 26100 0 18500 6200 0 35400 18000 ...
##  $ AMT_BR_CSH_WDL_DR       : int  0 0 561120 673590 808480 379310 0 945160 198430 869880 ...
##  $ AMT_CHQ_DR              : int  0 0 49320 60780 0 0 10580 0 51490 32610 ...
##  $ AMT_NET_DR              : num  973557 799813 997570 741506 0 ...
##  $ AMT_MOB_DR              : int  0 0 0 71388 0 0 0 0 170332 0 ...
##  $ AMT_L_DR                : num  986657 806413 1619210 1573364 808480 ...
##  $ FLG_HAS_ANY_CHGS        : Factor w/ 2 levels "0","1": 1 2 2 1 1 1 2 1 1 1 ...
##  $ AMT_OTH_BK_ATM_USG_CHGS : int  0 0 0 0 0 0 0 0 0 0 ...
##  $ AMT_MIN_BAL_NMC_CHGS    : int  0 0 0 0 0 0 0 0 0 0 ...
##  $ NO_OF_IW_CHQ_BNC_TXNS   : int  0 0 0 0 0 0 0 0 0 0 ...
##  $ NO_OF_OW_CHQ_BNC_TXNS   : int  0 0 1 0 0 0 0 0 0 0 ...
##  $ AVG_AMT_PER_ATM_TXN     : num  13100 6600 11200 13050 0 ...
##  $ AVG_AMT_PER_CSH_WDL_TXN : num  0 0 561120 168398 808480 ...
##  $ AVG_AMT_PER_CHQ_TXN     : num  0 0 24660 15195 0 ...
##  $ AVG_AMT_PER_NET_TXN     : num  486779 799813 997570 247169 0 ...
##  $ AVG_AMT_PER_MOB_TXN     : num  0 0 0 71388 0 ...
##  $ FLG_HAS_NOMINEE         : Factor w/ 2 levels "0","1": 2 2 2 2 2 2 1 2 2 1 ...
##  $ FLG_HAS_OLD_LOAN        : Factor w/ 2 levels "0","1": 2 1 2 1 1 2 2 2 2 1 ...
##  $ random                  : num  1.14e-05 1.11e-04 1.20e-04 1.37e-04 1.74e-04 ...
##  $ LOW_BAL                 : Factor w/ 2 levels "0","1": 1 2 1 1 2 2 1 1 1 2 ...
##  $ LOW_HOLD                : Factor w/ 2 levels "0","1": 2 2 1 1 2 2 1 2 2 1 ...
dim(ploan)
## [1] 20000    42
library(psych)
describe(ploan)
## Warning in FUN(newX[, i], ...): no non-missing arguments to min; returning
## Inf
## Warning in FUN(newX[, i], ...): no non-missing arguments to max; returning
## -Inf
##                          vars     n      mean        sd    median
## CUST_ID*                    1 20000  10000.50   5773.65  10000.50
## TARGET                      2 20000      0.13      0.33      0.00
## AGE                         3 20000     38.42      9.58     38.00
## GENDER*                     4 20000      1.74      0.46      2.00
## BALANCE                     5 20000 511362.19 723592.96 231675.85
## OCCUPATION*                 6 20000      2.42      1.14      2.00
## AGE_BKT*                    7 20000      4.08      1.85      4.00
## SCR                         8 20000    440.15    249.89    364.00
## HOLDING_PERIOD              9 20000     14.96      8.64     15.00
## ACC_TYPE*                  10 20000      1.79      0.41      2.00
## ACC_OP_DATE*               11 20000       NaN        NA        NA
## LEN_OF_RLTN_IN_MNTH        12 20000    125.24     54.95    125.00
## NO_OF_L_CR_TXNS            13 20000     12.35     12.15     10.00
## NO_OF_L_DR_TXNS            14 20000      6.63      7.68      5.00
## TOT_NO_OF_L_TXNS           15 20000     18.98     17.76     14.00
## NO_OF_BR_CSH_WDL_DR_TXNS   16 20000      1.88      2.26      1.00
## NO_OF_ATM_DR_TXNS          17 20000      1.03      1.50      1.00
## NO_OF_NET_DR_TXNS          18 20000      1.17      2.40      0.00
## NO_OF_MOB_DR_TXNS          19 20000      0.41      2.01      0.00
## NO_OF_CHQ_DR_TXNS          20 20000      2.14      2.38      2.00
## FLG_HAS_CC*                21 20000      1.31      0.46      1.00
## AMT_ATM_DR                 22 20000  10990.01  15304.89   6900.00
## AMT_BR_CSH_WDL_DR          23 20000 378474.48 331417.73 340150.00
## AMT_CHQ_DR                 24 20000 124520.01 439379.54  23840.00
## AMT_NET_DR                 25 20000 237307.77 319067.66      0.00
## AMT_MOB_DR                 26 20000  22424.70  49484.80      0.00
## AMT_L_DR                   27 20000 773716.97 712659.17 695115.00
## FLG_HAS_ANY_CHGS*          28 20000      1.11      0.31      1.00
## AMT_OTH_BK_ATM_USG_CHGS    29 20000      1.10     14.22      0.00
## AMT_MIN_BAL_NMC_CHGS       30 20000      1.29     14.76      0.00
## NO_OF_IW_CHQ_BNC_TXNS      31 20000      0.04      0.20      0.00
## NO_OF_OW_CHQ_BNC_TXNS      32 20000      0.04      0.21      0.00
## AVG_AMT_PER_ATM_TXN        33 20000   7408.84   7210.17   6000.00
## AVG_AMT_PER_CSH_WDL_TXN    34 20000 242236.48 269837.89 147095.00
## AVG_AMT_PER_CHQ_TXN        35 20000  25092.48  49387.20   8645.00
## AVG_AMT_PER_NET_TXN        36 20000 179059.03 281706.86      0.00
## AVG_AMT_PER_MOB_TXN        37 20000  20303.92  46472.89      0.00
## FLG_HAS_NOMINEE*           38 20000      1.90      0.30      2.00
## FLG_HAS_OLD_LOAN*          39 20000      1.49      0.50      1.00
## random                     40 20000      0.50      0.29      0.51
## LOW_BAL*                   41 20000      1.50      0.50      1.50
## LOW_HOLD*                  42 20000      1.51      0.50      2.00
##                            trimmed       mad min       max     range  skew
## CUST_ID*                  10000.50   7413.00   1   20000.0   19999.0  0.00
## TARGET                        0.03      0.00   0       1.0       1.0  2.26
## AGE                          38.33     11.86  21      55.0      34.0  0.09
## GENDER*                       1.79      0.00   1       3.0       2.0 -0.79
## BALANCE                  353637.08 294970.24   0 8360430.6 8360430.6  2.78
## OCCUPATION*                   2.40      1.48   1       4.0       3.0  0.16
## AGE_BKT*                      4.09      2.97   1       7.0       6.0  0.02
## SCR                         420.92    262.42 100     999.0     899.0  0.56
## HOLDING_PERIOD               14.84     10.38   1      31.0      30.0  0.07
## ACC_TYPE*                     1.86      0.00   1       2.0       1.0 -1.41
## ACC_OP_DATE*                   NaN        NA Inf      -Inf      -Inf    NA
## LEN_OF_RLTN_IN_MNTH         125.26     69.68  29     221.0     192.0  0.00
## NO_OF_L_CR_TXNS              10.01      5.93   0      75.0      75.0  2.46
## NO_OF_L_DR_TXNS               5.21      2.97   0      74.0      74.0  3.92
## TOT_NO_OF_L_TXNS             15.77      8.90   0     149.0     149.0  2.81
## NO_OF_BR_CSH_WDL_DR_TXNS      1.42      1.48   0      15.0      15.0  2.34
## NO_OF_ATM_DR_TXNS             0.87      1.48   0      25.0      25.0  8.47
## NO_OF_NET_DR_TXNS             0.60      0.00   0      22.0      22.0  4.24
## NO_OF_MOB_DR_TXNS             0.16      0.00   0      25.0      25.0 11.02
## NO_OF_CHQ_DR_TXNS             1.75      2.97   0      15.0      15.0  1.56
## FLG_HAS_CC*                   1.26      0.00   1       2.0       1.0  0.84
## AMT_ATM_DR                 7968.07  10229.94   0  199300.0  199300.0  3.65
## AMT_BR_CSH_WDL_DR        356596.13 497871.91   0  999930.0  999930.0  0.31
## AMT_CHQ_DR                33171.50  35345.18   0 4928640.0 4928640.0  7.18
## AMT_NET_DR               185143.02      0.00   0  999854.0  999854.0  1.00
## AMT_MOB_DR                 8796.85      0.00   0  199667.0  199667.0  2.16
## AMT_L_DR                 689894.96 628954.50   0 6514921.0 6514921.0  2.53
## FLG_HAS_ANY_CHGS*             1.01      0.00   1       2.0       1.0  2.48
## AMT_OTH_BK_ATM_USG_CHGS       0.00      0.00   0     250.0     250.0 14.07
## AMT_MIN_BAL_NMC_CHGS          0.00      0.00   0     170.0     170.0 11.34
## NO_OF_IW_CHQ_BNC_TXNS         0.00      0.00   0       2.0       2.0  4.57
## NO_OF_OW_CHQ_BNC_TXNS         0.00      0.00   0       2.0       2.0  4.44
## AVG_AMT_PER_ATM_TXN        6714.08   8895.60   0   25000.0   25000.0  0.51
## AVG_AMT_PER_CSH_WDL_TXN  197101.27 218083.05   0  999640.0  999640.0  1.14
## AVG_AMT_PER_CHQ_TXN       14036.18  12817.08   0  537842.2  537842.2  4.52
## AVG_AMT_PER_NET_TXN      118388.89      0.00   0  999854.0  999854.0  1.50
## AVG_AMT_PER_MOB_TXN        7187.16      0.00   0  199667.0  199667.0  2.34
## FLG_HAS_NOMINEE*              2.00      0.00   1       2.0       1.0 -2.69
## FLG_HAS_OLD_LOAN*             1.49      0.00   1       2.0       1.0  0.03
## random                        0.50      0.37   0       1.0       1.0 -0.02
## LOW_BAL*                      1.50      0.74   1       2.0       1.0  0.00
## LOW_HOLD*                     1.52      0.00   1       2.0       1.0 -0.05
##                          kurtosis      se
## CUST_ID*                    -1.20   40.83
## TARGET                       3.10    0.00
## AGE                         -1.16    0.07
## GENDER*                     -0.61    0.00
## BALANCE                     10.61 5116.57
## OCCUPATION*                 -1.39    0.01
## AGE_BKT*                    -1.12    0.01
## SCR                         -0.94    1.77
## HOLDING_PERIOD              -1.10    0.06
## ACC_TYPE*                   -0.02    0.00
## ACC_OP_DATE*                   NA      NA
## LEN_OF_RLTN_IN_MNTH         -1.18    0.39
## NO_OF_L_CR_TXNS              7.05    0.09
## NO_OF_L_DR_TXNS             23.77    0.05
## TOT_NO_OF_L_TXNS            11.87    0.13
## NO_OF_BR_CSH_WDL_DR_TXNS     6.46    0.02
## NO_OF_ATM_DR_TXNS          102.86    0.01
## NO_OF_NET_DR_TXNS           25.25    0.02
## NO_OF_MOB_DR_TXNS          126.87    0.01
## NO_OF_CHQ_DR_TXNS            3.07    0.02
## FLG_HAS_CC*                 -1.29    0.00
## AMT_ATM_DR                  25.73  108.22
## AMT_BR_CSH_WDL_DR           -1.32 2343.48
## AMT_CHQ_DR                  59.45 3106.88
## AMT_NET_DR                  -0.49 2256.15
## AMT_MOB_DR                   3.39  349.91
## AMT_L_DR                    12.74 5039.26
## FLG_HAS_ANY_CHGS*            4.17    0.00
## AMT_OTH_BK_ATM_USG_CHGS    206.79    0.10
## AMT_MIN_BAL_NMC_CHGS       126.57    0.10
## NO_OF_IW_CHQ_BNC_TXNS       19.27    0.00
## NO_OF_OW_CHQ_BNC_TXNS       17.83    0.00
## AVG_AMT_PER_ATM_TXN         -1.05   50.98
## AVG_AMT_PER_CSH_WDL_TXN      0.30 1908.04
## AVG_AMT_PER_CHQ_TXN         27.72  349.22
## AVG_AMT_PER_NET_TXN          0.92 1991.97
## AVG_AMT_PER_MOB_TXN          4.36  328.61
## FLG_HAS_NOMINEE*             5.23    0.00
## FLG_HAS_OLD_LOAN*           -2.00    0.00
## random                      -1.21    0.00
## LOW_BAL*                    -2.00    0.00
## LOW_HOLD*                   -2.00    0.00
par(mfrow=c(2, 2), oma=c(0,0,3,0))
plot(ploan$BALANCE ~ ploan$TARGET,xlab='TARGET', ylab='BALANCE')
plot(ploan$SCR~ ploan$TARGET,xlab='TARGET', ylab='SCR')
plot(ploan$TOT_NO_OF_L_TXNS ~ ploan$TARGET,xlab='TARGET', ylab='NO_OF_ATM_DR_TXNS')
plot(ploan$NO_OF_ATM_DR_TXNS ~ ploan$TARGET,xlab='TARGET', ylab='TOT_NO_OF_L_TXNS')

plot(ploan$NO_OF_NET_DR_TXNS ~ ploan$TARGET,xlab='TARGET', ylab='NO_OF_NET_DR_TXNS')
plot(ploan$NO_OF_CHQ_DR_TXNS ~ ploan$TARGET,xlab='TARGET', ylab='NO_OF_CHQ_DR_TXNS')
plot(ploan$NO_OF_L_CR_TXNS ~ ploan$TARGET,xlab='TARGET', ylab='NO_OF_L_CR_TXNS')
plot(ploan$HOLDING_PERIOD ~ ploan$TARGET,xlab='TARGET', ylab='HOLDING_PERIOD')

plot(ploan$NO_OF_L_DR_TXNS ~ ploan$TARGET,xlab='TARGET', ylab='NO_OF_L_DR_TXNS')
plot(ploan$AMT_L_DR ~ ploan$TARGET,xlab='TARGET', ylab='AMT_L_DR')
plot(ploan$AMT_BR_CSH_WDL_DR ~ ploan$TARGET,xlab='TARGET', ylab='AMT_BR_CSH_WDL_DR')
plot(ploan$OCCUPATION ~ ploan$TARGET,xlab='TARGET', ylab='OCCUPATION')

plot(ploan$AGE_BKT ~ ploan$TARGET,xlab='TARGET', ylab='AGE_BKT')
plot(ploan$FLG_HAS_CC ~ ploan$TARGET,xlab='TARGET', ylab='FLG_HAS_CC')
plot(ploan$GENDER ~ ploan$TARGET,xlab='TARGET', ylab='GENDER')
plot(ploan$TOT_NO_OF_L_TXNS ~ ploan$TARGET,xlab='TARGET', ylab='TOT_NO_OF_L_TXNS')

boxplot(ploan$BALANCE,main ="BALANCE")
boxplot(ploan$SCR,main ="SCR")
boxplot(ploan$TOT_NO_OF_L_TXNS,main ="TOT_NO_OF_L_TXNS")
boxplot(ploan$NO_OF_L_CR_TXNS,main = "NO_OF_L_CR_TXNS")

boxplot(ploan$NO_OF_ATM_DR_TXNS,main = "NO_OF_ATM_DR_TXNS")
boxplot(ploan$NO_OF_NET_DR_TXNS,main = "NO_OF_NET_DR_TXNS")
boxplot(ploan$NO_OF_CHQ_DR_TXNS,main = "NO_OF_CHQ_DR_TXNS ")
boxplot(ploan$NO_OF_L_CR_TXNS,main = "NO_OF_L_CR_TXNS")

hist(ploan$BALANCE,main ="BALANCE", xlab=NA, ylab=NA)
hist(ploan$SCR,main ="SCR", xlab=NA, ylab=NA)
hist(ploan$TOT_NO_OF_L_TXNS,main ="TOT_NO_OF_L_TXNS", xlab=NA, ylab=NA)
hist(ploan$NO_OF_L_CR_TXNS,main = "NO_OF_L_CR_TXNS", xlab=NA, ylab=NA)

hist(ploan$NO_OF_ATM_DR_TXNS,main ="NO_OF_ATM_DR_TXNS", xlab=NA, ylab=NA)
hist(ploan$NO_OF_NET_DR_TXNS,main ="NO_OF_NET_DR_TXNS", xlab=NA, ylab=NA)
hist(ploan$NO_OF_NET_DR_TXNS,main ="NO_OF_NET_DR_TXNS", xlab=NA, ylab=NA)
hist(ploan$NO_OF_L_CR_TXNS,main ="NO_OF_L_CR_TXNS", xlab=NA, ylab=NA)

boxplot(ploan$HOLDING_PERIOD,main="HOLDING_PERIOD")
boxplot(ploan$NO_OF_L_DR_TXNS,main="NO_OF_L_DR_TXNS")
boxplot(ploan$AMT_L_DR,main="AMT_L_DR")
boxplot(ploan$AMT_BR_CSH_WDL_DR ,main="AMT_BR_CSH_WDL_DR ")

hist(ploan$HOLDING_PERIOD,main="HOLDING_PERIOD", xlab=NA, ylab=NA)
hist(ploan$NO_OF_L_DR_TXNS,main="NO_OF_L_DR_TXNS", xlab=NA, ylab=NA)
hist(ploan$AMT_L_DR,main="AMT_L_DR", xlab=NA, ylab=NA)
hist(ploan$AMT_BR_CSH_WDL_DR ,main="AMT_BR_CSH_WDL_DR ", xlab=NA, ylab=NA)

plot(ploan$OCCUPATION,main="OCCUPATION", xlab=NA, ylab=NA)
plot(ploan$AGE_BKT,main="AGE_BKT", xlab=NA, ylab=NA)
plot(ploan$FLG_HAS_CC,main="FLG_HAS_CC", xlab=NA, ylab=NA)
plot(ploan$GENDER,main="GENDER", xlab=NA, ylab=NA)

Bivariate analysis

library(corrplot)
## Warning: package 'corrplot' was built under R version 3.4.2
## corrplot 0.84 loaded
pl1 <- subset(ploan[c(1,2,4,6,7,10,11,21,28,38,39,41,42)])
pl2 <- subset(ploan[-c(1,2,4,6,7,10,11,21,28,38,39,41,42)])
corx <- cor(pl2)
corrplot(corx,method="circle",tl.cex=0.5)

corx
##                                    AGE       BALANCE           SCR
## AGE                       1.0000000000 -0.1225868887 -0.0058707849
## BALANCE                  -0.1225868887  1.0000000000 -0.0652999838
## SCR                      -0.0058707849 -0.0652999838  1.0000000000
## HOLDING_PERIOD           -0.0120598801  0.0392406960 -0.0251743685
## LEN_OF_RLTN_IN_MNTH      -0.0082792784 -0.0008551526  0.0090335800
## NO_OF_L_CR_TXNS           0.0301702109 -0.0476523126 -0.0131789419
## NO_OF_L_DR_TXNS           0.0196022896 -0.0434309712  0.0093894768
## TOT_NO_OF_L_TXNS          0.0289320084 -0.0512985219 -0.0049522451
## NO_OF_BR_CSH_WDL_DR_TXNS  0.0242658282 -0.0348138188  0.0048274515
## NO_OF_ATM_DR_TXNS         0.0067570308 -0.0305791491  0.0149096786
## NO_OF_NET_DR_TXNS         0.0122679435 -0.0370182529  0.0064761681
## NO_OF_MOB_DR_TXNS         0.0019572951 -0.0210124259  0.0012361580
## NO_OF_CHQ_DR_TXNS         0.0217996747 -0.0325159849  0.0087075107
## AMT_ATM_DR                0.0197021581 -0.0359871389  0.0097440989
## AMT_BR_CSH_WDL_DR         0.0103506920 -0.0209013013 -0.0198408171
## AMT_CHQ_DR                0.0121892929 -0.0125106170  0.0045193167
## AMT_NET_DR                0.0043899298 -0.0293345016  0.0236541198
## AMT_MOB_DR                0.0289084717 -0.0266942619 -0.0125878255
## AMT_L_DR                  0.0167245204 -0.0331931481  0.0034849587
## AMT_OTH_BK_ATM_USG_CHGS  -0.0079800174 -0.0109486772  0.0079019189
## AMT_MIN_BAL_NMC_CHGS      0.0164369225 -0.0618186605  0.0086818985
## NO_OF_IW_CHQ_BNC_TXNS    -0.0144121792 -0.0099343663  0.0008638097
## NO_OF_OW_CHQ_BNC_TXNS    -0.0058303195 -0.0143641666  0.0065411505
## AVG_AMT_PER_ATM_TXN       0.0186923009 -0.0353602872  0.0194400547
## AVG_AMT_PER_CSH_WDL_TXN  -0.0050775478  0.0058067710 -0.0225312148
## AVG_AMT_PER_CHQ_TXN       0.0144561895 -0.0237323732  0.0082671172
## AVG_AMT_PER_NET_TXN       0.0000790903 -0.0191491203  0.0257306992
## AVG_AMT_PER_MOB_TXN       0.0282875621 -0.0287271783 -0.0152461010
## random                   -0.0045172819 -0.0040261584  0.0081308782
##                          HOLDING_PERIOD LEN_OF_RLTN_IN_MNTH
## AGE                        -0.012059880       -8.279278e-03
## BALANCE                     0.039240696       -8.551526e-04
## SCR                        -0.025174369        9.033580e-03
## HOLDING_PERIOD              1.000000000        1.144767e-02
## LEN_OF_RLTN_IN_MNTH         0.011447673        1.000000e+00
## NO_OF_L_CR_TXNS            -0.008474285        2.171897e-02
## NO_OF_L_DR_TXNS            -0.347855164        1.878054e-03
## TOT_NO_OF_L_TXNS           -0.156350280        1.577737e-02
## NO_OF_BR_CSH_WDL_DR_TXNS   -0.196454853       -3.073078e-03
## NO_OF_ATM_DR_TXNS          -0.181790415       -4.713136e-05
## NO_OF_NET_DR_TXNS          -0.250650046        5.920794e-03
## NO_OF_MOB_DR_TXNS          -0.109956056       -3.159358e-03
## NO_OF_CHQ_DR_TXNS          -0.473639299        5.684616e-03
## AMT_ATM_DR                 -0.173627031       -1.001416e-02
## AMT_BR_CSH_WDL_DR          -0.048038366       -1.698567e-03
## AMT_CHQ_DR                 -0.173118109        1.379614e-02
## AMT_NET_DR                 -0.198319400        1.535660e-03
## AMT_MOB_DR                 -0.104096870        4.805786e-03
## AMT_L_DR                   -0.228820720        8.522072e-03
## AMT_OTH_BK_ATM_USG_CHGS    -0.077077830       -6.432491e-03
## AMT_MIN_BAL_NMC_CHGS       -0.006945401       -8.238740e-03
## NO_OF_IW_CHQ_BNC_TXNS      -0.040949546        1.704724e-03
## NO_OF_OW_CHQ_BNC_TXNS      -0.066336851        1.299358e-03
## AVG_AMT_PER_ATM_TXN        -0.167648137       -1.890459e-02
## AVG_AMT_PER_CSH_WDL_TXN     0.053489719        7.646441e-03
## AVG_AMT_PER_CHQ_TXN        -0.209996056        1.290957e-02
## AVG_AMT_PER_NET_TXN        -0.107639295       -2.317134e-03
## AVG_AMT_PER_MOB_TXN        -0.080624988        7.677896e-04
## random                     -0.002089157        3.608765e-03
##                          NO_OF_L_CR_TXNS NO_OF_L_DR_TXNS TOT_NO_OF_L_TXNS
## AGE                          0.030170211     0.019602290      0.028932008
## BALANCE                     -0.047652313    -0.043430971     -0.051298522
## SCR                         -0.013178942     0.009389477     -0.004952245
## HOLDING_PERIOD              -0.008474285    -0.347855164     -0.156350280
## LEN_OF_RLTN_IN_MNTH          0.021718966     0.001878054      0.015777365
## NO_OF_L_CR_TXNS              1.000000000     0.582878327      0.936225572
## NO_OF_L_DR_TXNS              0.582878327     1.000000000      0.831203457
## TOT_NO_OF_L_TXNS             0.936225572     0.831203457      1.000000000
## NO_OF_BR_CSH_WDL_DR_TXNS     0.376076032     0.566710618      0.502432910
## NO_OF_ATM_DR_TXNS            0.478080796     0.806728473      0.675687477
## NO_OF_NET_DR_TXNS            0.543464462     0.915082176      0.767502156
## NO_OF_MOB_DR_TXNS            0.456308736     0.763747602      0.642399104
## NO_OF_CHQ_DR_TXNS            0.286492245     0.608017630      0.459061809
## AMT_ATM_DR                   0.436094319     0.699706523      0.601077738
## AMT_BR_CSH_WDL_DR            0.086326741     0.115308142      0.108965340
## AMT_CHQ_DR                   0.288798124     0.466685679      0.399406743
## AMT_NET_DR                   0.146707618     0.303860430      0.231834834
## AMT_MOB_DR                   0.394123020     0.551017942      0.507941092
## AMT_L_DR                     0.320615158     0.530681849      0.448896195
## AMT_OTH_BK_ATM_USG_CHGS      0.320124519     0.564558279      0.463085674
## AMT_MIN_BAL_NMC_CHGS         0.026631556     0.009876822      0.022458196
## NO_OF_IW_CHQ_BNC_TXNS        0.002825437     0.059746413      0.027804172
## NO_OF_OW_CHQ_BNC_TXNS        0.036371862     0.085200056      0.061762124
## AVG_AMT_PER_ATM_TXN          0.196087423     0.320450157      0.273037974
## AVG_AMT_PER_CSH_WDL_TXN     -0.072480645    -0.138213687     -0.109383160
## AVG_AMT_PER_CHQ_TXN          0.296118646     0.496140739      0.417130807
## AVG_AMT_PER_NET_TXN         -0.070979834    -0.040286627     -0.065890212
## AVG_AMT_PER_MOB_TXN          0.331735967     0.409491099      0.404072540
## random                      -0.006646545    -0.005100748     -0.006643155
##                          NO_OF_BR_CSH_WDL_DR_TXNS NO_OF_ATM_DR_TXNS
## AGE                                   0.024265828      6.757031e-03
## BALANCE                              -0.034813819     -3.057915e-02
## SCR                                   0.004827451      1.490968e-02
## HOLDING_PERIOD                       -0.196454853     -1.817904e-01
## LEN_OF_RLTN_IN_MNTH                  -0.003073078     -4.713136e-05
## NO_OF_L_CR_TXNS                       0.376076032      4.780808e-01
## NO_OF_L_DR_TXNS                       0.566710618      8.067285e-01
## TOT_NO_OF_L_TXNS                      0.502432910      6.756875e-01
## NO_OF_BR_CSH_WDL_DR_TXNS              1.000000000      2.528161e-01
## NO_OF_ATM_DR_TXNS                     0.252816060      1.000000e+00
## NO_OF_NET_DR_TXNS                     0.414579011      7.587912e-01
## NO_OF_MOB_DR_TXNS                     0.168559933      7.737012e-01
## NO_OF_CHQ_DR_TXNS                     0.156116651      3.117335e-01
## AMT_ATM_DR                            0.344833802      7.083088e-01
## AMT_BR_CSH_WDL_DR                     0.320712863      1.054877e-02
## AMT_CHQ_DR                            0.085462604      2.523575e-01
## AMT_NET_DR                            0.173491510      2.288784e-01
## AMT_MOB_DR                            0.464860671      3.326339e-01
## AMT_L_DR                              0.319194885      3.012735e-01
## AMT_OTH_BK_ATM_USG_CHGS              -0.014458881      8.409783e-01
## AMT_MIN_BAL_NMC_CHGS                  0.010882111      3.306876e-03
## NO_OF_IW_CHQ_BNC_TXNS                 0.045698356      3.112818e-02
## NO_OF_OW_CHQ_BNC_TXNS                 0.049474952      5.866894e-02
## AVG_AMT_PER_ATM_TXN                   0.239661040      3.119639e-01
## AVG_AMT_PER_CSH_WDL_TXN              -0.127145035     -1.026635e-01
## AVG_AMT_PER_CHQ_TXN                   0.137317211      2.842338e-01
## AVG_AMT_PER_NET_TXN                  -0.045247021     -1.114357e-02
## AVG_AMT_PER_MOB_TXN                   0.432036996      1.966421e-01
## random                                0.001383773     -2.728814e-03
##                          NO_OF_NET_DR_TXNS NO_OF_MOB_DR_TXNS
## AGE                            0.012267943       0.001957295
## BALANCE                       -0.037018253      -0.021012426
## SCR                            0.006476168       0.001236158
## HOLDING_PERIOD                -0.250650046      -0.109956056
## LEN_OF_RLTN_IN_MNTH            0.005920794      -0.003159358
## NO_OF_L_CR_TXNS                0.543464462       0.456308736
## NO_OF_L_DR_TXNS                0.915082176       0.763747602
## TOT_NO_OF_L_TXNS               0.767502156       0.642399104
## NO_OF_BR_CSH_WDL_DR_TXNS       0.414579011       0.168559933
## NO_OF_ATM_DR_TXNS              0.758791239       0.773701233
## NO_OF_NET_DR_TXNS              1.000000000       0.753339568
## NO_OF_MOB_DR_TXNS              0.753339568       1.000000000
## NO_OF_CHQ_DR_TXNS              0.432361300       0.210224038
## AMT_ATM_DR                     0.640036786       0.537395811
## AMT_BR_CSH_WDL_DR              0.060027161      -0.031144375
## AMT_CHQ_DR                     0.452952997       0.216940442
## AMT_NET_DR                     0.413677540       0.111040021
## AMT_MOB_DR                     0.474324695       0.319453846
## AMT_L_DR                       0.539066983       0.202704988
## AMT_OTH_BK_ATM_USG_CHGS        0.569358116       0.805864033
## AMT_MIN_BAL_NMC_CHGS           0.006654306       0.014441666
## NO_OF_IW_CHQ_BNC_TXNS          0.037649370       0.010777148
## NO_OF_OW_CHQ_BNC_TXNS          0.062208664       0.046850773
## AVG_AMT_PER_ATM_TXN            0.226788266       0.063536037
## AVG_AMT_PER_CSH_WDL_TXN       -0.125559398      -0.093861111
## AVG_AMT_PER_CHQ_TXN            0.486431759       0.232384892
## AVG_AMT_PER_NET_TXN            0.040412931      -0.086132463
## AVG_AMT_PER_MOB_TXN            0.320204432       0.150585721
## random                        -0.002216460      -0.001283732
##                          NO_OF_CHQ_DR_TXNS   AMT_ATM_DR AMT_BR_CSH_WDL_DR
## AGE                           0.0217996747  0.019702158       0.010350692
## BALANCE                      -0.0325159849 -0.035987139      -0.020901301
## SCR                           0.0087075107  0.009744099      -0.019840817
## HOLDING_PERIOD               -0.4736392990 -0.173627031      -0.048038366
## LEN_OF_RLTN_IN_MNTH           0.0056846161 -0.010014162      -0.001698567
## NO_OF_L_CR_TXNS               0.2864922454  0.436094319       0.086326741
## NO_OF_L_DR_TXNS               0.6080176296  0.699706523       0.115308142
## TOT_NO_OF_L_TXNS              0.4590618093  0.601077738       0.108965340
## NO_OF_BR_CSH_WDL_DR_TXNS      0.1561166514  0.344833802       0.320712863
## NO_OF_ATM_DR_TXNS             0.3117334639  0.708308791       0.010548774
## NO_OF_NET_DR_TXNS             0.4323613005  0.640036786       0.060027161
## NO_OF_MOB_DR_TXNS             0.2102240375  0.537395811      -0.031144375
## NO_OF_CHQ_DR_TXNS             1.0000000000  0.381930517       0.025830464
## AMT_ATM_DR                    0.3819305171  1.000000000       0.041550639
## AMT_BR_CSH_WDL_DR             0.0258304639  0.041550639       1.000000000
## AMT_CHQ_DR                    0.6230378798  0.309998601       0.024670558
## AMT_NET_DR                    0.1590108697  0.221944553       0.104824900
## AMT_MOB_DR                    0.3760261233  0.377971600       0.074122864
## AMT_L_DR                      0.5016408908  0.357536594       0.533224860
## AMT_OTH_BK_ATM_USG_CHGS       0.0496839455  0.431459258      -0.054181965
## AMT_MIN_BAL_NMC_CHGS          0.0005051339  0.003875363       0.001265182
## NO_OF_IW_CHQ_BNC_TXNS         0.0823414499  0.037500737       0.042927667
## NO_OF_OW_CHQ_BNC_TXNS         0.0882304908  0.032538929       0.031696090
## AVG_AMT_PER_ATM_TXN           0.3258795124  0.724982307       0.087367371
## AVG_AMT_PER_CSH_WDL_TXN      -0.0540339181 -0.106329710       0.776706032
## AVG_AMT_PER_CHQ_TXN           0.6018441917  0.326789870       0.031137620
## AVG_AMT_PER_NET_TXN          -0.0478749757 -0.017963262       0.080935912
## AVG_AMT_PER_MOB_TXN           0.3347324610  0.281797857       0.082373510
## random                       -0.0127008050 -0.003748107      -0.002808173
##                            AMT_CHQ_DR    AMT_NET_DR    AMT_MOB_DR
## AGE                       0.012189293  0.0043899298  0.0289084717
## BALANCE                  -0.012510617 -0.0293345016 -0.0266942619
## SCR                       0.004519317  0.0236541198 -0.0125878255
## HOLDING_PERIOD           -0.173118109 -0.1983193996 -0.1040968699
## LEN_OF_RLTN_IN_MNTH       0.013796138  0.0015356605  0.0048057857
## NO_OF_L_CR_TXNS           0.288798124  0.1467076180  0.3941230204
## NO_OF_L_DR_TXNS           0.466685679  0.3038604305  0.5510179422
## TOT_NO_OF_L_TXNS          0.399406743  0.2318348343  0.5079410924
## NO_OF_BR_CSH_WDL_DR_TXNS  0.085462604  0.1734915098  0.4648606706
## NO_OF_ATM_DR_TXNS         0.252357473  0.2288783616  0.3326338702
## NO_OF_NET_DR_TXNS         0.452952997  0.4136775398  0.4743246955
## NO_OF_MOB_DR_TXNS         0.216940442  0.1110400208  0.3194538462
## NO_OF_CHQ_DR_TXNS         0.623037880  0.1590108697  0.3760261233
## AMT_ATM_DR                0.309998601  0.2219445527  0.3779716004
## AMT_BR_CSH_WDL_DR         0.024670558  0.1048249003  0.0741228636
## AMT_CHQ_DR                1.000000000  0.1547845811  0.3293078035
## AMT_NET_DR                0.154784581  1.0000000000  0.1161647353
## AMT_MOB_DR                0.329307803  0.1161647353  1.0000000000
## AMT_L_DR                  0.726831006  0.6047251144  0.3670629404
## AMT_OTH_BK_ATM_USG_CHGS   0.064480153  0.0779602866  0.1145090322
## AMT_MIN_BAL_NMC_CHGS     -0.006257877 -0.0006234766  0.0188714317
## NO_OF_IW_CHQ_BNC_TXNS     0.027038765  0.0446767607 -0.0002489512
## NO_OF_OW_CHQ_BNC_TXNS     0.036334694  0.0393407230  0.0268431976
## AVG_AMT_PER_ATM_TXN       0.156373325  0.2338513188  0.1911939468
## AVG_AMT_PER_CSH_WDL_TXN  -0.036469233 -0.0029777271 -0.1402926321
## AVG_AMT_PER_CHQ_TXN       0.904118428  0.1956416760  0.3437716019
## AVG_AMT_PER_NET_TXN      -0.058813641  0.8567920886 -0.1600936064
## AVG_AMT_PER_MOB_TXN       0.268764198  0.0882360434  0.9641983995
## random                   -0.014588125  0.0059192938 -0.0025768599
##                              AMT_L_DR AMT_OTH_BK_ATM_USG_CHGS
## AGE                       0.016724520           -0.0079800174
## BALANCE                  -0.033193148           -0.0109486772
## SCR                       0.003484959            0.0079019189
## HOLDING_PERIOD           -0.228820720           -0.0770778303
## LEN_OF_RLTN_IN_MNTH       0.008522072           -0.0064324907
## NO_OF_L_CR_TXNS           0.320615158            0.3201245188
## NO_OF_L_DR_TXNS           0.530681849            0.5645582793
## TOT_NO_OF_L_TXNS          0.448896195            0.4630856743
## NO_OF_BR_CSH_WDL_DR_TXNS  0.319194885           -0.0144588805
## NO_OF_ATM_DR_TXNS         0.301273547            0.8409783281
## NO_OF_NET_DR_TXNS         0.539066983            0.5693581163
## NO_OF_MOB_DR_TXNS         0.202704988            0.8058640332
## NO_OF_CHQ_DR_TXNS         0.501640891            0.0496839455
## AMT_ATM_DR                0.357536594            0.4314592577
## AMT_BR_CSH_WDL_DR         0.533224860           -0.0541819645
## AMT_CHQ_DR                0.726831006            0.0644801529
## AMT_NET_DR                0.604725114            0.0779602866
## AMT_MOB_DR                0.367062940            0.1145090322
## AMT_L_DR                  1.000000000            0.0666782928
## AMT_OTH_BK_ATM_USG_CHGS   0.066678293            1.0000000000
## AMT_MIN_BAL_NMC_CHGS     -0.002155378            0.0074047711
## NO_OF_IW_CHQ_BNC_TXNS     0.057424091            0.0065801985
## NO_OF_OW_CHQ_BNC_TXNS     0.057317799            0.0420089960
## AVG_AMT_PER_ATM_TXN       0.270583341           -0.0122208608
## AVG_AMT_PER_CSH_WDL_TXN   0.325359596           -0.0490491974
## AVG_AMT_PER_CHQ_TXN       0.690381328            0.0927150459
## AVG_AMT_PER_NET_TXN       0.373473913           -0.0402883178
## AVG_AMT_PER_MOB_TXN       0.316517155           -0.0212487487
## random                   -0.007909288           -0.0002576055
##                          AMT_MIN_BAL_NMC_CHGS NO_OF_IW_CHQ_BNC_TXNS
## AGE                              0.0164369225         -0.0144121792
## BALANCE                         -0.0618186605         -0.0099343663
## SCR                              0.0086818985          0.0008638097
## HOLDING_PERIOD                  -0.0069454006         -0.0409495460
## LEN_OF_RLTN_IN_MNTH             -0.0082387403          0.0017047238
## NO_OF_L_CR_TXNS                  0.0266315558          0.0028254367
## NO_OF_L_DR_TXNS                  0.0098768220          0.0597464134
## TOT_NO_OF_L_TXNS                 0.0224581958          0.0278041719
## NO_OF_BR_CSH_WDL_DR_TXNS         0.0108821107          0.0456983559
## NO_OF_ATM_DR_TXNS                0.0033068757          0.0311281767
## NO_OF_NET_DR_TXNS                0.0066543062          0.0376493698
## NO_OF_MOB_DR_TXNS                0.0144416658          0.0107771477
## NO_OF_CHQ_DR_TXNS                0.0005051339          0.0823414499
## AMT_ATM_DR                       0.0038753628          0.0375007374
## AMT_BR_CSH_WDL_DR                0.0012651818          0.0429276667
## AMT_CHQ_DR                      -0.0062578775          0.0270387654
## AMT_NET_DR                      -0.0006234766          0.0446767607
## AMT_MOB_DR                       0.0188714317         -0.0002489512
## AMT_L_DR                        -0.0021553778          0.0574240912
## AMT_OTH_BK_ATM_USG_CHGS          0.0074047711          0.0065801985
## AMT_MIN_BAL_NMC_CHGS             1.0000000000          0.0241087169
## NO_OF_IW_CHQ_BNC_TXNS            0.0241087169          1.0000000000
## NO_OF_OW_CHQ_BNC_TXNS           -0.0076740076          0.0060161767
## AVG_AMT_PER_ATM_TXN             -0.0010541073          0.0495007799
## AVG_AMT_PER_CSH_WDL_TXN         -0.0089700934          0.0130782914
## AVG_AMT_PER_CHQ_TXN             -0.0107249969          0.0465097592
## AVG_AMT_PER_NET_TXN             -0.0055692355          0.0401768417
## AVG_AMT_PER_MOB_TXN              0.0191151141         -0.0030758287
## random                           0.0031265951         -0.0048168358
##                          NO_OF_OW_CHQ_BNC_TXNS AVG_AMT_PER_ATM_TXN
## AGE                              -0.0058303195         0.018692301
## BALANCE                          -0.0143641666        -0.035360287
## SCR                               0.0065411505         0.019440055
## HOLDING_PERIOD                   -0.0663368508        -0.167648137
## LEN_OF_RLTN_IN_MNTH               0.0012993584        -0.018904591
## NO_OF_L_CR_TXNS                   0.0363718620         0.196087423
## NO_OF_L_DR_TXNS                   0.0852000564         0.320450157
## TOT_NO_OF_L_TXNS                  0.0617621242         0.273037974
## NO_OF_BR_CSH_WDL_DR_TXNS          0.0494749522         0.239661040
## NO_OF_ATM_DR_TXNS                 0.0586689437         0.311963910
## NO_OF_NET_DR_TXNS                 0.0622086641         0.226788266
## NO_OF_MOB_DR_TXNS                 0.0468507732         0.063536037
## NO_OF_CHQ_DR_TXNS                 0.0882304908         0.325879512
## AMT_ATM_DR                        0.0325389289         0.724982307
## AMT_BR_CSH_WDL_DR                 0.0316960899         0.087367371
## AMT_CHQ_DR                        0.0363346938         0.156373325
## AMT_NET_DR                        0.0393407230         0.233851319
## AMT_MOB_DR                        0.0268431976         0.191193947
## AMT_L_DR                          0.0573177987         0.270583341
## AMT_OTH_BK_ATM_USG_CHGS           0.0420089960        -0.012220861
## AMT_MIN_BAL_NMC_CHGS             -0.0076740076        -0.001054107
## NO_OF_IW_CHQ_BNC_TXNS             0.0060161767         0.049500780
## NO_OF_OW_CHQ_BNC_TXNS             1.0000000000         0.030366280
## AVG_AMT_PER_ATM_TXN               0.0303662799         1.000000000
## AVG_AMT_PER_CSH_WDL_TXN           0.0113525559        -0.023336905
## AVG_AMT_PER_CHQ_TXN               0.0729911230         0.176683964
## AVG_AMT_PER_NET_TXN               0.0215107302         0.143489591
## AVG_AMT_PER_MOB_TXN               0.0199930200         0.189097228
## random                           -0.0001959959        -0.007888469
##                          AVG_AMT_PER_CSH_WDL_TXN AVG_AMT_PER_CHQ_TXN
## AGE                                 -0.005077548         0.014456189
## BALANCE                              0.005806771        -0.023732373
## SCR                                 -0.022531215         0.008267117
## HOLDING_PERIOD                       0.053489719        -0.209996056
## LEN_OF_RLTN_IN_MNTH                  0.007646441         0.012909573
## NO_OF_L_CR_TXNS                     -0.072480645         0.296118646
## NO_OF_L_DR_TXNS                     -0.138213687         0.496140739
## TOT_NO_OF_L_TXNS                    -0.109383160         0.417130807
## NO_OF_BR_CSH_WDL_DR_TXNS            -0.127145035         0.137317211
## NO_OF_ATM_DR_TXNS                   -0.102663537         0.284233850
## NO_OF_NET_DR_TXNS                   -0.125559398         0.486431759
## NO_OF_MOB_DR_TXNS                   -0.093861111         0.232384892
## NO_OF_CHQ_DR_TXNS                   -0.054033918         0.601844192
## AMT_ATM_DR                          -0.106329710         0.326789870
## AMT_BR_CSH_WDL_DR                    0.776706032         0.031137620
## AMT_CHQ_DR                          -0.036469233         0.904118428
## AMT_NET_DR                          -0.002977727         0.195641676
## AMT_MOB_DR                          -0.140292632         0.343771602
## AMT_L_DR                             0.325359596         0.690381328
## AMT_OTH_BK_ATM_USG_CHGS             -0.049049197         0.092715046
## AMT_MIN_BAL_NMC_CHGS                -0.008970093        -0.010724997
## NO_OF_IW_CHQ_BNC_TXNS                0.013078291         0.046509759
## NO_OF_OW_CHQ_BNC_TXNS                0.011352556         0.072991123
## AVG_AMT_PER_ATM_TXN                 -0.023336905         0.176683964
## AVG_AMT_PER_CSH_WDL_TXN              1.000000000        -0.043675627
## AVG_AMT_PER_CHQ_TXN                 -0.043675627         1.000000000
## AVG_AMT_PER_NET_TXN                  0.069843066        -0.033329317
## AVG_AMT_PER_MOB_TXN                 -0.125600515         0.289496096
## random                               0.002993618        -0.010437338
##                          AVG_AMT_PER_NET_TXN AVG_AMT_PER_MOB_TXN
## AGE                             0.0000790903        0.0282875621
## BALANCE                        -0.0191491203       -0.0287271783
## SCR                             0.0257306992       -0.0152461010
## HOLDING_PERIOD                 -0.1076392949       -0.0806249880
## LEN_OF_RLTN_IN_MNTH            -0.0023171340        0.0007677896
## NO_OF_L_CR_TXNS                -0.0709798339        0.3317359670
## NO_OF_L_DR_TXNS                -0.0402866267        0.4094910991
## TOT_NO_OF_L_TXNS               -0.0658902116        0.4040725404
## NO_OF_BR_CSH_WDL_DR_TXNS       -0.0452470211        0.4320369958
## NO_OF_ATM_DR_TXNS              -0.0111435684        0.1966421056
## NO_OF_NET_DR_TXNS               0.0404129313        0.3202044323
## NO_OF_MOB_DR_TXNS              -0.0861324629        0.1505857210
## NO_OF_CHQ_DR_TXNS              -0.0478749757        0.3347324610
## AMT_ATM_DR                     -0.0179632619        0.2817978566
## AMT_BR_CSH_WDL_DR               0.0809359115        0.0823735098
## AMT_CHQ_DR                     -0.0588136412        0.2687641979
## AMT_NET_DR                      0.8567920886        0.0882360434
## AMT_MOB_DR                     -0.1600936064        0.9641983995
## AMT_L_DR                        0.3734739128        0.3165171552
## AMT_OTH_BK_ATM_USG_CHGS        -0.0402883178       -0.0212487487
## AMT_MIN_BAL_NMC_CHGS           -0.0055692355        0.0191151141
## NO_OF_IW_CHQ_BNC_TXNS           0.0401768417       -0.0030758287
## NO_OF_OW_CHQ_BNC_TXNS           0.0215107302        0.0199930200
## AVG_AMT_PER_ATM_TXN             0.1434895914        0.1890972281
## AVG_AMT_PER_CSH_WDL_TXN         0.0698430660       -0.1256005147
## AVG_AMT_PER_CHQ_TXN            -0.0333293167        0.2894960959
## AVG_AMT_PER_NET_TXN             1.0000000000       -0.1518724649
## AVG_AMT_PER_MOB_TXN            -0.1518724649        1.0000000000
## random                          0.0064117100       -0.0021431760
##                                 random
## AGE                      -0.0045172819
## BALANCE                  -0.0040261584
## SCR                       0.0081308782
## HOLDING_PERIOD           -0.0020891571
## LEN_OF_RLTN_IN_MNTH       0.0036087650
## NO_OF_L_CR_TXNS          -0.0066465453
## NO_OF_L_DR_TXNS          -0.0051007475
## TOT_NO_OF_L_TXNS         -0.0066431547
## NO_OF_BR_CSH_WDL_DR_TXNS  0.0013837732
## NO_OF_ATM_DR_TXNS        -0.0027288136
## NO_OF_NET_DR_TXNS        -0.0022164604
## NO_OF_MOB_DR_TXNS        -0.0012837317
## NO_OF_CHQ_DR_TXNS        -0.0127008050
## AMT_ATM_DR               -0.0037481072
## AMT_BR_CSH_WDL_DR        -0.0028081725
## AMT_CHQ_DR               -0.0145881249
## AMT_NET_DR                0.0059192938
## AMT_MOB_DR               -0.0025768599
## AMT_L_DR                 -0.0079092875
## AMT_OTH_BK_ATM_USG_CHGS  -0.0002576055
## AMT_MIN_BAL_NMC_CHGS      0.0031265951
## NO_OF_IW_CHQ_BNC_TXNS    -0.0048168358
## NO_OF_OW_CHQ_BNC_TXNS    -0.0001959959
## AVG_AMT_PER_ATM_TXN      -0.0078884687
## AVG_AMT_PER_CSH_WDL_TXN   0.0029936185
## AVG_AMT_PER_CHQ_TXN      -0.0104373377
## AVG_AMT_PER_NET_TXN       0.0064117100
## AVG_AMT_PER_MOB_TXN      -0.0021431760
## random                    1.0000000000

Splittting the data into 70% and 30%

library(caret)
## Warning: package 'caret' was built under R version 3.4.3
## Loading required package: lattice
## Loading required package: ggplot2
## 
## Attaching package: 'ggplot2'
## The following objects are masked from 'package:psych':
## 
##     %+%, alpha
index <- createDataPartition(ploan$TARGET, p=0.70, list=FALSE)
train <- ploan[ index,]
test <- ploan[-index,]

Node size should be 1-2% of the development sample

library(randomForest)
## Warning: package 'randomForest' was built under R version 3.4.2
## randomForest 4.6-12
## Type rfNews() to see new features/changes/bug fixes.
## 
## Attaching package: 'randomForest'
## The following object is masked from 'package:ggplot2':
## 
##     margin
## The following object is masked from 'package:psych':
## 
##     outlier

Optimal number of trees is 25

Tuning Random Forest, finding the optimal number of m

tRF2 <- tuneRF(x = train[,-c(1,2)], 
              y=as.factor(train$TARGET),
              mtryStart = 3, 
              ntreeTry=25, 
              stepFactor = 1.5, 
              improve = 0.001, 
              trace=TRUE, 
              plot = TRUE,
              doBest = TRUE,
              nodesize = 100, 
              importance=TRUE
)
## mtry = 3  OOB error = 12.22% 
## Searching left ...
## mtry = 2     OOB error = 12.29% 
## -0.005260082 0.001 
## Searching right ...
## mtry = 4     OOB error = 12.12% 
## 0.00818235 0.001 
## mtry = 6     OOB error = 11.96% 
## 0.01296405 0.001 
## mtry = 9     OOB error = 11.87% 
## 0.007761194 0.001 
## mtry = 13    OOB error = 11.75% 
## 0.01015794 0.001 
## mtry = 19    OOB error = 11.74% 
## 0.001287147 0.001 
## mtry = 28    OOB error = 11.66% 
## 0.00669507 0.001 
## mtry = 40    OOB error = 11.61% 
## 0.004218088 0.001

using tuneRF found m as 13

print(tRF2)
## 
## Call:
##  randomForest(x = x, y = y, mtry = res[which.min(res[, 2]), 1],      nodesize = 100, importance = TRUE) 
##                Type of random forest: classification
##                      Number of trees: 500
## No. of variables tried at each split: 40
## 
##         OOB estimate of  error rate: 11.61%
## Confusion matrix:
##       0   1 class.error
## 0 12237  31 0.002526899
## 1  1595 137 0.920900693
plot(tRF2, main="")
legend("topright", c("OOB", "0", "1"), text.col=1:6, lty=1:3, col=1:3)
title(main="Error Rates Random Forest RFDF.dev")

tRF2$importance
##                                      0             1 MeanDecreaseAccuracy
## AGE                       1.018293e-03  4.892221e-03         1.496210e-03
## GENDER                    1.147883e-03  3.202941e-03         1.401051e-03
## BALANCE                   2.498618e-03  3.135466e-02         6.063722e-03
## OCCUPATION                3.482819e-03  2.556256e-02         6.210751e-03
## AGE_BKT                   1.502607e-03  1.252907e-02         2.866081e-03
## SCR                       3.393084e-03  3.035856e-02         6.724208e-03
## HOLDING_PERIOD            1.946641e-02  1.921907e-02         1.943840e-02
## ACC_TYPE                  7.344651e-04  1.489373e-04         6.609152e-04
## ACC_OP_DATE               4.107715e-03  5.072407e-03         4.223463e-03
## LEN_OF_RLTN_IN_MNTH       3.224285e-03 -4.805475e-04         2.764136e-03
## NO_OF_L_CR_TXNS           3.243441e-02 -8.949877e-03         2.731652e-02
## NO_OF_L_DR_TXNS           9.381195e-02 -2.663333e-02         7.893805e-02
## TOT_NO_OF_L_TXNS          3.703274e-02 -2.177546e-02         2.978365e-02
## NO_OF_BR_CSH_WDL_DR_TXNS  2.199687e-03  1.799596e-03         2.150081e-03
## NO_OF_ATM_DR_TXNS         2.587951e-02 -1.456011e-02         2.088901e-02
## NO_OF_NET_DR_TXNS         8.486262e-04 -3.548047e-04         7.001810e-04
## NO_OF_MOB_DR_TXNS         5.493343e-04 -3.115659e-04         4.424556e-04
## NO_OF_CHQ_DR_TXNS         4.281624e-03 -2.150697e-04         3.724991e-03
## FLG_HAS_CC                2.614018e-03  1.944593e-02         4.694556e-03
## AMT_ATM_DR                1.160043e-02  1.138020e-04         1.016776e-02
## AMT_BR_CSH_WDL_DR         6.027803e-03  3.678128e-03         5.734477e-03
## AMT_CHQ_DR                6.691233e-03 -3.370808e-04         5.825329e-03
## AMT_NET_DR                2.092071e-03  7.649549e-04         1.925363e-03
## AMT_MOB_DR                2.915398e-03 -7.366642e-04         2.458838e-03
## AMT_L_DR                  2.086338e-02 -8.752214e-03         1.720980e-02
## FLG_HAS_ANY_CHGS          1.067064e-04  2.379925e-04         1.231093e-04
## AMT_OTH_BK_ATM_USG_CHGS  -7.595654e-06  5.837013e-05         8.010807e-07
## AMT_MIN_BAL_NMC_CHGS      3.107518e-06  5.064522e-05         8.980494e-06
## NO_OF_IW_CHQ_BNC_TXNS     6.920842e-05  3.899875e-04         1.091865e-04
## NO_OF_OW_CHQ_BNC_TXNS     2.495608e-05  4.244435e-04         7.433764e-05
## AVG_AMT_PER_ATM_TXN       9.080786e-03 -8.552783e-04         7.847931e-03
## AVG_AMT_PER_CSH_WDL_TXN   5.559868e-03  9.484557e-04         4.991598e-03
## AVG_AMT_PER_CHQ_TXN       8.952852e-03 -2.280435e-03         7.567514e-03
## AVG_AMT_PER_NET_TXN       2.644861e-03  5.786227e-04         2.386537e-03
## AVG_AMT_PER_MOB_TXN       1.706737e-03  4.234294e-03         2.014644e-03
## FLG_HAS_NOMINEE           5.001393e-05  1.374494e-04         6.097462e-05
## FLG_HAS_OLD_LOAN          6.692224e-06  1.583228e-04         2.527735e-05
## random                    3.352413e-05  7.559321e-04         1.230970e-04
## LOW_BAL                   0.000000e+00  0.000000e+00         0.000000e+00
## LOW_HOLD                  0.000000e+00  0.000000e+00         0.000000e+00
##                          MeanDecreaseGini
## AGE                            22.6424421
## GENDER                         14.4373147
## BALANCE                        77.3519660
## OCCUPATION                     40.9323883
## AGE_BKT                        37.9694162
## SCR                            78.4414355
## HOLDING_PERIOD                 56.5717561
## ACC_TYPE                        3.1901887
## ACC_OP_DATE                    43.6354960
## LEN_OF_RLTN_IN_MNTH            15.5469130
## NO_OF_L_CR_TXNS                55.8492979
## NO_OF_L_DR_TXNS                49.1277270
## TOT_NO_OF_L_TXNS               48.0896195
## NO_OF_BR_CSH_WDL_DR_TXNS       13.3763557
## NO_OF_ATM_DR_TXNS              17.9420072
## NO_OF_NET_DR_TXNS               2.1800071
## NO_OF_MOB_DR_TXNS               1.3794476
## NO_OF_CHQ_DR_TXNS              10.3413527
## FLG_HAS_CC                     21.7606289
## AMT_ATM_DR                     29.7490316
## AMT_BR_CSH_WDL_DR              34.5492091
## AMT_CHQ_DR                     21.0375430
## AMT_NET_DR                     14.2695808
## AMT_MOB_DR                     10.5347242
## AMT_L_DR                       35.7047485
## FLG_HAS_ANY_CHGS                2.8727688
## AMT_OTH_BK_ATM_USG_CHGS         0.2697427
## AMT_MIN_BAL_NMC_CHGS            0.3414494
## NO_OF_IW_CHQ_BNC_TXNS           3.2658671
## NO_OF_OW_CHQ_BNC_TXNS           2.5520463
## AVG_AMT_PER_ATM_TXN            28.0863935
## AVG_AMT_PER_CSH_WDL_TXN        28.2169823
## AVG_AMT_PER_CHQ_TXN            22.0183368
## AVG_AMT_PER_NET_TXN            18.7041979
## AVG_AMT_PER_MOB_TXN            20.0389305
## FLG_HAS_NOMINEE                 1.2584349
## FLG_HAS_OLD_LOAN                1.5522024
## random                         23.0425189
## LOW_BAL                         0.0000000
## LOW_HOLD                        0.0000000

List the importance of the variables

impVar <- round(randomForest::importance(tRF2), 2)
impVar[order(impVar[,4], decreasing=TRUE),]
##                              0      1 MeanDecreaseAccuracy
## SCR                      27.76  43.17                42.69
## BALANCE                  21.38  41.49                39.35
## HOLDING_PERIOD           27.25  21.93                32.67
## NO_OF_L_CR_TXNS          25.84  -7.01                27.76
## NO_OF_L_DR_TXNS          35.08 -13.86                36.03
## TOT_NO_OF_L_TXNS         23.03 -11.31                24.61
## ACC_OP_DATE              12.86  10.92                16.46
## OCCUPATION               25.86  34.25                36.67
## AGE_BKT                  16.36  25.63                26.51
## AMT_L_DR                 33.54 -15.04                34.68
## AMT_BR_CSH_WDL_DR        15.37   8.77                17.59
## AMT_ATM_DR               18.36   0.15                19.94
## AVG_AMT_PER_CSH_WDL_TXN  14.72   2.68                16.19
## AVG_AMT_PER_ATM_TXN      17.87  -1.49                19.53
## random                    1.01   6.35                 3.83
## AGE                      13.69  15.36                18.71
## AVG_AMT_PER_CHQ_TXN      21.61  -5.70                22.48
## FLG_HAS_CC               28.08  36.80                38.79
## AMT_CHQ_DR               14.87  -0.78                15.81
## AVG_AMT_PER_MOB_TXN       5.60  11.04                 8.23
## AVG_AMT_PER_NET_TXN       9.27   2.47                10.00
## NO_OF_ATM_DR_TXNS        26.71 -21.80                26.57
## LEN_OF_RLTN_IN_MNTH      10.35  -1.31                11.46
## GENDER                   17.17  20.48                22.67
## AMT_NET_DR                8.46   3.08                 9.59
## NO_OF_BR_CSH_WDL_DR_TXNS 12.36   6.09                14.68
## AMT_MOB_DR                6.86  -1.34                 7.82
## NO_OF_CHQ_DR_TXNS        12.17  -0.53                13.16
## NO_OF_IW_CHQ_BNC_TXNS     4.49   6.61                 6.68
## ACC_TYPE                  5.87   1.33                 6.31
## FLG_HAS_ANY_CHGS          6.52   4.65                 7.32
## NO_OF_OW_CHQ_BNC_TXNS     1.55   5.95                 4.65
## NO_OF_NET_DR_TXNS         8.50  -2.93                 8.97
## FLG_HAS_OLD_LOAN          0.76   3.02                 2.52
## NO_OF_MOB_DR_TXNS         3.75  -1.82                 4.06
## FLG_HAS_NOMINEE           3.54   3.00                 4.07
## AMT_MIN_BAL_NMC_CHGS      1.09   2.65                 2.80
## AMT_OTH_BK_ATM_USG_CHGS  -2.62   2.91                 0.33
## LOW_BAL                   0.00   0.00                 0.00
## LOW_HOLD                  0.00   0.00                 0.00
##                          MeanDecreaseGini
## SCR                                 78.44
## BALANCE                             77.35
## HOLDING_PERIOD                      56.57
## NO_OF_L_CR_TXNS                     55.85
## NO_OF_L_DR_TXNS                     49.13
## TOT_NO_OF_L_TXNS                    48.09
## ACC_OP_DATE                         43.64
## OCCUPATION                          40.93
## AGE_BKT                             37.97
## AMT_L_DR                            35.70
## AMT_BR_CSH_WDL_DR                   34.55
## AMT_ATM_DR                          29.75
## AVG_AMT_PER_CSH_WDL_TXN             28.22
## AVG_AMT_PER_ATM_TXN                 28.09
## random                              23.04
## AGE                                 22.64
## AVG_AMT_PER_CHQ_TXN                 22.02
## FLG_HAS_CC                          21.76
## AMT_CHQ_DR                          21.04
## AVG_AMT_PER_MOB_TXN                 20.04
## AVG_AMT_PER_NET_TXN                 18.70
## NO_OF_ATM_DR_TXNS                   17.94
## LEN_OF_RLTN_IN_MNTH                 15.55
## GENDER                              14.44
## AMT_NET_DR                          14.27
## NO_OF_BR_CSH_WDL_DR_TXNS            13.38
## AMT_MOB_DR                          10.53
## NO_OF_CHQ_DR_TXNS                   10.34
## NO_OF_IW_CHQ_BNC_TXNS                3.27
## ACC_TYPE                             3.19
## FLG_HAS_ANY_CHGS                     2.87
## NO_OF_OW_CHQ_BNC_TXNS                2.55
## NO_OF_NET_DR_TXNS                    2.18
## FLG_HAS_OLD_LOAN                     1.55
## NO_OF_MOB_DR_TXNS                    1.38
## FLG_HAS_NOMINEE                      1.26
## AMT_MIN_BAL_NMC_CHGS                 0.34
## AMT_OTH_BK_ATM_USG_CHGS              0.27
## LOW_BAL                              0.00
## LOW_HOLD                             0.00
varImpPlot(tRF2,
           sort = T,
           main="Variable Importance",
           n.var=13)

Scoring syntax

train$predict.class <- predict(tRF2,train, type="class")
train$predict.score <- predict(tRF2,train, type="prob")
class(train$predict.score)
## [1] "matrix" "votes"

deciling

decile <- function(x){
  deciles <- vector(length=10)
  for (i in seq(0.1,1,.1)){
    deciles[i*10] <- quantile(x, i, na.rm=T)
  }
  return (
    ifelse(x<deciles[1], 1,
           ifelse(x<deciles[2], 2,
                  ifelse(x<deciles[3], 3,
                         ifelse(x<deciles[4], 4,
                                ifelse(x<deciles[5], 5,
                                       ifelse(x<deciles[6], 6,
                                              ifelse(x<deciles[7], 7,
                                                     ifelse(x<deciles[8], 8,
                                                            ifelse(x<deciles[9], 9, 10
                                                            ))))))))))
}


train$deciles <- decile(train$predict.score[,2])

Rank Ordering

library(data.table)
tmp_DT = data.table(train)
rank <- tmp_DT[, list(
  cnt = length(TARGET), 
  cnt_resp = sum(TARGET), 
  cnt_non_resp = sum(TARGET == 0)) , 
  by=deciles][order(-deciles)]
rank$rrate <- round (rank$cnt_resp / rank$cnt,2);
rank$cum_resp <- cumsum(rank$cnt_resp)
rank$cum_non_resp <- cumsum(rank$cnt_non_resp)
rank$cum_rel_resp <- round(rank$cum_resp / sum(rank$cnt_resp),2);
rank$cum_rel_non_resp <- round(rank$cum_non_resp / sum(rank$cnt_non_resp),2);
rank$ks <- abs(rank$cum_rel_resp - rank$cum_rel_non_resp);


library(scales)
## 
## Attaching package: 'scales'
## The following objects are masked from 'package:psych':
## 
##     alpha, rescale
rank$rrate <- percent(rank$rrate)
rank$cum_rel_resp <- percent(rank$cum_rel_resp)
rank$cum_rel_non_resp <- percent(rank$cum_rel_non_resp)

View(rank)
library(ROCR)
## Warning: package 'ROCR' was built under R version 3.4.3
## Loading required package: gplots
## Warning: package 'gplots' was built under R version 3.4.3
## 
## Attaching package: 'gplots'
## The following object is masked from 'package:stats':
## 
##     lowess
pred <- prediction(train$predict.score[,2], train$TARGET)
perf <- performance(pred, "tpr", "fpr")
KS <- max(attr(perf, 'y.values')[[1]]-attr(perf, 'x.values')[[1]])
KS
## [1] 0.7546218
perf
## An object of class "performance"
## Slot "x.name":
## [1] "False positive rate"
## 
## Slot "y.name":
## [1] "True positive rate"
## 
## Slot "alpha.name":
## [1] "Cutoff"
## 
## Slot "x.values":
## [[1]]
##   [1] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##   [6] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [11] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [16] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [21] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [26] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [31] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [36] 0.000000e+00 0.000000e+00 0.000000e+00 8.151288e-05 8.151288e-05
##  [41] 8.151288e-05 1.630258e-04 2.445386e-04 2.445386e-04 2.445386e-04
##  [46] 2.445386e-04 2.445386e-04 2.445386e-04 3.260515e-04 4.075644e-04
##  [51] 4.075644e-04 4.075644e-04 4.075644e-04 4.075644e-04 4.075644e-04
##  [56] 4.890773e-04 4.890773e-04 4.890773e-04 5.705902e-04 5.705902e-04
##  [61] 5.705902e-04 5.705902e-04 5.705902e-04 7.336159e-04 7.336159e-04
##  [66] 8.151288e-04 8.151288e-04 8.151288e-04 8.151288e-04 8.151288e-04
##  [71] 8.151288e-04 8.966417e-04 8.966417e-04 9.781545e-04 9.781545e-04
##  [76] 1.141180e-03 1.141180e-03 1.141180e-03 1.141180e-03 1.141180e-03
##  [81] 1.141180e-03 1.141180e-03 1.141180e-03 1.222693e-03 1.222693e-03
##  [86] 1.222693e-03 1.304206e-03 1.385719e-03 1.385719e-03 1.385719e-03
##  [91] 1.467232e-03 1.467232e-03 1.467232e-03 1.467232e-03 1.467232e-03
##  [96] 1.467232e-03 1.467232e-03 1.467232e-03 1.467232e-03 1.467232e-03
## [101] 1.467232e-03 1.467232e-03 1.467232e-03 1.548745e-03 1.630258e-03
## [106] 1.630258e-03 1.630258e-03 1.630258e-03 1.630258e-03 1.630258e-03
## [111] 1.711770e-03 1.711770e-03 1.956309e-03 1.956309e-03 1.956309e-03
## [116] 1.956309e-03 2.119335e-03 2.119335e-03 2.119335e-03 2.119335e-03
## [121] 2.200848e-03 2.200848e-03 2.282361e-03 2.445386e-03 2.445386e-03
## [126] 2.445386e-03 2.526899e-03 2.526899e-03 2.689925e-03 2.852951e-03
## [131] 2.852951e-03 2.852951e-03 3.015977e-03 3.342028e-03 3.423541e-03
## [136] 3.505054e-03 3.505054e-03 3.505054e-03 3.505054e-03 3.505054e-03
## [141] 3.505054e-03 3.505054e-03 3.505054e-03 3.505054e-03 3.586567e-03
## [146] 3.668080e-03 3.668080e-03 3.668080e-03 3.668080e-03 3.668080e-03
## [151] 3.668080e-03 3.668080e-03 3.668080e-03 3.668080e-03 3.668080e-03
## [156] 3.831105e-03 3.831105e-03 3.831105e-03 3.831105e-03 3.831105e-03
## [161] 3.831105e-03 3.912618e-03 4.238670e-03 4.320183e-03 4.320183e-03
## [166] 4.320183e-03 4.483208e-03 4.564721e-03 4.564721e-03 4.646234e-03
## [171] 4.646234e-03 4.646234e-03 4.727747e-03 4.809260e-03 4.809260e-03
## [176] 4.809260e-03 4.890773e-03 4.972286e-03 5.135311e-03 5.298337e-03
## [181] 5.461363e-03 5.542876e-03 5.624389e-03 5.950440e-03 6.194979e-03
## [186] 6.602543e-03 6.602543e-03 6.684056e-03 6.928595e-03 7.254646e-03
## [191] 7.336159e-03 7.662211e-03 7.743724e-03 8.151288e-03 8.232801e-03
## [196] 8.640365e-03 8.721878e-03 8.803391e-03 8.966417e-03 9.047930e-03
## [201] 9.129442e-03 9.373981e-03 9.537007e-03 9.618520e-03 9.700033e-03
## [206] 9.781545e-03 9.863058e-03 9.863058e-03 9.944571e-03 1.018911e-02
## [211] 1.035214e-02 1.059667e-02 1.116726e-02 1.124878e-02 1.141180e-02
## [216] 1.149332e-02 1.190088e-02 1.198239e-02 1.238996e-02 1.263450e-02
## [221] 1.271601e-02 1.312357e-02 1.344963e-02 1.393870e-02 1.418324e-02
## [226] 1.459081e-02 1.483534e-02 1.507988e-02 1.532442e-02 1.565047e-02
## [231] 1.589501e-02 1.646560e-02 1.662863e-02 1.744376e-02 1.817737e-02
## [236] 1.866645e-02 1.923704e-02 1.948158e-02 1.980763e-02 2.037822e-02
## [241] 2.086730e-02 2.184545e-02 2.257907e-02 2.266058e-02 2.282361e-02
## [246] 2.314966e-02 2.461689e-02 2.486143e-02 2.535051e-02 2.608412e-02
## [251] 2.657320e-02 2.804043e-02 2.918161e-02 2.975220e-02 3.089338e-02
## [256] 3.179002e-02 3.325725e-02 3.382784e-02 3.439843e-02 3.594718e-02
## [261] 3.716987e-02 3.798500e-02 3.904467e-02 4.034888e-02 4.165308e-02
## [266] 4.295729e-02 4.401695e-02 4.475057e-02 4.572873e-02 4.703293e-02
## [271] 4.817411e-02 4.988588e-02 5.119009e-02 5.273883e-02 5.396153e-02
## [276] 5.510271e-02 5.640691e-02 5.803717e-02 5.901532e-02 6.048256e-02
## [281] 6.170525e-02 6.260189e-02 6.496576e-02 6.708510e-02 6.977502e-02
## [286] 7.140528e-02 7.311705e-02 7.458428e-02 7.548093e-02 7.800783e-02
## [291] 8.020867e-02 8.289860e-02 8.518096e-02 8.697424e-02 9.072383e-02
## [296] 9.341376e-02 9.553309e-02 9.765243e-02 1.000163e-01 1.032768e-01
## [301] 1.076785e-01 1.113466e-01 1.147701e-01 1.184382e-01 1.226769e-01
## [306] 1.270786e-01 1.305836e-01 1.354744e-01 1.411803e-01 1.460711e-01
## [311] 1.526736e-01 1.586241e-01 1.642485e-01 1.696283e-01 1.781872e-01
## [316] 1.847897e-01 1.924519e-01 2.014183e-01 2.123410e-01 2.208999e-01
## [321] 2.316596e-01 2.451907e-01 2.552983e-01 2.698076e-01 2.865178e-01
## [326] 3.042876e-01 3.218128e-01 3.420280e-01 3.672970e-01 3.937072e-01
## [331] 4.231334e-01 4.575318e-01 4.968210e-01 5.454842e-01 6.054777e-01
## [336] 6.755787e-01 7.791816e-01 1.000000e+00
## 
## 
## Slot "y.values":
## [[1]]
##   [1] 0.000000000 0.002886836 0.003464203 0.005196305 0.008083141
##   [6] 0.009237875 0.009815242 0.010392610 0.010969977 0.012124711
##  [11] 0.013856813 0.014434180 0.015588915 0.016166282 0.018475751
##  [16] 0.020785219 0.021362587 0.021939954 0.022517321 0.025981524
##  [21] 0.026558891 0.027136259 0.029445727 0.030600462 0.031177829
##  [26] 0.031755196 0.032332564 0.032909931 0.034064665 0.034642032
##  [31] 0.035219400 0.037528868 0.040993072 0.041570439 0.042725173
##  [36] 0.044457275 0.047921478 0.048498845 0.050808314 0.052540416
##  [41] 0.054849885 0.054849885 0.056004619 0.056581986 0.057736721
##  [46] 0.058314088 0.058891455 0.060046189 0.060623557 0.061778291
##  [51] 0.062355658 0.062933025 0.063510393 0.064665127 0.065819861
##  [56] 0.065819861 0.066397229 0.066974596 0.068706697 0.069284065
##  [61] 0.069861432 0.071016166 0.071593533 0.073325635 0.074480370
##  [66] 0.075057737 0.075635104 0.077367206 0.078521940 0.081408776
##  [71] 0.081986143 0.083718245 0.084872979 0.088337182 0.089491917
##  [76] 0.089491917 0.090646651 0.092956120 0.093533487 0.094688222
##  [81] 0.095265589 0.095842956 0.097575058 0.098152425 0.098729792
##  [86] 0.100461894 0.102771363 0.103348730 0.106235566 0.107967667
##  [91] 0.107967667 0.112009238 0.113163972 0.117205543 0.117782910
##  [96] 0.118937644 0.119515012 0.121247113 0.123556582 0.124711316
## [101] 0.125288684 0.126443418 0.127020785 0.128752887 0.131062356
## [106] 0.132217090 0.134526559 0.135681293 0.136258661 0.139722864
## [111] 0.140877598 0.142032333 0.142032333 0.142609700 0.144919169
## [116] 0.146651270 0.146651270 0.148960739 0.151270208 0.152424942
## [121] 0.152424942 0.153002309 0.155311778 0.157621247 0.158775982
## [126] 0.162240185 0.163394919 0.163972286 0.168591224 0.169745958
## [131] 0.171478060 0.176096998 0.178983834 0.181293303 0.184180139
## [136] 0.185334873 0.185912240 0.187644342 0.188221709 0.192263279
## [141] 0.195150115 0.196304850 0.197459584 0.198614319 0.199769053
## [146] 0.199769053 0.203233256 0.206120092 0.207852194 0.210161663
## [151] 0.211893764 0.214203233 0.217090069 0.218822171 0.219399538
## [156] 0.221709007 0.223441109 0.224595843 0.225173210 0.227482679
## [161] 0.232101617 0.233833718 0.236143187 0.237297921 0.239607390
## [166] 0.242494226 0.248845266 0.252309469 0.254618938 0.258083141
## [171] 0.261547344 0.267898383 0.270785219 0.273094688 0.276558891
## [176] 0.279445727 0.285796767 0.290993072 0.293879908 0.300230947
## [181] 0.306581986 0.308891455 0.313510393 0.316397229 0.318129330
## [186] 0.320438799 0.322748268 0.325635104 0.325635104 0.331408776
## [191] 0.337182448 0.340646651 0.341801386 0.343533487 0.344688222
## [196] 0.346997691 0.351039261 0.356235566 0.358545035 0.360277136
## [201] 0.361431871 0.362586605 0.367205543 0.370669746 0.375866051
## [206] 0.380484988 0.381639723 0.383949192 0.387413395 0.390877598
## [211] 0.392032333 0.397228637 0.400115473 0.404734411 0.406466513
## [216] 0.412817552 0.418013857 0.419745958 0.428406467 0.431293303
## [221] 0.433602771 0.438799076 0.442840647 0.443995381 0.448036952
## [226] 0.451501155 0.455542725 0.464780600 0.468244804 0.477482679
## [231] 0.483256351 0.487875289 0.491339492 0.495381062 0.499422633
## [236] 0.501154734 0.502886836 0.506351039 0.508660508 0.509237875
## [241] 0.513856813 0.515011547 0.521362587 0.525981524 0.531177829
## [246] 0.535796767 0.540993072 0.550230947 0.554849885 0.564087760
## [251] 0.568129330 0.575057737 0.577944573 0.581986143 0.587182448
## [256] 0.591801386 0.595265589 0.599307159 0.600461894 0.602771363
## [261] 0.608545035 0.613741339 0.623556582 0.631639723 0.636258661
## [266] 0.643187067 0.647806005 0.656466513 0.661085450 0.665704388
## [271] 0.670900693 0.678983834 0.686489607 0.691685912 0.699769053
## [276] 0.706697460 0.710739030 0.713048499 0.715935335 0.721131640
## [281] 0.725750577 0.732101617 0.737297921 0.742494226 0.749422633
## [286] 0.753464203 0.756351039 0.758660508 0.762702079 0.767898383
## [291] 0.772517321 0.777713626 0.782909931 0.790993072 0.798498845
## [296] 0.808314088 0.813510393 0.821016166 0.829099307 0.834872979
## [301] 0.840069284 0.851039261 0.859699769 0.867782910 0.871824480
## [306] 0.876443418 0.882794457 0.886258661 0.894919169 0.900692841
## [311] 0.904734411 0.909353349 0.911662818 0.919168591 0.924942263
## [316] 0.931870670 0.937066975 0.941685912 0.949769053 0.954387991
## [321] 0.960739030 0.963048499 0.966512702 0.974018476 0.976905312
## [326] 0.980946882 0.984411085 0.987875289 0.990762125 0.992494226
## [331] 0.994803695 0.995958430 0.997690531 0.997690531 0.998267898
## [336] 0.998845266 0.999422633 1.000000000
## 
## 
## Slot "alpha.values":
## [[1]]
##   [1]   Inf 0.950 0.876 0.874 0.856 0.852 0.838 0.836 0.808 0.802 0.800
##  [12] 0.794 0.766 0.756 0.752 0.748 0.746 0.740 0.736 0.732 0.730 0.726
##  [23] 0.724 0.722 0.720 0.718 0.714 0.712 0.710 0.708 0.706 0.704 0.702
##  [34] 0.698 0.694 0.688 0.686 0.684 0.682 0.680 0.678 0.668 0.664 0.656
##  [45] 0.652 0.646 0.644 0.640 0.638 0.636 0.634 0.628 0.624 0.622 0.620
##  [56] 0.618 0.616 0.614 0.612 0.610 0.608 0.606 0.604 0.588 0.586 0.584
##  [67] 0.582 0.580 0.578 0.576 0.574 0.572 0.570 0.566 0.564 0.562 0.560
##  [78] 0.558 0.554 0.552 0.550 0.548 0.546 0.544 0.538 0.532 0.530 0.526
##  [89] 0.522 0.520 0.518 0.512 0.510 0.508 0.504 0.502 0.500 0.498 0.496
## [100] 0.490 0.488 0.486 0.484 0.482 0.480 0.476 0.474 0.472 0.470 0.468
## [111] 0.466 0.462 0.460 0.458 0.456 0.454 0.452 0.448 0.446 0.442 0.440
## [122] 0.438 0.436 0.434 0.432 0.430 0.428 0.426 0.422 0.420 0.418 0.416
## [133] 0.414 0.412 0.410 0.408 0.406 0.404 0.402 0.400 0.398 0.396 0.394
## [144] 0.392 0.390 0.388 0.386 0.384 0.382 0.380 0.378 0.376 0.374 0.372
## [155] 0.370 0.368 0.366 0.364 0.362 0.360 0.358 0.356 0.354 0.352 0.346
## [166] 0.344 0.342 0.340 0.338 0.336 0.334 0.332 0.330 0.328 0.326 0.324
## [177] 0.322 0.320 0.318 0.316 0.314 0.312 0.310 0.308 0.306 0.304 0.302
## [188] 0.300 0.298 0.296 0.294 0.292 0.290 0.288 0.286 0.284 0.282 0.280
## [199] 0.278 0.276 0.274 0.272 0.270 0.268 0.266 0.264 0.262 0.260 0.258
## [210] 0.256 0.254 0.252 0.250 0.248 0.246 0.244 0.242 0.240 0.238 0.236
## [221] 0.234 0.232 0.230 0.228 0.226 0.224 0.222 0.220 0.218 0.216 0.214
## [232] 0.212 0.210 0.208 0.206 0.204 0.202 0.200 0.198 0.196 0.194 0.192
## [243] 0.190 0.188 0.186 0.184 0.182 0.180 0.178 0.176 0.174 0.172 0.170
## [254] 0.168 0.166 0.164 0.162 0.160 0.158 0.156 0.154 0.152 0.150 0.148
## [265] 0.146 0.144 0.142 0.140 0.138 0.136 0.134 0.132 0.130 0.128 0.126
## [276] 0.124 0.122 0.120 0.118 0.116 0.114 0.112 0.110 0.108 0.106 0.104
## [287] 0.102 0.100 0.098 0.096 0.094 0.092 0.090 0.088 0.086 0.084 0.082
## [298] 0.080 0.078 0.076 0.074 0.072 0.070 0.068 0.066 0.064 0.062 0.060
## [309] 0.058 0.056 0.054 0.052 0.050 0.048 0.046 0.044 0.042 0.040 0.038
## [320] 0.036 0.034 0.032 0.030 0.028 0.026 0.024 0.022 0.020 0.018 0.016
## [331] 0.014 0.012 0.010 0.008 0.006 0.004 0.002 0.000

Lift chart

perf1 <- performance(pred,"lift","rpp")
plot(perf1, main="lift curve", colorize=T)

LC <- max(attr(perf1, 'y.values')[[1]]-attr(perf1, 'x.values')[[1]])
LC
## [1] NaN

Area Under Curve

auc <- performance(pred,"auc"); 
auc <- as.numeric(auc@y.values)
auc
## [1] 0.947142
plot(perf)

Scoring syntax

test$predict.class <- predict(tRF2,test, type="class")
test$predict.score <- predict(tRF2,test, type="prob")
class(train$predict.score)
## [1] "matrix" "votes"

Confusion matrix

pred1 <- predict(tRF2, test)
cm1 <- table(Predict = pred1, actual = test$TARGET)
cm1
##        actual
## Predict    0    1
##       0 5198  698
##       1   22   82

Deciling the test data

decile <- function(x){
  deciles <- vector(length=10)
  for (i in seq(0.1,1,.1)){
    deciles[i*10] <- quantile(x, i, na.rm=T)
  }
  return (
    ifelse(x<deciles[1], 1,
           ifelse(x<deciles[2], 2,
                  ifelse(x<deciles[3], 3,
                         ifelse(x<deciles[4], 4,
                                ifelse(x<deciles[5], 5,
                                       ifelse(x<deciles[6], 6,
                                              ifelse(x<deciles[7], 7,
                                                     ifelse(x<deciles[8], 8,
                                                            ifelse(x<deciles[9], 9, 10
                                                            ))))))))))
}
test$deciles <- decile(test$predict.score[,2])

Rank Ordering

library(data.table)
tmp_DT1 = data.table(test)
rank1 <- tmp_DT1[, list(
  cnt = length(TARGET), 
  cnt_resp = sum(TARGET), 
  cnt_non_resp = sum(TARGET == 0)) , 
  by=deciles][order(-deciles)]
rank1$rrate <- round (rank1$cnt_resp / rank1$cnt,2);
rank1$cum_resp <- cumsum(rank1$cnt_resp)
rank1$cum_non_resp <- cumsum(rank1$cnt_non_resp)
rank1$cum_rel_resp <- round(rank1$cum_resp / sum(rank1$cnt_resp),2);
rank1$cum_rel_non_resp <- round(rank1$cum_non_resp / sum(rank1$cnt_non_resp),2);
rank1$ks <- abs(rank1$cum_rel_resp - rank1$cum_rel_non_resp);


library(scales)
rank1$rrate <- percent(rank1$rrate)
rank1$cum_rel_resp <- percent(rank1$cum_rel_resp)
rank1$cum_rel_non_resp <- percent(rank1$cum_rel_non_resp)
View(rank1)

KS

pred2 <- prediction(test$predict.score[,2], test$TARGET)
perf2 <- performance(pred2, "tpr", "fpr")
KS2 <- max(attr(perf2, 'y.values')[[1]]-attr(perf2, 'x.values')[[1]])
KS2
## [1] 0.6102122
perf
## An object of class "performance"
## Slot "x.name":
## [1] "False positive rate"
## 
## Slot "y.name":
## [1] "True positive rate"
## 
## Slot "alpha.name":
## [1] "Cutoff"
## 
## Slot "x.values":
## [[1]]
##   [1] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##   [6] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [11] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [16] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [21] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [26] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [31] 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00
##  [36] 0.000000e+00 0.000000e+00 0.000000e+00 8.151288e-05 8.151288e-05
##  [41] 8.151288e-05 1.630258e-04 2.445386e-04 2.445386e-04 2.445386e-04
##  [46] 2.445386e-04 2.445386e-04 2.445386e-04 3.260515e-04 4.075644e-04
##  [51] 4.075644e-04 4.075644e-04 4.075644e-04 4.075644e-04 4.075644e-04
##  [56] 4.890773e-04 4.890773e-04 4.890773e-04 5.705902e-04 5.705902e-04
##  [61] 5.705902e-04 5.705902e-04 5.705902e-04 7.336159e-04 7.336159e-04
##  [66] 8.151288e-04 8.151288e-04 8.151288e-04 8.151288e-04 8.151288e-04
##  [71] 8.151288e-04 8.966417e-04 8.966417e-04 9.781545e-04 9.781545e-04
##  [76] 1.141180e-03 1.141180e-03 1.141180e-03 1.141180e-03 1.141180e-03
##  [81] 1.141180e-03 1.141180e-03 1.141180e-03 1.222693e-03 1.222693e-03
##  [86] 1.222693e-03 1.304206e-03 1.385719e-03 1.385719e-03 1.385719e-03
##  [91] 1.467232e-03 1.467232e-03 1.467232e-03 1.467232e-03 1.467232e-03
##  [96] 1.467232e-03 1.467232e-03 1.467232e-03 1.467232e-03 1.467232e-03
## [101] 1.467232e-03 1.467232e-03 1.467232e-03 1.548745e-03 1.630258e-03
## [106] 1.630258e-03 1.630258e-03 1.630258e-03 1.630258e-03 1.630258e-03
## [111] 1.711770e-03 1.711770e-03 1.956309e-03 1.956309e-03 1.956309e-03
## [116] 1.956309e-03 2.119335e-03 2.119335e-03 2.119335e-03 2.119335e-03
## [121] 2.200848e-03 2.200848e-03 2.282361e-03 2.445386e-03 2.445386e-03
## [126] 2.445386e-03 2.526899e-03 2.526899e-03 2.689925e-03 2.852951e-03
## [131] 2.852951e-03 2.852951e-03 3.015977e-03 3.342028e-03 3.423541e-03
## [136] 3.505054e-03 3.505054e-03 3.505054e-03 3.505054e-03 3.505054e-03
## [141] 3.505054e-03 3.505054e-03 3.505054e-03 3.505054e-03 3.586567e-03
## [146] 3.668080e-03 3.668080e-03 3.668080e-03 3.668080e-03 3.668080e-03
## [151] 3.668080e-03 3.668080e-03 3.668080e-03 3.668080e-03 3.668080e-03
## [156] 3.831105e-03 3.831105e-03 3.831105e-03 3.831105e-03 3.831105e-03
## [161] 3.831105e-03 3.912618e-03 4.238670e-03 4.320183e-03 4.320183e-03
## [166] 4.320183e-03 4.483208e-03 4.564721e-03 4.564721e-03 4.646234e-03
## [171] 4.646234e-03 4.646234e-03 4.727747e-03 4.809260e-03 4.809260e-03
## [176] 4.809260e-03 4.890773e-03 4.972286e-03 5.135311e-03 5.298337e-03
## [181] 5.461363e-03 5.542876e-03 5.624389e-03 5.950440e-03 6.194979e-03
## [186] 6.602543e-03 6.602543e-03 6.684056e-03 6.928595e-03 7.254646e-03
## [191] 7.336159e-03 7.662211e-03 7.743724e-03 8.151288e-03 8.232801e-03
## [196] 8.640365e-03 8.721878e-03 8.803391e-03 8.966417e-03 9.047930e-03
## [201] 9.129442e-03 9.373981e-03 9.537007e-03 9.618520e-03 9.700033e-03
## [206] 9.781545e-03 9.863058e-03 9.863058e-03 9.944571e-03 1.018911e-02
## [211] 1.035214e-02 1.059667e-02 1.116726e-02 1.124878e-02 1.141180e-02
## [216] 1.149332e-02 1.190088e-02 1.198239e-02 1.238996e-02 1.263450e-02
## [221] 1.271601e-02 1.312357e-02 1.344963e-02 1.393870e-02 1.418324e-02
## [226] 1.459081e-02 1.483534e-02 1.507988e-02 1.532442e-02 1.565047e-02
## [231] 1.589501e-02 1.646560e-02 1.662863e-02 1.744376e-02 1.817737e-02
## [236] 1.866645e-02 1.923704e-02 1.948158e-02 1.980763e-02 2.037822e-02
## [241] 2.086730e-02 2.184545e-02 2.257907e-02 2.266058e-02 2.282361e-02
## [246] 2.314966e-02 2.461689e-02 2.486143e-02 2.535051e-02 2.608412e-02
## [251] 2.657320e-02 2.804043e-02 2.918161e-02 2.975220e-02 3.089338e-02
## [256] 3.179002e-02 3.325725e-02 3.382784e-02 3.439843e-02 3.594718e-02
## [261] 3.716987e-02 3.798500e-02 3.904467e-02 4.034888e-02 4.165308e-02
## [266] 4.295729e-02 4.401695e-02 4.475057e-02 4.572873e-02 4.703293e-02
## [271] 4.817411e-02 4.988588e-02 5.119009e-02 5.273883e-02 5.396153e-02
## [276] 5.510271e-02 5.640691e-02 5.803717e-02 5.901532e-02 6.048256e-02
## [281] 6.170525e-02 6.260189e-02 6.496576e-02 6.708510e-02 6.977502e-02
## [286] 7.140528e-02 7.311705e-02 7.458428e-02 7.548093e-02 7.800783e-02
## [291] 8.020867e-02 8.289860e-02 8.518096e-02 8.697424e-02 9.072383e-02
## [296] 9.341376e-02 9.553309e-02 9.765243e-02 1.000163e-01 1.032768e-01
## [301] 1.076785e-01 1.113466e-01 1.147701e-01 1.184382e-01 1.226769e-01
## [306] 1.270786e-01 1.305836e-01 1.354744e-01 1.411803e-01 1.460711e-01
## [311] 1.526736e-01 1.586241e-01 1.642485e-01 1.696283e-01 1.781872e-01
## [316] 1.847897e-01 1.924519e-01 2.014183e-01 2.123410e-01 2.208999e-01
## [321] 2.316596e-01 2.451907e-01 2.552983e-01 2.698076e-01 2.865178e-01
## [326] 3.042876e-01 3.218128e-01 3.420280e-01 3.672970e-01 3.937072e-01
## [331] 4.231334e-01 4.575318e-01 4.968210e-01 5.454842e-01 6.054777e-01
## [336] 6.755787e-01 7.791816e-01 1.000000e+00
## 
## 
## Slot "y.values":
## [[1]]
##   [1] 0.000000000 0.002886836 0.003464203 0.005196305 0.008083141
##   [6] 0.009237875 0.009815242 0.010392610 0.010969977 0.012124711
##  [11] 0.013856813 0.014434180 0.015588915 0.016166282 0.018475751
##  [16] 0.020785219 0.021362587 0.021939954 0.022517321 0.025981524
##  [21] 0.026558891 0.027136259 0.029445727 0.030600462 0.031177829
##  [26] 0.031755196 0.032332564 0.032909931 0.034064665 0.034642032
##  [31] 0.035219400 0.037528868 0.040993072 0.041570439 0.042725173
##  [36] 0.044457275 0.047921478 0.048498845 0.050808314 0.052540416
##  [41] 0.054849885 0.054849885 0.056004619 0.056581986 0.057736721
##  [46] 0.058314088 0.058891455 0.060046189 0.060623557 0.061778291
##  [51] 0.062355658 0.062933025 0.063510393 0.064665127 0.065819861
##  [56] 0.065819861 0.066397229 0.066974596 0.068706697 0.069284065
##  [61] 0.069861432 0.071016166 0.071593533 0.073325635 0.074480370
##  [66] 0.075057737 0.075635104 0.077367206 0.078521940 0.081408776
##  [71] 0.081986143 0.083718245 0.084872979 0.088337182 0.089491917
##  [76] 0.089491917 0.090646651 0.092956120 0.093533487 0.094688222
##  [81] 0.095265589 0.095842956 0.097575058 0.098152425 0.098729792
##  [86] 0.100461894 0.102771363 0.103348730 0.106235566 0.107967667
##  [91] 0.107967667 0.112009238 0.113163972 0.117205543 0.117782910
##  [96] 0.118937644 0.119515012 0.121247113 0.123556582 0.124711316
## [101] 0.125288684 0.126443418 0.127020785 0.128752887 0.131062356
## [106] 0.132217090 0.134526559 0.135681293 0.136258661 0.139722864
## [111] 0.140877598 0.142032333 0.142032333 0.142609700 0.144919169
## [116] 0.146651270 0.146651270 0.148960739 0.151270208 0.152424942
## [121] 0.152424942 0.153002309 0.155311778 0.157621247 0.158775982
## [126] 0.162240185 0.163394919 0.163972286 0.168591224 0.169745958
## [131] 0.171478060 0.176096998 0.178983834 0.181293303 0.184180139
## [136] 0.185334873 0.185912240 0.187644342 0.188221709 0.192263279
## [141] 0.195150115 0.196304850 0.197459584 0.198614319 0.199769053
## [146] 0.199769053 0.203233256 0.206120092 0.207852194 0.210161663
## [151] 0.211893764 0.214203233 0.217090069 0.218822171 0.219399538
## [156] 0.221709007 0.223441109 0.224595843 0.225173210 0.227482679
## [161] 0.232101617 0.233833718 0.236143187 0.237297921 0.239607390
## [166] 0.242494226 0.248845266 0.252309469 0.254618938 0.258083141
## [171] 0.261547344 0.267898383 0.270785219 0.273094688 0.276558891
## [176] 0.279445727 0.285796767 0.290993072 0.293879908 0.300230947
## [181] 0.306581986 0.308891455 0.313510393 0.316397229 0.318129330
## [186] 0.320438799 0.322748268 0.325635104 0.325635104 0.331408776
## [191] 0.337182448 0.340646651 0.341801386 0.343533487 0.344688222
## [196] 0.346997691 0.351039261 0.356235566 0.358545035 0.360277136
## [201] 0.361431871 0.362586605 0.367205543 0.370669746 0.375866051
## [206] 0.380484988 0.381639723 0.383949192 0.387413395 0.390877598
## [211] 0.392032333 0.397228637 0.400115473 0.404734411 0.406466513
## [216] 0.412817552 0.418013857 0.419745958 0.428406467 0.431293303
## [221] 0.433602771 0.438799076 0.442840647 0.443995381 0.448036952
## [226] 0.451501155 0.455542725 0.464780600 0.468244804 0.477482679
## [231] 0.483256351 0.487875289 0.491339492 0.495381062 0.499422633
## [236] 0.501154734 0.502886836 0.506351039 0.508660508 0.509237875
## [241] 0.513856813 0.515011547 0.521362587 0.525981524 0.531177829
## [246] 0.535796767 0.540993072 0.550230947 0.554849885 0.564087760
## [251] 0.568129330 0.575057737 0.577944573 0.581986143 0.587182448
## [256] 0.591801386 0.595265589 0.599307159 0.600461894 0.602771363
## [261] 0.608545035 0.613741339 0.623556582 0.631639723 0.636258661
## [266] 0.643187067 0.647806005 0.656466513 0.661085450 0.665704388
## [271] 0.670900693 0.678983834 0.686489607 0.691685912 0.699769053
## [276] 0.706697460 0.710739030 0.713048499 0.715935335 0.721131640
## [281] 0.725750577 0.732101617 0.737297921 0.742494226 0.749422633
## [286] 0.753464203 0.756351039 0.758660508 0.762702079 0.767898383
## [291] 0.772517321 0.777713626 0.782909931 0.790993072 0.798498845
## [296] 0.808314088 0.813510393 0.821016166 0.829099307 0.834872979
## [301] 0.840069284 0.851039261 0.859699769 0.867782910 0.871824480
## [306] 0.876443418 0.882794457 0.886258661 0.894919169 0.900692841
## [311] 0.904734411 0.909353349 0.911662818 0.919168591 0.924942263
## [316] 0.931870670 0.937066975 0.941685912 0.949769053 0.954387991
## [321] 0.960739030 0.963048499 0.966512702 0.974018476 0.976905312
## [326] 0.980946882 0.984411085 0.987875289 0.990762125 0.992494226
## [331] 0.994803695 0.995958430 0.997690531 0.997690531 0.998267898
## [336] 0.998845266 0.999422633 1.000000000
## 
## 
## Slot "alpha.values":
## [[1]]
##   [1]   Inf 0.950 0.876 0.874 0.856 0.852 0.838 0.836 0.808 0.802 0.800
##  [12] 0.794 0.766 0.756 0.752 0.748 0.746 0.740 0.736 0.732 0.730 0.726
##  [23] 0.724 0.722 0.720 0.718 0.714 0.712 0.710 0.708 0.706 0.704 0.702
##  [34] 0.698 0.694 0.688 0.686 0.684 0.682 0.680 0.678 0.668 0.664 0.656
##  [45] 0.652 0.646 0.644 0.640 0.638 0.636 0.634 0.628 0.624 0.622 0.620
##  [56] 0.618 0.616 0.614 0.612 0.610 0.608 0.606 0.604 0.588 0.586 0.584
##  [67] 0.582 0.580 0.578 0.576 0.574 0.572 0.570 0.566 0.564 0.562 0.560
##  [78] 0.558 0.554 0.552 0.550 0.548 0.546 0.544 0.538 0.532 0.530 0.526
##  [89] 0.522 0.520 0.518 0.512 0.510 0.508 0.504 0.502 0.500 0.498 0.496
## [100] 0.490 0.488 0.486 0.484 0.482 0.480 0.476 0.474 0.472 0.470 0.468
## [111] 0.466 0.462 0.460 0.458 0.456 0.454 0.452 0.448 0.446 0.442 0.440
## [122] 0.438 0.436 0.434 0.432 0.430 0.428 0.426 0.422 0.420 0.418 0.416
## [133] 0.414 0.412 0.410 0.408 0.406 0.404 0.402 0.400 0.398 0.396 0.394
## [144] 0.392 0.390 0.388 0.386 0.384 0.382 0.380 0.378 0.376 0.374 0.372
## [155] 0.370 0.368 0.366 0.364 0.362 0.360 0.358 0.356 0.354 0.352 0.346
## [166] 0.344 0.342 0.340 0.338 0.336 0.334 0.332 0.330 0.328 0.326 0.324
## [177] 0.322 0.320 0.318 0.316 0.314 0.312 0.310 0.308 0.306 0.304 0.302
## [188] 0.300 0.298 0.296 0.294 0.292 0.290 0.288 0.286 0.284 0.282 0.280
## [199] 0.278 0.276 0.274 0.272 0.270 0.268 0.266 0.264 0.262 0.260 0.258
## [210] 0.256 0.254 0.252 0.250 0.248 0.246 0.244 0.242 0.240 0.238 0.236
## [221] 0.234 0.232 0.230 0.228 0.226 0.224 0.222 0.220 0.218 0.216 0.214
## [232] 0.212 0.210 0.208 0.206 0.204 0.202 0.200 0.198 0.196 0.194 0.192
## [243] 0.190 0.188 0.186 0.184 0.182 0.180 0.178 0.176 0.174 0.172 0.170
## [254] 0.168 0.166 0.164 0.162 0.160 0.158 0.156 0.154 0.152 0.150 0.148
## [265] 0.146 0.144 0.142 0.140 0.138 0.136 0.134 0.132 0.130 0.128 0.126
## [276] 0.124 0.122 0.120 0.118 0.116 0.114 0.112 0.110 0.108 0.106 0.104
## [287] 0.102 0.100 0.098 0.096 0.094 0.092 0.090 0.088 0.086 0.084 0.082
## [298] 0.080 0.078 0.076 0.074 0.072 0.070 0.068 0.066 0.064 0.062 0.060
## [309] 0.058 0.056 0.054 0.052 0.050 0.048 0.046 0.044 0.042 0.040 0.038
## [320] 0.036 0.034 0.032 0.030 0.028 0.026 0.024 0.022 0.020 0.018 0.016
## [331] 0.014 0.012 0.010 0.008 0.006 0.004 0.002 0.000

Lift chart

perf3 <- performance(pred2,"lift","rpp")

Area Under Curve

auc <- performance(pred2,"auc"); 
auc <- as.numeric(auc@y.values)
auc
## [1] 0.8727702
plot(perf2)