Peijun

# Directory that holds the input CSV files. The trailing slash matters:
# file names are appended to it with paste0() below.
PATH <- "E:/kkbox/"
# Load the training data. Empty fields are read as NA and character columns
# stay character instead of being converted to factors.
# FALSE is spelled out because `F` is an ordinary variable that can be
# reassigned, whereas FALSE is a reserved constant.
raw_train <- fread(
  paste0(PATH, "raw_train.csv"),
  sep = ",",
  na.strings = "",
  stringsAsFactors = FALSE
)

Read 44.5% of 1259066 rows
Read 68.3% of 1259066 rows
Read 96.9% of 1259066 rows
Read 1259066 rows and 28 (of 28) columns from 0.158 GB file in 00:00:05

Descriptive plots

1. payment_method and is_churn

## is_churn
##       0       1 
## 1185333   73733

2. is_duplicate and is_churn

##         is_duplicate
## is_churn          0          1
##        0 0.06515806 0.93484194
##        1 0.72266149 0.27733851

3. registered_via and is_churn

##         registered_via
## is_churn           13            3            4            7            9
##        0 0.0004867830 0.0197902193 0.0075371225 0.1037320314 0.0502010827
##        1 0.0008137469 0.0409721563 0.0252532787 0.0498691224 0.0645708163
##         registered_via
## is_churn           NA
##        0 0.8182527610
##        1 0.8185208794

4. is_auto_renew and is_churn

##         is_auto_renew
## is_churn          0          1         NA
##        0 0.03980654 0.58394223 0.37625123
##        1 0.14742381 0.30714877 0.54542742