Peijun
# Directory containing the input CSV files (machine-specific; adjust locally).
PATH <- "E:/kkbox/"
# Load the raw training data. Empty fields are read as NA, and character
# columns are kept as character rather than converted to factors.
raw_train <- fread(
  paste0(PATH, "raw_train.csv"),
  sep = ",",
  na.strings = "",
  # Spelled out as FALSE: `F` is an ordinary variable that can be reassigned.
  stringsAsFactors = FALSE
)
Read 44.5% of 1259066 rows
Read 68.3% of 1259066 rows
Read 96.9% of 1259066 rows
Read 1259066 rows and 28 (of 28) columns from 0.158 GB file in 00:00:05
Descriptive plots
1. payment_method and is_churn

## is_churn
## 0 1
## 1185333 73733
2. is_duplicate and is_churn

## is_duplicate
## is_churn 0 1
## 0 0.06515806 0.93484194
## 1 0.72266149 0.27733851
3. registered_via and is_churn

## registered_via
## is_churn 13 3 4 7 9
## 0 0.0004867830 0.0197902193 0.0075371225 0.1037320314 0.0502010827
## 1 0.0008137469 0.0409721563 0.0252532787 0.0498691224 0.0645708163
## registered_via
## is_churn NA
## 0 0.8182527610
## 1 0.8185208794
4. is_auto_renew and is_churn

## is_auto_renew
## is_churn 0 1 NA
## 0 0.03980654 0.58394223 0.37625123
## 1 0.14742381 0.30714877 0.54542742