library(ggplot2)
library(plotly)
##
## Attaching package: 'plotly'
## The following object is masked from 'package:ggplot2':
##
## last_plot
## The following object is masked from 'package:stats':
##
## filter
## The following object is masked from 'package:graphics':
##
## layout
library(readr)
library(dplyr)
##
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
##
## filter, lag
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
# Load the raw data set into `default`.
# NOTE(review): the path is absolute and machine-specific, so the script only
# runs where this exact file location exists.
# When this was last run, readr reported `.default = col_integer()` as the
# column specification, i.e. the columns were parsed as integers.
default <- read_csv(file = "D:/RMIT/Data-Visualisation/R/default.csv")
# Recode the numeric EDUCATION codes into descriptive labels. The column
# becomes character: 1 -> "Graduate school", 2 -> "University",
# 3 -> "High school", and 0, 4, 5, 6 are all collapsed into "Others".
# Any other value is kept as its text representation; NA stays NA.
default$EDUCATION <- local({
  codes <- default$EDUCATION
  labels <- as.character(codes)
  labels[codes %in% 1] <- "Graduate school"
  labels[codes %in% 2] <- "University"
  labels[codes %in% 3] <- "High school"
  labels[codes %in% c(0, 4, 5, 6)] <- "Others"
  labels
})
# Recode the numeric MARRIAGE codes into descriptive labels. The column
# becomes character: 1 -> "Married", 2 -> "Single", 0 and 3 -> "Other".
# Any other value is kept as its text representation; NA stays NA.
# Earlier factor-based variant, kept commented out for reference:
#default$MARRIAGE <- factor(default$MARRIAGE, levels=c(1,2,0,3),labels = c("married","single",0,"other"),ordered = TRUE)
default$MARRIAGE <- local({
  codes <- default$MARRIAGE
  labels <- as.character(codes)
  labels[codes %in% 1] <- "Married"
  labels[codes %in% 2] <- "Single"
  labels[codes %in% c(0, 3)] <- "Other"
  labels
})
# Recode the six repayment-status columns (PAY_0, PAY_2 ... PAY_6) from
# numeric codes into descriptive labels; each column becomes character.
#   -2, -1, 0 -> "pay<tag> duly"
#   1 ... 8   -> "payment<tag> delay for <n> month(s)"
# PAY_2 and PAY_3 carry the tags "2" and "3"; the other columns have no tag.
# Any other value is kept as its text representation; NA stays NA.
# NOTE(review): the tagged labels for PAY_2/PAY_3 differ from the other
# columns -- presumably deliberate so those labels stay distinct; confirm.
default <- local({
  month_words <- c(
    "one", "two", "three", "four", "five", "six", "seven", "eight"
  )
  label_tags <- c(
    PAY_0 = "", PAY_2 = "2", PAY_3 = "3",
    PAY_4 = "", PAY_5 = "", PAY_6 = ""
  )

  # Map one column of status codes to its labels, using `tag` as the
  # column-specific infix.
  recode_pay <- function(codes, tag) {
    labels <- as.character(codes)
    labels[codes %in% c(-2, -1, 0)] <- paste0("pay", tag, " duly")
    for (k in seq_along(month_words)) {
      unit <- if (k == 1L) "month" else "months"
      labels[codes %in% k] <- paste0(
        "payment", tag, " delay for ", month_words[k], " ", unit
      )
    }
    labels
  }

  recoded <- default
  for (column in names(label_tags)) {
    recoded[[column]] <- recode_pay(recoded[[column]], label_tags[[column]])
  }
  recoded
})
# Bin AGE into ten-year groups and store the label in a new character column
# AGE_GROUP: [20, 30) -> "20-29", [30, 40) -> "30-39", ... [70, 80) -> "70-79".
# Ages outside 20-79 (and missing ages) get NA.
# The column is created in a single assignment with cut() instead of being
# filled piecewise, which avoids indexing into a column that does not exist
# yet (the source of the "Unknown or uninitialised column" warning).
default$AGE_GROUP <- as.character(cut(
  default$AGE,
  breaks = seq(20, 80, by = 10),
  labels = c("20-29", "30-39", "40-49", "50-59", "60-69", "70-79"),
  right = FALSE # intervals are closed on the left: 30 falls in "30-39"
))
# Convert the categorical columns to ordered factors with an explicit level
# order.
#   default:   1 -> "Yes", 0 -> "No"
#   SEX:       1 -> "Male", 2 -> "Female"
#   EDUCATION: "Graduate school" < "University" < "High school" < "Others"
#   MARRIAGE:  "Married" < "Single" < "Other"
# `ordered = TRUE` must be an argument of factor(), not an element of the
# levels vector: inside c(...) it becomes an extra level "TRUE" and the
# factor is left unordered.
default$default <- factor(
  default$default,
  levels = c(1, 0),
  labels = c("Yes", "No"),
  ordered = TRUE
)
default$SEX <- factor(
  default$SEX,
  levels = c(1, 2),
  labels = c("Male", "Female"),
  ordered = TRUE
)
default$EDUCATION <- factor(
  default$EDUCATION,
  levels = c("Graduate school", "University", "High school", "Others"),
  ordered = TRUE
)
default$MARRIAGE <- factor(
  default$MARRIAGE,
  levels = c("Married", "Single", "Other"),
  ordered = TRUE
)
# Font settings used by the title annotation below.
f <- list(family = "Courier New, monospace", size = 18, color = "black")

# Title annotation for the plot. It is anchored by its bottom centre at
# x = 0.5, y = 1 with both references set to "paper", and drawn without an
# arrow.
a <- list(
  text = "Limit Balance Group By Education",
  font = f,
  xref = "paper", yref = "paper",
  yanchor = "bottom", xanchor = "center",
  align = "center",
  x = 0.5, y = 1,
  showarrow = FALSE
)
# Box plot of LIMIT_BAL for each EDUCATION category, built step by step:
# the base trace first, then the title annotation `a`, then the axis titles
# with the zero lines switched off.
p14 <- plot_ly(data = default, x = ~EDUCATION, y = ~LIMIT_BAL, type = "box")
p14 <- layout(p14, annotations = a)
p14 <- layout(
  p14,
  yaxis = list(zeroline = FALSE, title = "Limit Balance"),
  xaxis = list(zeroline = FALSE, title = "Education")
)
# Print the widget so it renders.
p14