library("tidyverse")
library("here")
library("beeswarm")
library("ggplot2")
# Read micro_aus.csv from the project's data/ folder (path resolved by here())
# into a data frame, then print a compact column-by-column overview of it.
micro_aus <- here("data", "micro_aus.csv") %>%
  read.csv()
glimpse(micro_aus)
## Rows: 1,000
## Columns: 83
## $ economy <chr> "Australia", "Australia", "Australia", "Australia"…
## $ economycode <chr> "AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "…
## $ wpid_random <int> 160288803, 151789780, 148625405, 192142847, 169882…
## $ wgt <dbl> 1.2575536, 1.2669981, 0.1833565, 0.8274972, 1.0198…
## $ female <int> 2, 2, 1, 2, 2, 1, 2, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2,…
## $ age <int> 61, 22, 66, 84, 30, 67, 20, 69, 40, 47, 81, 91, 36…
## $ educ <int> 2, 3, 3, 1, 3, 2, 5, 2, 3, 3, 3, 2, 3, 3, 2, 3, 2,…
## $ inc_q <int> 5, 1, 4, 5, 4, 3, 4, 4, 1, 2, 4, 1, 1, 3, 1, 4, 1,…
## $ emp_in <int> 1, 2, 2, 2, 1, 2, 2, 2, 1, 2, 2, 2, 1, 1, 2, 2, 2,…
## $ urbanicity_f2f <lgl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ account <int> 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,…
## $ account_fin <int> 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,…
## $ fin2 <int> 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,…
## $ fin4 <int> 1, 1, 1, NA, 1, 1, 4, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1…
## $ fin5 <int> 1, 1, 1, 2, 1, 1, 1, 1, 1, 2, 1, 2, 1, 1, 2, 1, 2,…
## $ fin6 <int> 1, 1, 1, 2, 1, 1, 1, 1, 1, 2, 1, 2, 1, 1, 2, 1, 1,…
## $ fin7 <int> 1, 2, 1, 1, 1, 1, 2, 1, 1, 1, 2, 2, 2, 1, 2, 1, 1,…
## $ fin8 <int> 1, NA, 1, 1, 1, 1, NA, 1, 2, 1, NA, NA, NA, 1, NA,…
## $ fin8b <int> 2, NA, 1, 1, 1, 1, NA, 1, 1, 1, NA, NA, NA, 1, NA,…
## $ fin9 <int> 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1,…
## $ fin9a <int> 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 2, 1, NA, 1, 1…
## $ fin10 <int> 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1,…
## $ fin10a <int> 1, 1, 1, 1, 1, 1, 4, 1, 1, 1, 1, 1, 1, 1, NA, 1, 1…
## $ fin10b <int> 1, 1, 1, 1, 1, 1, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2,…
## $ fin11_1 <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin11a <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin11b <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin11c <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin11d <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin11e <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin11f <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin11g <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin11h <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin13a <lgl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin13b <lgl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin13c <lgl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin13d <lgl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin14_1 <int> 2, 1, 1, 2, 2, 2, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2,…
## $ fin14a <int> 1, 1, 1, 2, 1, 1, 2, 1, 1, 2, 2, 2, 1, 1, 2, 1, 2,…
## $ fin14a1 <int> 1, 1, 1, 2, 1, 2, 1, 1, 1, 2, 2, 2, 1, 2, 2, 1, 2,…
## $ fin14b <int> 1, 1, 2, 2, 1, 1, 2, 1, 1, 2, 2, 2, 1, 1, 2, 1, 2,…
## $ fin16 <int> 2, 2, 1, 2, 1, 2, 2, 1, 2, 1, 1, 2, 1, 2, 1, 2, 2,…
## $ fin17a <int> 1, 1, 1, 2, 1, 2, 2, 1, 1, 1, 1, 2, 1, 2, 2, 2, 2,…
## $ fin17a1 <lgl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin20 <int> 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1, 2, 2, 2, 2, 2,…
## $ fin22a <int> 2, 2, 2, 2, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,…
## $ fin22b <int> 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,…
## $ fin24 <int> 6, 1, 1, 1, 1, 1, 1, 1, 3, 1, 1, 1, 1, 4, 1, 1, 1,…
## $ fin24a <int> 2, 3, 3, 3, 3, 2, 3, 3, 2, 2, 3, 3, 1, 3, 2, 2, 3,…
## $ fin24b <int> 1, 3, 3, 3, 3, 2, 2, 3, 2, 1, 3, 3, 1, 3, 2, 2, 3,…
## $ fin30 <int> 1, 1, 1, 2, 1, 1, 2, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1,…
## $ fin31a <int> 1, 1, 1, NA, 1, 1, NA, 1, 1, NA, 1, 1, 1, 1, 1, 1,…
## $ fin31b <int> 2, 1, 2, NA, 2, 2, NA, 2, 2, NA, 2, 2, 1, 2, 2, 2,…
## $ fin31c <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin32 <int> 1, 1, 1, 2, 1, 2, 1, 2, 1, 2, 2, 2, 2, 1, 2, 2, 2,…
## $ fin33 <int> 2, 2, 1, NA, 2, NA, 2, NA, 1, NA, NA, NA, NA, 2, N…
## $ fin34a <int> 1, 1, 1, NA, 1, NA, 1, NA, 1, NA, NA, NA, NA, 1, N…
## $ fin34b <lgl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin34d <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin34e <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin37 <int> 2, 1, 1, 2, 2, 2, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2,…
## $ fin38 <int> 2, 2, 1, 1, 2, 2, 2, 1, 2, 2, 1, 1, 2, 2, 1, 2, 1,…
## $ fin39a <int> NA, 1, 1, 2, NA, NA, 1, 1, 1, NA, 1, 1, NA, NA, 1,…
## $ fin39b <lgl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ fin39d <int> NA, NA, NA, 2, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
## $ fin39e <int> NA, NA, NA, 2, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
## $ fin44a <int> 2, 3, 3, 3, 3, 2, 3, 3, 2, 2, 3, 3, 3, 3, 1, 2, 3,…
## $ fin44b <int> 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 3, 3, 1, 3, 1, 2, 3,…
## $ fin44c <int> 2, 3, 3, 3, 3, 3, 3, 3, 2, 2, 3, 3, 3, 3, 2, 3, 3,…
## $ fin44d <int> 3, 3, 3, 4, 2, 3, 3, 3, 2, 3, 4, 3, 3, 3, 4, 3, 3,…
## $ fin45 <int> 1, NA, NA, NA, NA, NA, NA, NA, 3, 1, NA, NA, NA, N…
## $ saved <int> 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0,…
## $ borrowed <int> 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1,…
## $ receive_wages <int> 1, 1, 1, 4, 1, 4, 1, 4, 1, 4, 4, 4, 4, 1, 4, 4, 4,…
## $ receive_transfers <int> 4, 1, 1, 4, 4, 4, 1, 1, 1, 4, 4, 4, 4, 4, 4, 4, 4,…
## $ receive_pension <int> 4, 4, 1, 3, 4, 4, 4, 1, 4, 4, 1, 1, 4, 4, 1, 4, 1,…
## $ receive_agriculture <lgl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ pay_utilities <int> 1, 1, 1, 4, 1, 1, 4, 1, 1, 4, 1, 1, 1, 1, 1, 1, 1,…
## $ remittances <lgl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
## $ mobileowner <int> 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1,…
## $ internetaccess <int> 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1,…
## $ anydigpayment <int> 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,…
## $ merchantpay_dig <lgl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
# Recode the numeric gender indicator into a labelled factor:
# code 1 becomes "Female", code 2 becomes "Male"; any other value becomes NA.
micro_aus[["female"]] <- factor(
  micro_aus[["female"]],
  levels = c(1, 2),
  labels = c("Female", "Male")
)
# Box plot of the income quintile (inc_q, shown as "income") for each gender.
# Only the two plotted columns are kept, and rows with a missing value in
# either of them are dropped before plotting.
micro_aus %>%
  select(female, income = inc_q) %>%
  na.omit() %>%
  ggplot(mapping = aes(x = female, y = income)) +
  geom_boxplot() +
  labs(
    title = "Income Distribution by Gender",
    x = "Gender",
    y = "Income"
  )
# Filtered by > 3. We don't have data for fin4a (used a debit card in-store),
# so we are using fin4 (used a debit card) instead.
# Convert the account and payment indicator columns to factors in place.
micro_aus <- micro_aus %>%
  mutate(across(c(account_fin, fin4, fin14a), as.factor))
# Tidy the data: build a long-format table with one row per respondent and
# payment question (fin4 = debit card, fin14a = online payment).
#
# The recode happens BEFORE the NA filter on purpose. factor(levels = ...)
# turns every code outside the listed levels into NA (fin4, for example,
# contains 4s as well as 1/2 -- presumably "don't know"/"refused"; confirm
# against the codebook). Filtering after the recode removes those rows, so
# they do not show up as a spurious "NA" category in later plots.
#
# Assumes `female` has already been recoded to "Female"/"Male".
micro_aus_clean <- micro_aus %>%
  mutate(
    female = factor(female, levels = c("Female", "Male")),
    inc_q = factor(inc_q, levels = 1:5, labels = paste0("Q", 1:5)),
    fin4 = factor(
      fin4,
      levels = c(1, 2),
      labels = c("Debit: Yes", "Debit: No")
    ),
    fin14a = factor(
      fin14a,
      levels = c(1, 2),
      labels = c("Online: Yes", "Online: No")
    )
  ) %>%
  filter(!is.na(female), !is.na(inc_q), !is.na(fin4), !is.na(fin14a)) %>%
  pivot_longer(
    cols = c(fin4, fin14a),
    names_to = "payment_type",
    values_to = "payment_status"
  )
# Dodged bar chart of payment responses: one bar per income quintile within
# each payment method/response, with a separate panel for each gender.
ggplot(
  data = micro_aus_clean,
  mapping = aes(x = payment_status, fill = inc_q)
) +
  geom_bar(position = "dodge") +
  facet_wrap(vars(female)) +
  labs(
    title = "Payment Behavior by Gender and Income Quintile",
    x = "Payment Method & Response",
    y = "Count",
    fill = "Income Quintile"
  ) +
  theme_minimal() +
  # Tilt the x-axis labels so the long response labels do not overlap.
  theme(axis.text.x = element_text(angle = 45, hjust = 1))
## CDA: observations from the graph
# - Overall, debit card usage is always higher than online payment usage.
# - Men tend to pay more by both debit card and online as they become
#   wealthier.
# - Women in the Q2 income quintile spend more than women in any other
#   income quintile; as women's income grows, the gap between debit card
#   and online payment use seems to become smaller, compared with the
#   larger preference for using a credit card among women in the Q1 income
#   class.
# - Women spent more money than men in every income quintile except Q5
#   (this may be related to domestic care --> spending money for the
#   family, pregnancy, etc.).
# Keep only gender, income quintile and the fin14_1 / fin14a responses.
# select() needs a data frame as its first argument; the original call had
# none and failed with "object 'female' not found".
# NOTE(review): micro_aus is assumed to be the intended source, since it is
# the frame that still carries a fin14a column -- confirm.
micro_aus %>%
  select(female, fin14_1, inc_q, fin14a)