How Does Household Composition Affect Basket Size and Frequency of Purchases?

## How Does Household Composition Affect Basket Size and Frequency of Purchases?

# Attach demographic attributes to every transaction. The inner join keeps
# only households that appear in both tables.
joined_data <- inner_join(transactions, demographics, by = "household_id")

# Total sales value per household; missing sales values are skipped in the sum.
summary_stats <- summarize(
  group_by(joined_data, household_id),
  total_sales = sum(sales_value, na.rm = TRUE)
)

# Number of distinct baskets recorded for each household.
frequency_of_purchases <- summarize(
  group_by(joined_data, household_id),
  purchase_frequency = n_distinct(basket_id)
)

# One row per household: total sales, purchase frequency, and age.
# NOTE(review): despite its name, this table holds per-household totals and
# basket counts, not a per-basket size measure.
basket_size <- summary_stats %>%
  left_join(frequency_of_purchases, by = "household_id") %>%
  left_join(select(demographics, household_id, age), by = "household_id")

# Per-household total sales against purchase frequency, one panel per age
# group. Both axes are numeric, so points are drawn instead of boxplots: with
# a numeric x and a single group per panel, a boxplot collapses every
# household into one box and hides the relationship named in the title.
# shape = 21 is a fillable circle, so the fill aesthetic and the manual fill
# palette still control the point colours.
ggplot(basket_size, aes(x = purchase_frequency, y = total_sales, fill = age)) +
  geom_point(shape = 21, alpha = .5) +
  scale_fill_manual(values = my_colors1) +
  facet_grid(~ age) +
  labs(
    title = "Total Sales vs. Frequency of Purchases",
    x = "Frequency of Purchases",
    y = "Total Sales"
  ) +
  theme_linedraw()