Economist-Style Plot using R

R Codes for Data Cleaning and Visualization
Above Economist-Style Plot can be created by using R as follows:
#==========================================
# Collect data from WHO and pre-process
#==========================================
# devtools::install_github("expersso/WHO")
library(WHO)
library(tidyverse)
# Government and total expenditure data:
expenditure_gov <- get_data("WHS7_108")
expenditure_total <- get_data("WHS7_105")
expenditure_gov %>%
filter(year == 2014, !is.na(country)) %>%
select(gov_exp = value, country) -> df_gov
expenditure_total %>%
filter(year == 2014, !is.na(country)) %>%
select(total_exp = value, country) -> df_total
nations <- intersect(df_gov$country, df_total$country)
full_join(df_total %>% filter(country %in% nations),
df_gov %>% filter(country %in% nations), by = "country") %>%
select(country, everything()) %>%
mutate(private_exp = total_exp - gov_exp) %>%
mutate(gov_rate = gov_exp / total_exp) %>%
arrange(gov_rate) %>%
mutate(rank = 1:nrow(.)) -> dfPlot
# Rename:
dfPlot %>%
mutate(country = case_when(country == "Brunei Darussalam" ~ "Brunei",
country == "Republic of Korea" ~ "South Korea",
country == "United Kingdom of Great Britain and Northern Ireland" ~ "United Kingdom",
country == "United States of America" ~ "United States",
country == "Russian Federation" ~ "Russia",
country == "Viet Nam" ~ "Vietnam",
TRUE ~ country)) -> dfPlot
# Some countries selected:
northernCon <- c("Denmark", "Finland", "Norway", "Sweden")
specialCon <- c("Qatar", "Brunei", "Cuba")
aseanCon <- c("Singapore", "Thailand", "Malaysia", "Vietnam")
others <- c("India", "China", "United States", "United Kingdom", "France",
"Germany", "Canada", "Japan", "South Korea")
dfPlot %>%
filter(country %in% c(northernCon, specialCon, aseanCon, others)) %>%
arrange(gov_rate) -> df
my_levels <- df %>% pull(country)
df %>%
mutate(country = factor(country, levels = my_levels)) %>%
select(country, private_exp, gov_exp) %>%
gather(type, value, -country) -> df1
# Colors and font selected: http://pattern-library.economist.com/color.html
# https://yutannihilation.github.io/allYourFigureAreBelongToUs/ggthemes/economist_pal/
my_colors <- c("#014d64", "#01a2d9")
my_font <- "Ubuntu Condensed"
colorLevels <- c("private_exp", "gov_exp")
#==================================
# Solution 1 (but i do not like)
#==================================
df1 %>%
mutate(type = factor(type, levels = colorLevels)) -> df1
df1 %>%
ggplot(aes(x = country, y = value, fill = type)) +
geom_col(position = "fill") +
coord_flip() +
scale_fill_manual(values = my_colors) +
theme_minimal(base_family = my_font)
#================
# Solution 2
#================
library(ggrepel)
df %>%
mutate(gov_rate = 100*gov_rate, total_rate = 100) %>%
mutate(country = factor(country, levels = country)) %>%
mutate(label = round(gov_rate, 1) %>% as.character()) %>%
mutate(label = case_when(!str_detect(label, "\\.") ~ paste0(label, ".0"), TRUE ~ label)) %>%
mutate(label = paste0(label, "%")) %>%
mutate(label_money = round(total_exp, 0) %>% scales::dollar()) -> dfSolution2
# Version 1:
ggplot() +
coord_flip() +
theme_minimal(base_family = my_font, base_size = 14) +
geom_col(data = dfSolution2, aes(x = country, y = total_rate, fill = "Government"), width = 0.9) +
geom_col(data = dfSolution2, aes(x = country, y = gov_rate, fill = "Private"), width = 0.9) +
scale_y_continuous(limits = c(0, 120)) +
geom_text(data = dfSolution2, aes(x = country, y = 5, label = label), color = "white", family = my_font, size = 4.5) +
scale_fill_manual(values = my_colors) +
geom_label_repel(data = dfSolution2, aes(x = country, y = 103, label = label_money), hjust = 0,
family = my_font, size = 4.3, direction = "x", nudge_y = 1, label.r = 0, box.padding = 0) +
theme(legend.position = "top")
# Version 2:
midd <- (102 + 110) / 2
dfSolution2 %>%
mutate(color_label_y = case_when(country == "Vietnam" ~ "#e5001c", TRUE ~ "grey20")) %>%
mutate(bold_y = case_when(country == "Vietnam" ~ "bold", TRUE ~ "plain")) -> dfSolution2
ggplot() +
coord_flip() +
theme_minimal(base_family = my_font, base_size = 14) +
geom_col(data = dfSolution2, aes(x = country, y = total_rate, fill = "Private"), width = 0.9) +
geom_col(data = dfSolution2, aes(x = country, y = gov_rate, fill = "Government"), width = 0.9) +
scale_y_continuous(limits = c(0, 110), expand = c(0, 0)) +
scale_x_discrete(expand = c(0.08, 0)) +
geom_text(data = dfSolution2, aes(x = country, y = 4, label = label), color = "white", family = my_font, size = 4.5) +
scale_fill_manual(values = my_colors) +
theme(legend.direction = "horizontal") +
theme(legend.position = c(0.5, 0.98)) +
theme(legend.title = element_blank()) +
theme(axis.title = element_blank()) +
theme(axis.text.x = element_blank()) +
theme(panel.grid = element_blank()) +
geom_rect(aes(xmin = 0.5, xmax = Inf, ymin = 102, ymax = 110), fill = "#efefe3") +
geom_text(data = dfSolution2 %>% filter(country == "Cuba"), aes(x = country, y = 106, label = "Total"),
vjust = -1.9, family = my_font, fontface = "bold", size = 4.5) +
geom_text(data = dfSolution2, aes(x = country, y = midd, label = scales::comma(round(total_exp, 0))),
family = my_font, size = 4.5, color = "grey30") +
theme(plot.margin = unit(rep(0.5, 4), "cm")) +
labs(x = NULL, y = NULL,
title = "Share of Vietnam government spending on health care, 2014",
subtitle = "Heath expenditure per capita in Vietnam was reported at $390 (PPP)\nand share of government spending on health care was 54.1%.",
caption = "Source: World Health Organization (WHO)") +
theme(plot.title = element_text(size = 23, colour = "grey20"),
plot.subtitle = element_text(color = "grey30", size = 15),
plot.caption = element_text(color = "grey30", face = "italic", size = 11)) +
theme(axis.text.y = element_text(color = dfSolution2$color_label_y, size = 12, face = dfSolution2$bold_y))
library(grid)
grid.rect(x = 0.015, y = 0.94, hjust = 1, vjust = 0, gp = gpar(fill = "#e5001c", lwd = 0))
grid.rect(x = 1, y = 1 - 0.005, hjust = 1, vjust = 0, gp = gpar(fill = "#e5001c", lwd = 0))
---
title: "Share of Vietnam government spending on health care, 2014 "
author: 'Nguyen Chi Dung'
subtitle: "Daily Graph Series"
output:
  html_document: 
    code_download: true
    #   code_folding: hide
    highlight: zenburn
    # number_sections: yes
    theme: "flatly"
    toc: TRUE
    toc_float: TRUE
---

```{r setup,include=FALSE}
knitr::opts_chunk$set(echo = TRUE, warning = FALSE, message = FALSE, fig.width = 10, fig.height = 6)
```

# Economist-Style Plot using R
  
![](/home/khanhan/heathcare.png)


# R Codes for Data Cleaning and Visualization

Above Economist-Style Plot can be created by using R as follows: 

```{r, eval=FALSE}


#==========================================
#  Collect data from WHO and pre-process
#==========================================

# devtools::install_github("expersso/WHO")

library(WHO)
library(tidyverse)

# Government and total expenditure data: 

expenditure_gov <- get_data("WHS7_108")
expenditure_total <- get_data("WHS7_105")

expenditure_gov %>% 
  filter(year == 2014, !is.na(country)) %>% 
  select(gov_exp = value, country) -> df_gov

expenditure_total %>% 
  filter(year == 2014, !is.na(country)) %>% 
  select(total_exp = value, country) -> df_total

nations <- intersect(df_gov$country, df_total$country)

full_join(df_total %>% filter(country %in% nations), 
          df_gov %>% filter(country %in% nations), by = "country") %>% 
  select(country, everything()) %>% 
  mutate(private_exp = total_exp - gov_exp) %>% 
  mutate(gov_rate = gov_exp / total_exp) %>% 
  arrange(gov_rate) %>% 
  mutate(rank = 1:nrow(.)) -> dfPlot

# Rename: 
dfPlot %>% 
  mutate(country = case_when(country == "Brunei Darussalam" ~ "Brunei", 
                             country == "Republic of Korea" ~ "South Korea", 
                             country == "United Kingdom of Great Britain and Northern Ireland" ~ "United Kingdom", 
                             country == "United States of America" ~ "United States", 
                             country == "Russian Federation" ~ "Russia", 
                             country == "Viet Nam" ~ "Vietnam", 
                             TRUE ~ country)) -> dfPlot

# Some countries selected: 

northernCon <- c("Denmark", "Finland", "Norway", "Sweden")
specialCon <- c("Qatar", "Brunei", "Cuba")
aseanCon <- c("Singapore", "Thailand", "Malaysia", "Vietnam")
others <- c("India", "China", "United States", "United Kingdom", "France", 
           "Germany", "Canada", "Japan", "South Korea")

dfPlot %>% 
  filter(country %in% c(northernCon, specialCon, aseanCon, others)) %>% 
  arrange(gov_rate) -> df

my_levels <- df %>% pull(country)

df %>% 
  mutate(country = factor(country, levels = my_levels)) %>%
  select(country, private_exp, gov_exp) %>% 
  gather(type, value, -country) -> df1

# Colors and font selected: http://pattern-library.economist.com/color.html
# https://yutannihilation.github.io/allYourFigureAreBelongToUs/ggthemes/economist_pal/

my_colors <- c("#014d64", "#01a2d9")
my_font <- "Ubuntu Condensed"
colorLevels <- c("private_exp", "gov_exp")

#==================================
#  Solution 1 (but i do not like)
#==================================

df1 %>% 
  mutate(type = factor(type, levels = colorLevels)) -> df1

df1 %>% 
  ggplot(aes(x = country, y = value, fill = type)) + 
  geom_col(position = "fill") + 
  coord_flip() + 
  scale_fill_manual(values = my_colors) + 
  theme_minimal(base_family = my_font)

#================
#   Solution 2
#================

library(ggrepel)

df %>% 
  mutate(gov_rate = 100*gov_rate, total_rate = 100) %>% 
  mutate(country = factor(country, levels = country)) %>% 
  mutate(label = round(gov_rate, 1) %>% as.character()) %>% 
  mutate(label = case_when(!str_detect(label, "\\.") ~ paste0(label, ".0"), TRUE ~ label)) %>% 
  mutate(label = paste0(label, "%")) %>% 
  mutate(label_money = round(total_exp, 0) %>% scales::dollar()) -> dfSolution2

# Version 1: 

ggplot() + 
  coord_flip() + 
  theme_minimal(base_family = my_font, base_size = 14) + 
  geom_col(data = dfSolution2, aes(x = country, y = total_rate, fill = "Government"), width = 0.9) + 
  geom_col(data = dfSolution2, aes(x = country, y = gov_rate, fill = "Private"), width = 0.9) +
  scale_y_continuous(limits = c(0, 120)) + 
  geom_text(data = dfSolution2, aes(x = country, y = 5, label = label), color = "white", family = my_font, size = 4.5) + 
  scale_fill_manual(values = my_colors) + 
  geom_label_repel(data = dfSolution2, aes(x = country, y = 103, label = label_money), hjust = 0, 
                   family = my_font, size = 4.3, direction = "x", nudge_y = 1, label.r = 0, box.padding = 0) + 
  theme(legend.position = "top") 

# Version 2: 

midd <- (102 + 110) / 2

dfSolution2 %>% 
  mutate(color_label_y = case_when(country == "Vietnam" ~ "#e5001c", TRUE ~ "grey20")) %>% 
  mutate(bold_y = case_when(country == "Vietnam" ~ "bold", TRUE ~ "plain")) -> dfSolution2


ggplot() + 
  coord_flip() + 
  theme_minimal(base_family = my_font, base_size = 14) + 
  geom_col(data = dfSolution2, aes(x = country, y = total_rate, fill = "Private"), width = 0.9) + 
  geom_col(data = dfSolution2, aes(x = country, y = gov_rate, fill = "Government"), width = 0.9) +
  scale_y_continuous(limits = c(0, 110), expand = c(0, 0)) + 
  scale_x_discrete(expand = c(0.08, 0)) + 
  geom_text(data = dfSolution2, aes(x = country, y = 4, label = label), color = "white", family = my_font, size = 4.5) + 
  scale_fill_manual(values = my_colors) + 
  theme(legend.direction = "horizontal") + 
  theme(legend.position = c(0.5, 0.98)) + 
  theme(legend.title = element_blank()) + 
  theme(axis.title = element_blank()) + 
  theme(axis.text.x = element_blank()) + 
  theme(panel.grid = element_blank()) + 
  geom_rect(aes(xmin = 0.5, xmax = Inf, ymin = 102, ymax = 110), fill = "#efefe3") + 
  geom_text(data = dfSolution2 %>% filter(country == "Cuba"), aes(x = country, y = 106, label = "Total"), 
            vjust = -1.9, family = my_font, fontface = "bold", size = 4.5) + 
  geom_text(data = dfSolution2, aes(x = country, y = midd, label = scales::comma(round(total_exp, 0))), 
            family = my_font, size = 4.5, color = "grey30") + 
  theme(plot.margin = unit(rep(0.5, 4), "cm")) + 
  labs(x = NULL, y = NULL, 
       title = "Share of Vietnam government spending on health care, 2014", 
       subtitle = "Heath expenditure per capita in Vietnam was reported at $390 (PPP)\nand share of government spending on health care was 54.1%.", 
       caption = "Source: World Health Organization (WHO)") + 
  theme(plot.title = element_text(size = 23, colour = "grey20"), 
        plot.subtitle = element_text(color = "grey30", size = 15), 
        plot.caption = element_text(color = "grey30", face = "italic", size = 11)) + 
  theme(axis.text.y = element_text(color = dfSolution2$color_label_y, size = 12, face = dfSolution2$bold_y)) 

library(grid)
grid.rect(x = 0.015, y = 0.94, hjust = 1, vjust = 0, gp = gpar(fill = "#e5001c", lwd = 0))  
grid.rect(x = 1, y = 1 - 0.005, hjust = 1, vjust = 0,  gp = gpar(fill = "#e5001c", lwd = 0))   

```

