Reading data

# Source of data: https://tiemchungcovid19.gov.vn/portal
# Vaccine workbook; presumably the per-province AstraZeneca allocation
# (later code reads its `Province` and `AZ.vaccine` columns) -- TODO confirm.
vc <- read_excel("~/Dropbox/Bao chi/Coronavirus articles/Vaccination in VN/Az vaccine.xlsx")

# Per-province vaccination progress. Dose1/Dose2 are treated as percentages
# (they are divided by 100 below); NDose1/NDose2 are presumably the matching
# head counts -- TODO confirm against the workbook.
df <- read_excel("~/Dropbox/Bao chi/Coronavirus articles/Vaccination in VN/Vaccination data.xlsx")

# Population implied by each dose: count / (percentage / 100).
# A province that reports 0 % makes the denominator zero, which would yield
# NaN (0 / 0) or Inf (n / 0); record NA for those rows instead so the derived
# columns never contain non-finite "populations".
df$Pop1 <- ifelse(df$Dose1 > 0, df$NDose1 / (df$Dose1 / 100), NA_real_)
df$Pop2 <- ifelse(df$Dose2 > 0, df$NDose2 / (df$Dose2 / 100), NA_real_)

# Preview the first rows to sanity-check the import and derived columns.
head(df)
## # A tibble: 6 x 10
##   Province D1                  D2                  Dose1 Dose2 NDose1 NDose2
##   <chr>    <dttm>              <dttm>              <dbl> <dbl>  <dbl>  <dbl>
## 1 Hà Nội   1899-12-31 00:36:09 1899-12-31 00:01:36  2.51  0.11 202523   8978
## 2 Hà Giang 1899-12-31 00:44:13 1899-12-31 00:02:27  3.07  0.17  26251   1448
## 3 Cao Bằng 1899-12-31 00:27:22 1899-12-31 00:20:53  1.9   1.45  10057   7706
## 4 Bắc Kạn  1899-12-31 00:34:51 1899-12-31 00:00:00  2.42  0      7598      0
## 5 Tuyên Q… 1899-12-31 00:25:21 1899-12-31 00:01:18  1.76  0.09  13801    710
## 6 Lào Cai  1899-12-31 01:18:47 1899-12-31 00:00:00  5.47  0     39974     18
## # … with 3 more variables: Pop <dbl>, Pop1 <dbl>, Pop2 <dbl>

Visualization of data

# Horizontal bar chart of the first-dose percentage, provinces ordered by
# that percentage. Each bar carries its value as a white label; the legend
# is hidden because every bar is already named on the axis.
ggplot(
  data = df,
  aes(
    x = reorder(Province, Dose1),
    y = Dose1,
    colour = Province,
    fill = Province
  )
) +
  geom_col() +
  geom_text(aes(label = Dose1), colour = "white", hjust = 1.2) +
  coord_flip() +
  labs(y = "Phần trăm dân số đã tiêm liều 1", x = "") +
  theme(legend.position = "none")

# Same chart for the second-dose percentage.
ggplot(
  data = df,
  aes(
    x = reorder(Province, Dose2),
    y = Dose2,
    colour = Province,
    fill = Province
  )
) +
  geom_col() +
  geom_text(aes(label = Dose2), colour = "white", hjust = 1.2) +
  coord_flip() +
  labs(y = "Phần trăm dân số đã tiêm liều 2", x = "") +
  theme(legend.position = "none")

# First-dose percentage against population, with a quadratic least-squares
# trend across all provinces.
# Province is mapped only on the point and text layers: if it sits in the
# global aes(), geom_smooth() splits the data into one group per province,
# each with a single observation, and no trend line can be fitted.
ggplot(data = df, aes(x = Pop, y = Dose1)) +
  geom_point(aes(colour = Province)) +
  geom_smooth(method = "lm", formula = y ~ x + I(x^2)) +
  geom_text(aes(label = Province, colour = Province)) +
  theme(legend.position = "none") +
  labs(x = "Dân số (1000)", y = "Phần trăm liều 1")

# Same relationship on a log-population axis.
ggplot(data = df, aes(x = log(Pop), y = Dose1)) +
  geom_point(aes(colour = Province)) +
  geom_smooth(method = "lm", formula = y ~ x + I(x^2)) +
  geom_text(aes(label = Province, colour = Province)) +
  theme(legend.position = "none") +
  labs(x = "Dân số (log)", y = "Phần trăm liều 1")

# Distribution of vaccine: horizontal bars of AZ.vaccine per province,
# ordered by that value, each labelled in white with its own value.
ggplot(
  data = vc,
  aes(
    x = reorder(Province, AZ.vaccine),
    y = AZ.vaccine,
    colour = Province,
    fill = Province
  )
) +
  geom_col() +
  geom_text(aes(label = AZ.vaccine), colour = "white", hjust = 1.2) +
  coord_flip() +
  labs(y = "AZ vaccine", x = "") +
  theme(legend.position = "none")

# Combine vaccination progress with the vaccine table, matching rows on
# Province (merge() keeps only provinces present in both tables).
ddf <- merge(df, vc, by = "Province")

# First-dose percentage against log(AZ.vaccine), with a quadratic
# least-squares trend across all provinces.
# Province is mapped only on the point and text layers so geom_smooth() fits
# one curve to the whole data set rather than one single-point group per
# province (which draws nothing). The x-axis label now names the plotted
# variable; it previously repeated the population label from an earlier plot.
ggplot(data = ddf, aes(x = log(AZ.vaccine), y = Dose1)) +
  geom_point(aes(colour = Province)) +
  geom_smooth(method = "lm", formula = y ~ x + I(x^2)) +
  geom_text(aes(label = Province, colour = Province)) +
  theme(legend.position = "none") +
  labs(x = "AZ vaccine (log)", y = "Phần trăm liều 1")