Calculating totals for each sample
total_sample1_size <- sum(data_frame_sample1_group$size)
total_sample2_size <- sum(data_frame_sample2_group$size)
total_sample3_size <- sum(data_frame_sample3_group$size)
total_sample4_size <- sum(data_frame_sample4_group$size)
total_sample5_size <- sum(data_frame_sample5_group$size)
Probability of having primary as education level for each
sample
primary_education_sample1 <- 3397/total_sample1_size
primary_education_sample2 <- 3317/total_sample2_size
primary_education_sample3 <- 3512/total_sample3_size
primary_education_sample4 <- 3364/total_sample4_size
primary_education_sample5 <- 3404/total_sample5_size
Probability of having secondary as education level for each
sample
secondary_education_sample1 <- 11647/total_sample1_size
secondary_education_sample2 <- 11606/total_sample2_size
secondary_education_sample3 <- 11515/total_sample3_size
secondary_education_sample4 <- 11664/total_sample4_size
secondary_education_sample5 <- 11648/total_sample5_size
Probability of having tertiary as education level for each
sample
tertiary_education_sample1 <- 6644/total_sample1_size
tertiary_education_sample2 <- 6770/total_sample2_size
tertiary_education_sample3 <- 6633/total_sample3_size
tertiary_education_sample4 <- 6637/total_sample4_size
tertiary_education_sample5 <- 6663/total_sample5_size
Probability of having tertiary as education level and having balance
above the average
sample_names <- c("sample1", "sample2","sample3","sample4","sample5")
secondary_education <- c(secondary_education_sample1,secondary_education_sample2,secondary_education_sample3,secondary_education_sample4,secondary_education_sample5)
primary_education <- c(primary_education_sample1,primary_education_sample2,primary_education_sample3,primary_education_sample4,primary_education_sample5)
tertiary_education <- c(tertiary_education_sample1,tertiary_education_sample2,tertiary_education_sample3,tertiary_education_sample4,tertiary_education_sample5)
sample_education_level_probability <- data.frame(sample_names,primary_education,secondary_education,tertiary_education)
sample_education_level_probability
## sample_names primary_education secondary_education tertiary_education
## 1 sample1 0.1565799 0.5368518 0.3062457
## 2 sample2 0.1530405 0.5354803 0.3123558
## 3 sample3 0.1621871 0.5317724 0.3063175
## 4 sample4 0.1550802 0.5377098 0.3059653
## 5 sample5 0.1571851 0.5378648 0.3076745
Plotting the probability and samples
primary_education
p <- sample_education_level_probability |>
ggplot(aes(x = sample_names, y=(primary_education)) )+
geom_bar(position = "dodge", stat = "identity",fill="yellow") +
theme_minimal()
p

# Pie Chart with Percentages
slices <- c(primary_education_sample1,primary_education_sample2, primary_education_sample3, primary_education_sample4, primary_education_sample5)
lbls <- c("primary_education_sample1","primary_education_sample2", "primary_education_sample3", "primary_education_sample4", "primary_education_sample5", "tertiary_above_average")
pct <- round(slices/sum(slices)*100)
lbls <- paste(lbls, pct)
# add percents to labels
lbls <- paste(lbls,"%",sep="") # ad % to labels
pie(slices,labels = lbls, main="Pie Chart - primary_education",col=topo.colors(5))

secondary_education
p <- sample_education_level_probability |>
ggplot(aes(x = sample_names, y=(secondary_education)) )+
geom_bar(position = "dodge", stat = "identity",fill="lightgreen") +
theme_minimal()
p

# Pie Chart with Percentages
slices <- c(secondary_education_sample1,secondary_education_sample2, secondary_education_sample3, secondary_education_sample4, secondary_education_sample5)
lbls <- c("secondary_education_sample1","secondary_education_sample2", "secondary_education_sample3", "secondary_education_sample4", "secondary_education_sample5", "secondary_above_average")
pct <- round(slices/sum(slices)*100)
lbls <- paste(lbls, pct)
# add percents to labels
lbls <- paste(lbls,"%",sep="") # ad % to labels
pie(slices,labels = lbls, main="Pie Chart - secondary_education" )

tertiary_education
p <- sample_education_level_probability |>
ggplot(aes(x = sample_names, y=(tertiary_education)) )+
geom_bar(position = "dodge", stat = "identity",fill="red") +
theme_minimal()
p

library(RColorBrewer)
myPalette <- brewer.pal(5, "Set3")
# Pie Chart with Percentages
slices <- c(tertiary_education_sample1,tertiary_education_sample2, tertiary_education_sample3, tertiary_education_sample4, tertiary_education_sample5)
lbls <- c("tertiary_education_sample1","tertiary_education_sample2", "tertiary_education_sample3", "tertiary_education_sample4", "tertiary_education_sample5", "secondary_above_average")
pct <- round(slices/sum(slices)*100)
lbls <- paste(lbls, pct)
# add percents to labels
lbls <- paste(lbls,"%",sep="") # ad % to labels
pie(slices,labels = lbls, main="Pie Chart - tertiary_education", col=myPalette )
