# Load the v-measure table ----
# Location of the v-measure CSV, resolved through here().
VMEASURE_DATA <- here(
  "analyses/11_cluster_control/data/ets_cluster_vmeasure.csv"
)

# Raw table as read from disk; later steps use its `n_clusters`, `lang`
# and `vmeasure` columns.
vmeasure_data <- read_csv(file = VMEASURE_DATA)
# Summarise v-measure per number of clusters ----
# The summary is tagged with lang = "average" so it can be stacked with
# per-language rows, and the `mean` column produced by
# multi_boot_standard() is renamed to `vmeasure` to match the raw data.
# NOTE(review): multi_boot_standard() is defined outside this file; it
# presumably also yields the ci_lower / ci_upper columns -- confirm.
mean_vmeasure <- vmeasure_data %>%
  group_by(n_clusters) %>%
  multi_boot_standard(col = "vmeasure") %>%
  mutate(lang = "average") %>%
  rename(vmeasure = mean)
# Plot v-measure against number of clusters ----
# Stacks the "en" rows of the raw data on top of the "average" summary and
# draws one line per `lang`, distinguished by linetype.
# NOTE(review): the pointrange layer needs ci_lower / ci_upper; if the raw
# CSV does not carry those columns the "en" rows will have NA ranges after
# bind_rows() -- confirm this is intended.
vmeasure_data %>%
  filter(lang == "en") %>%
  bind_rows(mean_vmeasure) %>%
  ggplot(aes(x = n_clusters, y = vmeasure, linetype = lang)) +
  geom_pointrange(aes(ymin = ci_lower, ymax = ci_upper)) +
  geom_line() +
  labs(x = "Number of clusters", y = "v-measure") +
  ylim(0, 1) + # fixed y-axis limits of 0 to 1
  theme_classic()
