# Location of the cluster v-measure table, resolved with `here()`.
VMEASURE_DATA <- here("analyses/11_cluster_control/data/ets_cluster_vmeasure.csv")

# Read the v-measure table from that CSV file.
vmeasure_data <- read_csv(file = VMEASURE_DATA)


# Summarise `vmeasure` at each value of `n_clusters` and tag the result with
# lang = "average".
# NOTE(review): `multi_boot_standard()` is defined outside this file; it is
# presumably what supplies the `mean` column renamed below, along with the
# `ci_lower`/`ci_upper` bounds -- confirm against the helper.
mean_vmeasure <- group_by(vmeasure_data, n_clusters) %>%
  multi_boot_standard(col = "vmeasure") %>%
  mutate(lang = "average") %>%
  rename(vmeasure = mean)

# Plot v-measure against the number of clusters for the English rows together
# with the "average" series held in `mean_vmeasure`, one line type per series.
vmeasure_data %>%
  filter(lang == "en") %>%
  bind_rows(mean_vmeasure) %>%
  # The English rows come straight from `vmeasure_data`; unless that table
  # carries its own interval columns they have NA bounds after `bind_rows()`.
  # ggplot2 drops NA ranges from the pointrange layer with a "missing values"
  # warning, so collapse the interval onto the point estimate to keep those
  # points drawn (as a point with a zero-length range).
  mutate(
    ci_lower = coalesce(ci_lower, vmeasure),
    ci_upper = coalesce(ci_upper, vmeasure)
  ) %>%
  ggplot(aes(x = n_clusters, y = vmeasure, linetype = lang)) +
  geom_pointrange(aes(ymin = ci_lower, ymax = ci_upper)) +
  geom_line() +
  ylab("v-measure") +
  # Fix the y axis to the [0, 1] interval.
  ylim(0, 1) +
  xlab("Number of clusters") +
  theme_classic()