Setup

knitr::opts_knit$set(root.dir = here::here())
library(tidyverse)
library(here)
library(jsonlite)
library(assertthat)
library(irr)
pak::pkg_install("hsci-r/gghsci")
library(gghsci)
library(ggbeeswarm)
library(gt)
renv::snapshot()
sorensen <- function(x,y){
    assert_that(is.character(x))
    assert_that(is.character(y))
    index <- 
        2*(length(intersect(x,y)))/(2*(length(intersect(x,y)))+
                                        length(setdiff(x,y))+
                                        length(setdiff(y,x)))
    return(index)
}
sorensen_dist <- function(x,y) {
  return(1-sorensen(x,y))
}

Data loading

AP loading

clarity_bound <- 0.75
quick_bound_centile <- 3
slow_bound_centile <- 7
short_bound_centile <- 3
long_bound_centile <- 7

raw_data <- list.files(here("data/final_annotations"),full.names=T) %>%
  setNames(.,str_replace(basename(.),"annotointi_(.*)\\.csv$","\\1")) %>% 
  map_dfr(~read_csv(.,show_col_types=F),.id="name") %>%
  replace_na(list(theme="not alcohol policy")) %>%
  mutate(document_id=as.numeric(factor(text))) %>%
  group_by(name) %>%
  mutate(lead_time_centile=ntile(lead_time,10),lead_time_quartile=ntile(lead_time,4)) %>%
  ungroup() %>%
  mutate(speed_type=case_when(
    lead_time_centile>=slow_bound_centile ~ "slow",
    lead_time_centile<=quick_bound_centile ~ "quick",
    T ~ "in-between"
  )) %>% 
  mutate(whole_article=is.na(answer)) %>%
  mutate(part_length=map_if(answer,~!is.na(.),~fromJSON(.),.else=~list())) %>%
  mutate(part_length=map(part_length,~.$end-.$start)) %>% 
  mutate(part_length=map_dbl(part_length,~reduce(.,~.x+.y,.init=0))) %>%
  group_by(text)%>%
  mutate(annotations=n()) %>%
  ungroup() %>%
  extract(text,into=c("url"),regex = "^([^ ]*)") %>%
  rename(annotation_document_id=document_id)

md <- bind_rows(
  read_csv(here("data/df_joined_individual.csv")),
  read_csv(here("data/df_joined_interannotator.csv"))
  ) %>%
  mutate(content_length_centile=ntile(nr_characters,10),content_length_quartile=ntile(nr_characters,4)) %>%
  mutate(length_type=case_when(
    content_length_centile<=short_bound_centile ~ "short",
    content_length_centile>=long_bound_centile ~ "long",
    T ~ "in-between"
  ))
New names:
• `` -> `...1`
Rows: 1500 Columns: 25
── Column specification ──────────────────────────────────────────────────────────────────────────
Delimiter: ","
chr  (15): text, url, section, document_id, title, author, subsection, media, subject, genre, ...
dbl   (8): ...1, score, sentences, nr_characters, nr_tokens, paragraphs, document_parts, urgency
dttm  (2): time_created, time_modified

ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
New names:
• `` -> `...1`
Rows: 100 Columns: 25
── Column specification ──────────────────────────────────────────────────────────────────────────
Delimiter: ","
chr  (15): text, url, section, document_id, title, author, subsection, media, subject, genre, ...
dbl   (8): ...1, score, sentences, nr_characters, nr_tokens, paragraphs, document_parts, urgency
dttm  (2): time_created, time_modified

ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
raw_data <- raw_data %>% 
  inner_join(md)
Joining, by = "url"
assert_that(nrow(md)==1600)
[1] TRUE
assert_that(nrow(raw_data)==5500)
[1] TRUE
dl <- bind_rows(
  raw_data %>% filter(str_sub(theme,1,1)!='{') %>% mutate(multiple=F),
  raw_data %>% filter(str_sub(theme,1,1)=='{') %>%
    mutate(theme=map(theme,~fromJSON(.) %>% as.data.frame())) %>% 
    unnest(theme) %>% 
    rename(theme=choices)
  )
New names:
• `...1` -> `...18`
New names:
• `...1` -> `...18`
d <- dl %>% 
  group_by(across(-theme)) %>% 
  arrange(theme) %>%
  summarize(theme=str_c(theme,collapse="|"),.groups="drop") %>% 
  group_by(text,theme) %>% 
  mutate(theme_annotations=n()) %>% 
  group_by(text,speed_type) %>% 
  mutate(speed_type_annotations=n()) %>% 
  group_by(text,whole_article) %>%
  mutate(whole_article_annotations=n()) %>%
  group_by(text) %>% 
  arrange(desc(theme_annotations),theme) %>% 
  mutate(theme_annotation_proportion=theme_annotations/n()) %>% 
  mutate(majority_theme=str_flatten(na.omit(unique(if_else(theme_annotations==max(theme_annotations),theme,NA_character_))),collapse="|"),majority_theme_annotations=first(theme_annotations),majority_theme_proportion=first(theme_annotations)/n()) %>%
  arrange(desc(speed_type_annotations),speed_type) %>% 
  mutate(speed_type_annotation_proportion=speed_type_annotations/n()) %>% 
  mutate(majority_speed_type=str_flatten(na.omit(unique(if_else(speed_type_annotations==max(speed_type_annotations),speed_type,NA_character_))),collapse="|"),majority_speed_type_annotations=first(speed_type_annotations),majority_speed_type_proportion=first(speed_type_annotations)/n()) %>%
  arrange(desc(whole_article_annotations),whole_article) %>% 
  mutate(whole_article_annotation_proportion=whole_article_annotations/n()) %>% 
  mutate(majority_whole_article=str_flatten(na.omit(unique(if_else(whole_article_annotations==max(whole_article_annotations),whole_article,NA))),collapse="|"),majority_whole_article_annotations=first(whole_article_annotations),majority_whole_article_proportion=first(whole_article_annotations)/n()) %>%
  ungroup() %>%
  mutate(
    decision_type=if_else(theme==majority_theme,"assent","dissent"),
    clarity=if_else(majority_theme_proportion>=clarity_bound,"clear","unclear")
  )

assert_that(nrow(d)==5500)
[1] TRUE
bd <- d %>% 
  mutate(theme=if_else(theme=="not alcohol policy",theme,"alcohol policy"))
bd <- bd %>% 
  group_by(text,theme) %>% 
  mutate(n=n()) %>% 
  group_by(text) %>% 
  arrange(desc(n),theme) %>% 
  mutate(prop=n/n()) %>% 
  mutate(majority_theme=str_flatten(na.omit(unique(if_else(n==max(n),theme,NA_character_))),collapse="|"),majority_theme_n=first(n),majority_theme_proportion=first(n)/n()) %>%
  ungroup() %>%
  mutate(
    decision_type=if_else(theme==majority_theme,"assent","dissent"),
    clarity=if_else(majority_theme_proportion>=clarity_bound,"clear","unclear")
  )

bmd <- md %>%
  inner_join(bd %>% distinct(url,annotations,majority_theme,majority_theme_annotations,majority_theme_proportion,clarity,majority_speed_type,majority_speed_type_annotations,majority_speed_type_proportion,majority_whole_article))
Joining, by = "url"
assert_that(nrow(bmd)==1600)
[1] TRUE
md <- md %>% 
  inner_join(d %>% distinct(url,annotations,majority_theme,majority_theme_annotations,majority_theme_proportion,clarity,majority_speed_type,majority_speed_type_annotations,majority_speed_type_proportion,majority_whole_article))
Joining, by = "url"
assert_that(nrow(md)==1600)
[1] TRUE

MV loading

mvd <- list.files(here("data/mv_annotations/"),full.names=T) %>%
  setNames(.,str_replace(basename(.),"annotator_(.*)\\.csv$","\\1")) %>% 
  map_dfr(~read_csv(.,show_col_types=F),.id="name") %>%
  replace_na(list(sentiment="empty")) %>%
  filter(sentiment!="empty") %>%
  mutate(document_id=as.numeric(factor(text))) %>%
  group_by(name) %>%
  mutate(lead_time_centile=ntile(lead_time,10),lead_time_quartile=ntile(lead_time,4)) %>%
  ungroup() %>%
  mutate(speed_type=case_when(
    lead_time_centile>=slow_bound_centile ~ "slow",
    lead_time_centile<=quick_bound_centile ~ "quick",
    T ~ "in-between"
  )) %>% 
  group_by(text,sentiment) %>% 
  mutate(sentiment_annotations=n()) %>% 
  group_by(text,speed_type) %>% 
  mutate(speed_type_annotations=n()) %>% 
  group_by(text) %>% 
  arrange(desc(sentiment_annotations)) %>% 
  mutate(sentiment_annotation_proportion=sentiment_annotations/n()) %>% 
  mutate(majority_sentiment=first(sentiment),majority_sentiment_annotations=first(sentiment_annotations),majority_sentiment_proportion=first(sentiment_annotations)/n()) %>%
  arrange(desc(speed_type_annotations),speed_type) %>% 
  mutate(speed_type_annotation_proportion=speed_type_annotations/n()) %>% 
  mutate(majority_speed_type=str_flatten(na.omit(unique(if_else(speed_type_annotations==max(speed_type_annotations),speed_type,NA_character_))),collapse="|"),majority_speed_type_annotations=first(speed_type_annotations),majority_speed_type_proportion=first(speed_type_annotations)/n()) %>%
  ungroup() %>%
  mutate(
    decision_type=if_else(sentiment==majority_sentiment,"assent","dissent"),
    clarity=if_else(majority_sentiment_proportion>=clarity_bound,"clear","unclear")
  )

mvmd <- read_csv(here("data/MV_data_final_links.csv"),col_select=c("content","link")) %>% 
  mutate(content_length=str_length(content)) %>%
  mutate(content_length_centile=ntile(content_length,10),content_length_quartile=ntile(content_length,4))  %>%
  mutate(length_type=case_when(
    content_length_centile<=short_bound_centile ~ "short",
    content_length_centile>=long_bound_centile ~ "long",
    T ~ "in-between"
  )) %>% rename(text=link)
New names:
• `` -> `...1`
Rows: 997 Columns: 2
── Column specification ──────────────────────────────────────────────────────────────────────────
Delimiter: ","
chr (2): content, link

ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
mvd <- mvd %>% inner_join(mvmd)
Joining, by = "text"
mvmd <- mvmd %>% inner_join(mvd %>% distinct(text,majority_sentiment,majority_sentiment_annotations,majority_sentiment_proportion,clarity,majority_speed_type,majority_speed_type_annotations,majority_speed_type_proportion))
Joining, by = "text"
assert_that(nrow(mvmd)==98)
[1] TRUE

Binary alcohol policy analyses

Majority theme proportions

N Proportion
not alcohol policy 936 58.50%
alcohol policy 660 41.25%
alcohol policy|not alcohol policy 4 0.25%

60/40 split between not AP and AP is a pretty even base.

Decision clarity by majority theme

N Proportion
alcohol policy
clear 445 67.42%
unclear 215 32.58%
not alcohol policy
clear 757 80.88%
unclear 179 19.12%

There are proportionally more clear decisions for not alcohol policy than there are for alcohol policy -> it is easier to say that something is not AP than to say that something is AP.

Theme, clarity and speed type cross investigation

There is a subset of articles where it is quick to decide that they are not AP.

Theme, clarity and whole/part investigation

When an article deals only partially with alcohol, it is more likely to not be an alcohol policy article. It is harder to clearly decide whether an article not dealing completely with alcohol is AP or not as compared to an article wholly dealing with alcohol.

Theme, clarity, speed type and length cross investigation

Unsurprisingly, longer articles take longer to decide upon. Short non-AP articles are particularly easy to categorize clearly, but there is also the potential for error here, as evidenced by the high number of “unclear” quick selections in the short articles.

Alcohol policy annotator analyses

Time to decide by annotator

Very clearly different task time profiles between annotators.

Agreement matrix between annotators

p <- scales::percent_format(accuracy=1)
bd %>% 
  full_join(bd,by=c("text")) %>%
  mutate(agree=theme.x==theme.y) %>%
  group_by(name.x,name.y) %>%
  summarize(agree=sum(agree),pagree=sum(agree)/n(),.groups="drop") %>%
  ggplot(aes(x=name.x,y=name.y,fill=pagree)) +
  geom_raster() +
  theme_hsci() +
  scale_fill_viridis_c(labels=scales::percent_format(accuracy=1)) +
  geom_text(aes(label=p(pagree))) +
  labs(fill="Agreement") +
  xlab("Annotator 1") +
  ylab("Annotator 2")

Kaisa stands out as an annotator with lower agreement to the majority of other annotators, except interestingly Sonja and Susanna.

Proportion of annotators indicating the majority viewpoint

Time taken to annotate by annotator and clarity

Almost all annotators are likely to spend more time on “problematic” articles, here proxied by their clarity(=the amount of general agreement wrt them). -> the annotators are doing a good job, and most errors should not be caused by carelessness but by actual decision differences and ambiguities in guidelines.

Annotation time difference based on agreement between annotator pairs

At the same time, there is also clearly an effect visible where difference in annotation time explains agreement, so there is also an attentiveness component to the disagreements.

Heuristics for testing whether outlier annotator should be removed

kripp.alpha(bd %>% 
              pivot_wider(id_cols=name,names_from=document_id,values_from=theme) %>%
              select(-name) %>% 
              as.matrix,
            method="nominal")
Warning in kripp.alpha(bd %>% pivot_wider(id_cols = name, names_from = document_id,  :
  NAs introduced by coercion
 Krippendorff's alpha

 Subjects = 1600 
   Raters = 10 
    alpha = 0.657 
kripp.alpha(bd %>% 
              filter(name!="Kaisa") %>%
              pivot_wider(id_cols=name,names_from=document_id,values_from=theme) %>%
              select(-name) %>% 
              as.matrix,
            method="nominal")
Warning in kripp.alpha(bd %>% filter(name != "Kaisa") %>% pivot_wider(id_cols = name,  :
  NAs introduced by coercion
 Krippendorff's alpha

 Subjects = 1600 
   Raters = 9 
    alpha = 0.688 

MV analyses

Majority sentiment proportions

N Proportion
Sisällön kopiointi valtamediasta 69 70.41%
Oman narratiivin rakentaminen lähdeviitteiden avulla 24 24.49%
Journalistisen median kritiikki 5 5.10%

70% of this data is copying from mainstream media. 24 articles is probably enough to analyse the developing of one’s own narrative, but there are really too few “criticism of mainstream media” articles to draw conclusions from.

Decision clarity by majority sentiment

N Proportion
Journalistisen median kritiikki
clear 4 80.00%
unclear 1 20.00%
Oman narratiivin rakentaminen lähdeviitteiden avulla
clear 16 66.67%
unclear 8 33.33%
Sisällön kopiointi valtamediasta
clear 66 95.65%
unclear 3 4.35%

Identifying the copying of material from mainstream media seems quite clear, as opposed to whether something is building their own narrative.

The confusion matrix between annotation pairs tells a bit more:

Here, it seems that it is hard to draw boundaries between the development of one’s own narrative and both journalistic critique as well as copying.

Sentiment, clarity and speed type cross investigation

Again, too few critique articles to draw conclusions from. Otherwise, seems that the only clear category identified quickly is a subset of articles copying content from mainstream media. Even for clear cases of building one’s own narrative, decisions take long to reach.

Theme, clarity, speed type and length cross investigation

Here even more categories lack data to base decisions on. What we can see is that copying can be relatively quickly identified in all length categories, and that own narrative articles are often long and slow to parse.

MV annotator analyses

Again, we have two different annotator profiles evident.

Agreement matrix between annotators

No clear outlier annotators appear in this task:

Proportion of annotators indicating the majority viewpoint

Time taken to annotate by annotator and whether all annotators agree

Here again, annotators are likely to spend more time on “problematic” articles, here proxied by their clarity(=the amount of general agreement wrt them). An interesting exception is the own narrative category, where unclear decisions may have been due to making them in haste.

Annotation time difference based on agreement between annotator pairs

Again, there is also clearly an effect visible where difference in annotation time explains agreement.

Categorical data is here a bit sparse to draw conclusions, but may further point to attentiveness differences in explaining disagreement on the boundaries of the own narrative category. Similarly, because the critique category requires picking up on individual sentence ques, time taken may explain some of the difference for that category.

---
title: "R Notebook"
output: 
  html_notebook:
    code_folding: hide
    toc: true
---

# Setup

```{r setup}
knitr::opts_knit$set(root.dir = here::here())
```

```{r,results='hide'}
library(tidyverse)
library(here)
library(jsonlite)
library(assertthat)
library(irr)
pak::pkg_install("hsci-r/gghsci")
library(gghsci)
library(ggbeeswarm)
library(gt)
renv::snapshot()
```

```{r}
sorensen <- function(x,y){
    assert_that(is.character(x))
    assert_that(is.character(y))
    index <- 
        2*(length(intersect(x,y)))/(2*(length(intersect(x,y)))+
                                        length(setdiff(x,y))+
                                        length(setdiff(y,x)))
    return(index)
}
sorensen_dist <- function(x,y) {
  return(1-sorensen(x,y))
}
```

# Data loading

## AP loading

```{r}
clarity_bound <- 0.75
quick_bound_centile <- 3
slow_bound_centile <- 7
short_bound_centile <- 3
long_bound_centile <- 7

raw_data <- list.files(here("data/final_annotations"),full.names=T) %>%
  setNames(.,str_replace(basename(.),"annotointi_(.*)\\.csv$","\\1")) %>% 
  map_dfr(~read_csv(.,show_col_types=F),.id="name") %>%
  replace_na(list(theme="not alcohol policy")) %>%
  mutate(document_id=as.numeric(factor(text))) %>%
  group_by(name) %>%
  mutate(lead_time_centile=ntile(lead_time,10),lead_time_quartile=ntile(lead_time,4)) %>%
  ungroup() %>%
  mutate(speed_type=case_when(
    lead_time_centile>=slow_bound_centile ~ "slow",
    lead_time_centile<=quick_bound_centile ~ "quick",
    T ~ "in-between"
  )) %>% 
  mutate(whole_article=is.na(answer)) %>%
  mutate(part_length=map_if(answer,~!is.na(.),~fromJSON(.),.else=~list())) %>%
  mutate(part_length=map(part_length,~.$end-.$start)) %>% 
  mutate(part_length=map_dbl(part_length,~reduce(.,~.x+.y,.init=0))) %>%
  group_by(text)%>%
  mutate(annotations=n()) %>%
  ungroup() %>%
  extract(text,into=c("url"),regex = "^([^ ]*)") %>%
  rename(annotation_document_id=document_id)

md <- bind_rows(
  read_csv(here("data/df_joined_individual.csv")),
  read_csv(here("data/df_joined_interannotator.csv"))
  ) %>%
  mutate(content_length_centile=ntile(nr_characters,10),content_length_quartile=ntile(nr_characters,4)) %>%
  mutate(length_type=case_when(
    content_length_centile<=short_bound_centile ~ "short",
    content_length_centile>=long_bound_centile ~ "long",
    T ~ "in-between"
  ))

raw_data <- raw_data %>% 
  inner_join(md)

assert_that(nrow(md)==1600)
assert_that(nrow(raw_data)==5500)

dl <- bind_rows(
  raw_data %>% filter(str_sub(theme,1,1)!='{') %>% mutate(multiple=F),
  raw_data %>% filter(str_sub(theme,1,1)=='{') %>%
    mutate(theme=map(theme,~fromJSON(.) %>% as.data.frame())) %>% 
    unnest(theme) %>% 
    rename(theme=choices)
  )

d <- dl %>% 
  group_by(across(-theme)) %>% 
  arrange(theme) %>%
  summarize(theme=str_c(theme,collapse="|"),.groups="drop") %>% 
  group_by(text,theme) %>% 
  mutate(theme_annotations=n()) %>% 
  group_by(text,speed_type) %>% 
  mutate(speed_type_annotations=n()) %>% 
  group_by(text,whole_article) %>%
  mutate(whole_article_annotations=n()) %>%
  group_by(text) %>% 
  arrange(desc(theme_annotations),theme) %>% 
  mutate(theme_annotation_proportion=theme_annotations/n()) %>% 
  mutate(majority_theme=str_flatten(na.omit(unique(if_else(theme_annotations==max(theme_annotations),theme,NA_character_))),collapse="|"),majority_theme_annotations=first(theme_annotations),majority_theme_proportion=first(theme_annotations)/n()) %>%
  arrange(desc(speed_type_annotations),speed_type) %>% 
  mutate(speed_type_annotation_proportion=speed_type_annotations/n()) %>% 
  mutate(majority_speed_type=str_flatten(na.omit(unique(if_else(speed_type_annotations==max(speed_type_annotations),speed_type,NA_character_))),collapse="|"),majority_speed_type_annotations=first(speed_type_annotations),majority_speed_type_proportion=first(speed_type_annotations)/n()) %>%
  arrange(desc(whole_article_annotations),whole_article) %>% 
  mutate(whole_article_annotation_proportion=whole_article_annotations/n()) %>% 
  mutate(majority_whole_article=str_flatten(na.omit(unique(if_else(whole_article_annotations==max(whole_article_annotations),whole_article,NA))),collapse="|"),majority_whole_article_annotations=first(whole_article_annotations),majority_whole_article_proportion=first(whole_article_annotations)/n()) %>%
  ungroup() %>%
  mutate(
    decision_type=if_else(theme==majority_theme,"assent","dissent"),
    clarity=if_else(majority_theme_proportion>=clarity_bound,"clear","unclear")
  )

assert_that(nrow(d)==5500)

bd <- d %>% 
  mutate(theme=if_else(theme=="not alcohol policy",theme,"alcohol policy"))
bd <- bd %>% 
  group_by(text,theme) %>% 
  mutate(n=n()) %>% 
  group_by(text) %>% 
  arrange(desc(n),theme) %>% 
  mutate(prop=n/n()) %>% 
  mutate(majority_theme=str_flatten(na.omit(unique(if_else(n==max(n),theme,NA_character_))),collapse="|"),majority_theme_n=first(n),majority_theme_proportion=first(n)/n()) %>%
  ungroup() %>%
  mutate(
    decision_type=if_else(theme==majority_theme,"assent","dissent"),
    clarity=if_else(majority_theme_proportion>=clarity_bound,"clear","unclear")
  )

bmd <- md %>%
  inner_join(bd %>% distinct(url,annotations,majority_theme,majority_theme_annotations,majority_theme_proportion,clarity,majority_speed_type,majority_speed_type_annotations,majority_speed_type_proportion,majority_whole_article))

assert_that(nrow(bmd)==1600)

md <- md %>% 
  inner_join(d %>% distinct(url,annotations,majority_theme,majority_theme_annotations,majority_theme_proportion,clarity,majority_speed_type,majority_speed_type_annotations,majority_speed_type_proportion,majority_whole_article))

assert_that(nrow(md)==1600)

```

## MV loading

```{r}
mvd <- list.files(here("data/mv_annotations/"),full.names=T) %>%
  setNames(.,str_replace(basename(.),"annotator_(.*)\\.csv$","\\1")) %>% 
  map_dfr(~read_csv(.,show_col_types=F),.id="name") %>%
  replace_na(list(sentiment="empty")) %>%
  filter(sentiment!="empty") %>%
  mutate(document_id=as.numeric(factor(text))) %>%
  group_by(name) %>%
  mutate(lead_time_centile=ntile(lead_time,10),lead_time_quartile=ntile(lead_time,4)) %>%
  ungroup() %>%
  mutate(speed_type=case_when(
    lead_time_centile>=slow_bound_centile ~ "slow",
    lead_time_centile<=quick_bound_centile ~ "quick",
    T ~ "in-between"
  )) %>% 
  group_by(text,sentiment) %>% 
  mutate(sentiment_annotations=n()) %>% 
  group_by(text,speed_type) %>% 
  mutate(speed_type_annotations=n()) %>% 
  group_by(text) %>% 
  arrange(desc(sentiment_annotations)) %>% 
  mutate(sentiment_annotation_proportion=sentiment_annotations/n()) %>% 
  mutate(majority_sentiment=first(sentiment),majority_sentiment_annotations=first(sentiment_annotations),majority_sentiment_proportion=first(sentiment_annotations)/n()) %>%
  arrange(desc(speed_type_annotations),speed_type) %>% 
  mutate(speed_type_annotation_proportion=speed_type_annotations/n()) %>% 
  mutate(majority_speed_type=str_flatten(na.omit(unique(if_else(speed_type_annotations==max(speed_type_annotations),speed_type,NA_character_))),collapse="|"),majority_speed_type_annotations=first(speed_type_annotations),majority_speed_type_proportion=first(speed_type_annotations)/n()) %>%
  ungroup() %>%
  mutate(
    decision_type=if_else(sentiment==majority_sentiment,"assent","dissent"),
    clarity=if_else(majority_sentiment_proportion>=clarity_bound,"clear","unclear")
  )

mvmd <- read_csv(here("data/MV_data_final_links.csv"),col_select=c("content","link")) %>% 
  mutate(content_length=str_length(content)) %>%
  mutate(content_length_centile=ntile(content_length,10),content_length_quartile=ntile(content_length,4))  %>%
  mutate(length_type=case_when(
    content_length_centile<=short_bound_centile ~ "short",
    content_length_centile>=long_bound_centile ~ "long",
    T ~ "in-between"
  )) %>% rename(text=link)

mvd <- mvd %>% inner_join(mvmd)

mvmd <- mvmd %>% inner_join(mvd %>% distinct(text,majority_sentiment,majority_sentiment_annotations,majority_sentiment_proportion,clarity,majority_speed_type,majority_speed_type_annotations,majority_speed_type_proportion))

assert_that(nrow(mvmd)==98)
```

# Binary alcohol policy analyses

## Majority theme proportions

```{r}
bmd %>% 
  count(majority_theme) %>%
  mutate(majority_theme_proportion=n/sum(n)) %>%
  arrange(desc(n)) %>%
  gt(rowname_col="majority_theme") %>%
  cols_label(n="N",majority_theme_proportion="Proportion") %>%
  fmt_percent(columns = c(majority_theme_proportion))
```

60/40 split between not AP and AP is a pretty even base.

## Decision clarity by majority theme

```{r}
bmd %>% 
  count(majority_theme,clarity) %>%
  filter(majority_theme!="alcohol policy|not alcohol policy") %>%
  group_by(majority_theme) %>%
  mutate(majority_theme_proportion=n/sum(n)) %>%
  ungroup() %>%
  arrange(majority_theme,clarity) %>%
  gt(groupname_col="majority_theme",rowname_col="clarity") %>%
  cols_label(n="N",majority_theme_proportion="Proportion") %>%
  fmt_percent(columns = c(majority_theme_proportion))  
```

There are proportionally more clear decisions for not alcohol policy than there are for alcohol policy -> it is easier to say that something is not AP than to say that something is AP.

## Theme, clarity and speed type cross investigation

```{r}
bmd %>% 
  mutate(majority_speed_type=fct_lump_n(majority_speed_type,4)) %>%
  count(majority_theme,clarity,majority_speed_type) %>%
  group_by(majority_theme,clarity) %>%
  mutate(majority_speed_type_proportion=n/sum(n)) %>%
  ungroup() %>%
  filter(majority_theme!="alcohol policy|not alcohol policy") %>%
  ggplot(aes(x=clarity,fill=majority_speed_type,y=majority_speed_type_proportion)) +
  geom_col() +
  theme_hsci_discrete() + 
  facet_wrap(~majority_theme)
```

There is a subset of articles where it is quick to decide that they are not AP.

## Theme, clarity and whole/part investigation

```{r}
bmd %>% 
  count(majority_theme,clarity,majority_whole_article) %>%
  filter(majority_whole_article!="FALSE|TRUE") %>%
  group_by(majority_theme,clarity) %>%
  mutate(majority_whole_article_proportion=n/sum(n)) %>%
  ungroup() %>%
  filter(majority_theme!="alcohol policy|not alcohol policy") %>%
  ggplot(aes(x=clarity,fill=majority_whole_article,y=majority_whole_article_proportion)) +
  geom_col() +
  theme_hsci_discrete() + 
  facet_wrap(~majority_theme)
```

When an article deals only partially with alcohol, it is more likely to not be an alcohol policy article. It is harder to clearly decide whether an article not dealing completely with alcohol is AP or not as compared to an article wholly dealing with alcohol.

## Theme, clarity, speed type and length cross investigation

```{r}
bmd %>% 
  mutate(majority_speed_type=fct_lump_n(majority_speed_type,4)) %>%
  count(majority_theme,clarity,majority_speed_type,content_length_quartile) %>%
  group_by(majority_theme,clarity,content_length_quartile) %>%
  mutate(majority_speed_type_proportion=n/sum(n)) %>%
  ungroup() %>%
  filter(majority_theme!="alcohol policy|not alcohol policy") %>%
  ggplot(aes(x=clarity,fill=majority_speed_type,y=majority_speed_type_proportion)) +
  geom_col() +
  theme_hsci_discrete() + 
  facet_grid(majority_theme~content_length_quartile)
```

Unsurprisingly, longer articles take longer to decide upon. Short non-AP articles are particularly easy to categorize clearly, but there is also the potential for error here, as evidenced by the high number of "unclear" quick selections in the short articles.

# Alcohol policy annotator analyses

## Time to decide by annotator

```{r}
dl %>% ggplot(aes(x=name,y=lead_time/60,color=theme)) + 
  geom_quasirandom(size=0.5,show.legend=F) +
  coord_cartesian(ylim=c(0,5)) +
  theme_hsci_discrete() +
  scale_y_continuous(breaks=seq(0,5,by=1)) +
  xlab("Annotator") +
  ylab("Time to decide (minutes)")
```

Very clearly different task time profiles between annotators.

## Agreement matrix between annotators

```{r}
p <- scales::percent_format(accuracy=1)
bd %>% 
  full_join(bd,by=c("text")) %>%
  mutate(agree=theme.x==theme.y) %>%
  group_by(name.x,name.y) %>%
  summarize(agree=sum(agree),pagree=sum(agree)/n(),.groups="drop") %>%
  ggplot(aes(x=name.x,y=name.y,fill=pagree)) +
  geom_raster() +
  theme_hsci() +
  scale_fill_viridis_c(labels=scales::percent_format(accuracy=1)) +
  geom_text(aes(label=p(pagree))) +
  labs(fill="Agreement") +
  xlab("Annotator 1") +
  ylab("Annotator 2")
```

Kaisa stands out as an annotator with lower agreement to the majority of other annotators, except interestingly Sonja and Susanna.

## Proportion of annotators indicating the majority viewpoint

```{r}
bmd %>% 
  ggplot(aes(x=majority_theme_proportion)) +
  geom_bar() + 
  theme_hsci_discrete() +
  scale_x_continuous(labels=scales::percent_format(accuracy=1)) +
  xlab("Proportion of annotators indicating the majority viewpoint") +
  ylab("Number of articles") +
  facet_wrap(~annotations,scales="free")
```

## Time taken to annotate by annotator and clarity

```{r,fig.width=10}
bd %>%
  ggplot(aes(x=name,y=lead_time/60,color=clarity)) + 
  geom_boxplot(size=0.5) +
  coord_cartesian(ylim=c(0,5)) +
  theme_hsci_discrete() +
  scale_y_continuous(breaks=seq(0,5,by=1)) +
  xlab("Annotator") +
  labs(color="Clarity") +
  ylab("Time to decide (minutes)") + 
  facet_grid(annotations~theme,scales="free") +
  theme(legend.position="bottom")
  
```

Almost all annotators are likely to spend more time on "problematic" articles, here proxied by their clarity(=the amount of general agreement wrt them). -> the annotators are doing a good job, and most errors should not be caused by carelessness but by actual decision differences and ambiguities in guidelines.

## Annotation time difference based on agreement between annotator pairs

```{r}
bd %>% 
  full_join(bd,by=c("text")) %>%
  mutate(agree=theme.x==theme.y,tdiff=abs(lead_time_centile.x-lead_time_centile.y)) %>%
  ggplot(aes(x=agree,y=tdiff)) +
  geom_boxplot() +
  coord_cartesian(ylim=c(0,5)) +
  theme_hsci_discrete() +
  xlab("Agreement between annotators") +
  ylab("Difference in annotation time centile")
```

At the same time, there is also clearly an effect visible where difference in annotation time explains agreement, so there is also an attentiveness component to the disagreements.

## Heuristics for testing whether outlier annotator should be removed

```{r}
kripp.alpha(bd %>% 
              pivot_wider(id_cols=name,names_from=document_id,values_from=theme) %>%
              select(-name) %>% 
              as.matrix,
            method="nominal")
kripp.alpha(bd %>% 
              filter(name!="Kaisa") %>%
              pivot_wider(id_cols=name,names_from=document_id,values_from=theme) %>%
              select(-name) %>% 
              as.matrix,
            method="nominal")
```

# MV analyses

## Majority sentiment proportions

```{r}
mvmd %>% 
  count(majority_sentiment) %>%
  mutate(majority_sentiment_proportion=n/sum(n)) %>%
  arrange(desc(n)) %>%
  gt(rowname_col="majority_sentiment") %>%
  cols_label(n="N",majority_sentiment_proportion="Proportion") %>%
  fmt_percent(columns = c(majority_sentiment_proportion))
```

70% of this data is copying from mainstream media. 24 articles is probably enough to analyse the developing of one's own narrative, but there are really too few "criticism of mainstream media" articles to draw conclusions from.

## Decision clarity by majority sentiment

```{r}
mvmd %>% 
  count(majority_sentiment,clarity) %>%
  group_by(majority_sentiment) %>%
  mutate(majority_sentiment_proportion=n/sum(n)) %>%
  ungroup() %>%
  arrange(majority_sentiment,clarity) %>%
  gt(groupname_col="majority_sentiment",rowname_col="clarity") %>%
  cols_label(n="N",majority_sentiment_proportion="Proportion") %>%
  fmt_percent(columns = c(majority_sentiment_proportion))    
```

Identifying the copying of material from mainstream media seems quite clear, as opposed to whether something is building their own narrative.

The confusion matrix between annotation pairs tells a bit more:
```{r}
mvd %>% 
  full_join(mvd,by=c("text")) %>%
  filter(name.x!=name.y) %>%
  count(sentiment.x,sentiment.y) %>%
  mutate(sentiment.x=str_trunc(sentiment.x,10)) %>%
  ggplot(aes(x=sentiment.x,y=sentiment.y,fill=n)) +
  geom_raster() +
  theme_hsci_continuous() +
  geom_label(aes(label=n),fill="white") +
  labs(fill="Annotation pairs") +
  xlab("Annotation 2") +
  ylab("Annotation 1") + 
  theme(axis.text.x = element_text(angle = 90, vjust = 0.5, hjust=1))
```

Here, it seems that it is hard to draw boundaries between the development of one's own narrative and both journalistic critique as well as copying. 

## Sentiment, clarity and speed type cross investigation

```{r}
mvmd %>% 
  mutate(majority_speed_type=fct_lump_n(majority_speed_type,4)) %>%
  count(majority_sentiment,clarity,majority_speed_type) %>%
  group_by(majority_sentiment,clarity) %>%
  mutate(majority_speed_type_proportion=n/sum(n)) %>%
  ungroup() %>%
  ggplot(aes(x=clarity,fill=majority_speed_type,y=majority_speed_type_proportion)) +
  geom_col() +
  geom_label(aes(label=n),position=position_stack(vjust=0.5)) +
  theme_hsci_discrete() + 
  facet_wrap(~majority_sentiment)
```

Again, too few critique articles to draw conclusions from. Otherwise, seems that the only clear category identified quickly is a subset of articles copying content from mainstream media. Even for clear cases of building one's own narrative, decisions take long to reach.

## Theme, clarity, speed type and length cross investigation

```{r}
mvmd %>% 
  mutate(majority_speed_type=fct_lump_n(majority_speed_type,4)) %>%
  count(majority_sentiment,clarity,majority_speed_type,content_length_quartile) %>%
  group_by(majority_sentiment,clarity,content_length_quartile) %>%
  mutate(majority_speed_type_proportion=n/sum(n)) %>%
  ungroup() %>%
  ggplot(aes(x=clarity,fill=majority_speed_type,y=majority_speed_type_proportion)) +
  geom_col() +
  geom_label(aes(label=n),position=position_stack(vjust=0.5)) +
  theme_hsci_discrete() + 
  facet_grid(majority_sentiment~content_length_quartile)
```

Here even more categories lack data to base decisions on. What we can see is that copying can be relatively quickly identified in all length categories, and that own narrative articles are often long and slow to parse.

# MV annotator analyses

```{r}
mvd %>% ggplot(aes(x=name,y=lead_time/60,color=sentiment)) + 
  geom_quasirandom(size=0.5,show.legend=F) +
  coord_cartesian(ylim=c(0,5)) +
  theme_hsci_discrete() +
  scale_y_continuous(breaks=seq(0,5,by=1)) +
  xlab("Annotator") +
  ylab("Time to decide (minutes)")
```

Again, we have two different annotator profiles evident.

## Agreement matrix between annotators

No clear outlier annotators appear in this task:

```{r}
p <- scales::percent_format(accuracy=1)
mvd %>% 
  full_join(mvd,by=c("text")) %>%
  mutate(agree=sentiment.x==sentiment.y) %>%
  group_by(name.x,name.y) %>%
  summarize(agree=sum(agree),pagree=sum(agree)/n(),.groups="drop") %>%
  ggplot(aes(x=name.x,y=name.y,fill=pagree)) +
  geom_raster() +
  theme_hsci() +
  scale_fill_viridis_c(labels=scales::percent_format(accuracy=1)) +
  geom_text(aes(label=p(pagree))) +
  labs(fill="Agreement") +
  xlab("Annotator 1") +
  ylab("Annotator 2")
```

## Proportion of annotators indicating the majority viewpoint

```{r}
mvmd %>% 
  ggplot(aes(x=majority_sentiment_proportion)) +
  geom_bar() + 
  theme_hsci_discrete() +
  scale_x_continuous(labels=scales::percent_format(accuracy=1)) +
  xlab("Proportion of annotators indicating the majority viewpoint") +
  ylab("Number of articles") 
```

## Time taken to annotate by annotator and whether all annotators agree

```{r,fig.width=10}
mvd %>%
  ggplot(aes(x=name,y=lead_time/60,color=clarity)) + 
  geom_boxplot(size=0.5) +
  coord_cartesian(ylim=c(0,5)) +
  theme_hsci_discrete() +
  scale_y_continuous(breaks=seq(0,5,by=1)) +
  xlab("Annotator") +
  labs(color="Clarity") +
  ylab("Time to decide (minutes)") + 
  facet_wrap(~sentiment,scales="free") +
  theme(legend.position="bottom")
  
```
Here again, annotators are likely to spend more time on "problematic" articles, here proxied by their clarity(=the amount of general agreement wrt them). An interesting exception is the own narrative category, where unclear decisions may have been due to making them in haste.

## Annotation time difference based on agreement between annotator pairs

```{r}
mvd %>% 
  full_join(mvd,by=c("text")) %>%
  mutate(agree=sentiment.x==sentiment.y,tdiff=abs(lead_time_centile.x-lead_time_centile.y)) %>%
  ggplot(aes(x=agree,y=tdiff)) +
  geom_boxplot() +
  coord_cartesian(ylim=c(0,5)) +
  theme_hsci_discrete() +
  xlab("Agreement between annotators") +
  ylab("Difference in annotation speed centiles")
```

Again, there is also clearly an effect visible where difference in annotation time explains agreement.

```{r}
mvd %>% 
  full_join(mvd,by=c("text","majority_sentiment")) %>%
  mutate(agree=sentiment.x==sentiment.y,tdiff=abs(lead_time_centile.x-lead_time_centile.y)) %>%
  ggplot(aes(x=agree,y=tdiff,color=majority_sentiment)) +
  geom_boxplot() +
  coord_cartesian(ylim=c(0,5)) +
  theme_hsci_discrete() +
  xlab("Agreement between annotators") +
  ylab("Difference in annotation speed centiles")
```

Categorical data is here a bit sparse to draw conclusions, but may further point to attentiveness differences in explaining disagreement on the boundaries of the own narrative category. Similarly, because the critique category requires picking up on individual sentence ques, time taken may explain some of the difference for that category.