Document set-up

1.) Import data and format data

library(tidyverse)
library(lubridate)
library(DT)
library(stringr)

'%!in%' <- function(x,y)!('%in%'(x,y))

# Set working directory to file location
setwd("~/Documents/GitHub/2020-10-campaign-contributions/workspace")

#import candidates from primary and general
candidates <- read_csv('data/candidates.csv')
#candidates not on ballot
not_on_ballot <- read_csv('committees_not_on_ballot.csv')
# import 2020 contributions from individuals to state races.
contributions.raw <- read_csv('data/all_contributions_2020.csv')
  
# convert names to snake_case
colnames(contributions.raw) <- gsub(' ', '_', tolower(colnames(contributions.raw)))

contributions.noParty <- contributions.raw %>% 
    mutate(contribution_date = as.Date(contribution_date, format='%m/%d/%Y') )  %>% 
    # removes records where office is NA, leaving only contributions to committees supporting candidates
    # removes candidate laons
    filter(
      !is.na(office),
      contribution_type != 'Candidate Loan'
    )


# join party data from candidate list
contributions <- left_join(
  contributions.noParty %>% 
    filter(
      receiving_committee %!in% not_on_ballot$committee
    ) %>% 
    mutate(
      committeeJoin = gsub(' ','', receiving_committee)
    ),
  candidates %>% 
    select(committee, party, ballotName, inGeneral) %>% 
    mutate(
      committeeJoin = gsub(' ','', committee)
    ),
  by = 'committeeJoin'
) %>% 
  filter(!is.na(party)) %>%
  select(-filing_period) %>% 
  distinct()
# original      17,704
# not on ballot 17,311
# no party join 17,117
# distinct      15,873











contributions.individuals <- contributions %>% 
  filter(
      contributor_type %in% c('Individual', "Total of Contributions not exceeding $100"),
      contribution_type %in% c("Check", "Electronic Fund Transfer", "Credit Card", "Cash", "Total of Contributions not exceeding $100")
    )

Data overview

key value
contributions all non-candidate-loan contributions to any candidate committee (where
is.na(Office)
& contribution_type != 'Candidate Loan' )
contributions.individuals direct monetary contributions from individuals to any candidate committee (where
contribution_type %in% c("Check", "Electronic Fund Transfer", "Credit Card", "Cash", "Total of Contributions not exceeding $100")
& is.na(Office)
& contributor_type == 'Individual'
)
candidates all candidates in the Delaware primary and general elections
contributions.raw all contributions to any committee

Questions

Total

How much money has been contributed total?

What groups or individuals are the top donors to each party?

`summarise()` regrouping output by 'contributor_name' (override with `.groups` argument)

What groups or people donated to candidates from both parties?

`summarise()` ungrouping output (override with `.groups` argument)

Contributions where contributor_name contains “Police”

Individuals

How much money has been contributed by individuals total?

How much money has been contributed by individuals to each party

contributions.individuals %>% 
  group_by(party) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  datatable(options = list(pageLength = 10))
`summarise()` ungrouping output (override with `.groups` argument)

Who the top donors among individuals?

contributions.individuals %>% 
  group_by(contributor_name) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
`summarise()` ungrouping output (override with `.groups` argument)

Who the top donors by party among individuals?

contributions.individuals %>% 
  group_by(contributor_name, party) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
`summarise()` regrouping output by 'contributor_name' (override with `.groups` argument)

How much money has been contributed to each office (primary and general) by individuals?

contributions.individuals %>% 
  group_by(office, party) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
`summarise()` regrouping output by 'office' (override with `.groups` argument)

How much money has been contributed to each candidate by individuals?

contributions.individuals %>% 
  group_by(ballotName, party) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
`summarise()` regrouping output by 'ballotName' (override with `.groups` argument)

How much money has been contributed to each general election candidate by individuals?

contributions.individuals %>%
  filter(inGeneral == 1) %>% 
  group_by(ballotName) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
`summarise()` ungrouping output (override with `.groups` argument)

How many people donated to multiple candidates?


contributions.individuals %>% 
  select(
    contributor_name, committee
  ) %>% 
  distinct() %>% 
  group_by(contributor_name) %>%
  summarise(numCandidates = n()) %>% 
  ungroup() %>% 
  group_by(numCandidates) %>% 
  summarise(group_count = n()) %>% 
  datatable(options = list(pageLength = 10))
`summarise()` ungrouping output (override with `.groups` argument)
`summarise()` ungrouping output (override with `.groups` argument)

How many people donated to candidates from both parties?

contributions.individuals %>% 
  select(
    contributor_name, party 
  ) %>% 
  distinct() %>% 
  group_by(contributor_name) %>%
  summarise(numParties = n()) %>% 
  ungroup() %>% 
  group_by(numParties) %>% 
  summarise(group_count = n()) %>% 
  datatable(options = list(pageLength = 10))
`summarise()` ungrouping output (override with `.groups` argument)
`summarise()` ungrouping output (override with `.groups` argument)

How much money John Carney and Julianne Murray received in donations from individuals

`summarise()` ungrouping output (override with `.groups` argument)

How much money John Carney and Julianne Murray received in donations from PACS, business groups, labor uniions, and non-profit organizations

`summarise()` ungrouping output (override with `.groups` argument)

John Carney and Julianne Murray donations from PACS, business groups, labor uniions, and non-profit organizations broken down

`summarise()` regrouping output by 'receiving_committee' (override with `.groups` argument)

How much money John Carney and Julianne Murray received in donations from individuals, PACS, business groups, labor uniions, and non-profit organizations (This is everything except Candidate Committee, Self (Candidate), Political Committee, , and Dem or Rep National Sub-Committees)

`summarise()` ungrouping output (override with `.groups` argument)

How much did legislative candidates receive?

contributions %>% 
  filter(
    str_detect(office, 'State'),
    contribution_type %in% c("Check", "Electronic Fund Transfer", "Credit Card", "Cash", "Total of Contributions not exceeding $100")
  ) %>% 
  select(
    contributor_name,
    contributor_type,
    contribution_type,
    contribution_amount,
    ballotName
  ) %>% 
  mutate(
    contributor_type_group = case_when(
      contributor_type %in% c("Individual","Total of Contributions not exceeding $100") ~ 'individual',
      contributor_type == 'Candidate Committee' ~ 'Candidate Committee',
      contributor_type %in% outside_groups ~ 'outside group',
      contributor_type == 'Self (Candidate)' ~ 'self',
      TRUE ~ 'other'
    )
  ) %>% 
  group_by(
    ballotName,
    contributor_type_group
  ) %>% 
  summarise(
    total = round(sum(contribution_amount), 0)
  ) %>%
  pivot_wider(
    id_cols = ballotName,
    names_from = contributor_type_group,
    values_from = total
  ) %>%
  mutate(
    total = round(sum(c(individual, `Candidate Committee`, `outside group`, other, self), na.rm=T), 0)
  ) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
`summarise()` regrouping output by 'ballotName' (override with `.groups` argument)
---
title: "R Notebook"
output: html_notebook
---

### Document set-up

#### 1.) Import data and format data
```{r echo = T, results = 'hide'}
library(tidyverse)
library(lubridate)
library(DT)
library(stringr)

'%!in%' <- function(x,y)!('%in%'(x,y))

# Set working directory to file location
setwd("~/Documents/GitHub/2020-10-campaign-contributions/workspace")

#import candidates from primary and general
candidates <- read_csv('data/candidates.csv')

#candidates not on ballot
not_on_ballot <- read_csv('committees_not_on_ballot.csv')


# import 2020 contributions from individuals to state races.
contributions.raw <- read_csv('data/all_contributions_2020.csv')
  
# convert names to snake_case
colnames(contributions.raw) <- gsub(' ', '_', tolower(colnames(contributions.raw)))

contributions.noParty <- contributions.raw %>% 
    mutate(contribution_date = as.Date(contribution_date, format='%m/%d/%Y') )  %>% 
    # removes records where office is NA, leaving only contributions to committees supporting candidates
    # removes candidate laons
    filter(
      !is.na(office),
      contribution_type != 'Candidate Loan'
    )


# join party data from candidate list
contributions <- left_join(
  contributions.noParty %>% 
    filter(
      receiving_committee %!in% not_on_ballot$committee
    ) %>% 
    mutate(
      committeeJoin = gsub(' ','', receiving_committee)
    ),
  candidates %>% 
    select(committee, party, ballotName, inGeneral) %>% 
    mutate(
      committeeJoin = gsub(' ','', committee)
    ),
  by = 'committeeJoin'
) %>% 
  filter(!is.na(party)) %>%
  select(-filing_period) %>% 
  distinct()
# original      17,704
# not on ballot 17,311
# no party join 17,117
# distinct      15,873











contributions.individuals <- contributions %>% 
  filter(
      contributor_type %in% c('Individual', "Total of Contributions not exceeding $100"),
      contribution_type %in% c("Check", "Electronic Fund Transfer", "Credit Card", "Cash", "Total of Contributions not exceeding $100")
    )

```


***


### Data overview


| key           | value  |
|---------------|--------|
| **contributions**      | all non-candidate-loan contributions to any candidate committee (where <br/>`is.na(Office)`<br/>`& contribution_type != 'Candidate Loan'` ) |
| **contributions.individuals**      | direct monetary contributions from individuals to any candidate committee (where <br/>`contribution_type %in% c("Check", "Electronic Fund Transfer", "Credit Card", "Cash", "Total of Contributions not exceeding $100")`<br>`& is.na(Office)`<br>`& contributor_type == 'Individual'`<br> ) |
| candidates | all candidates in the Delaware primary and general elections |
| contributions.raw      | all contributions to any committee |


 


```{r echo=FALSE, include=FALSE, results = 'hide'}
contributions.individuals %>%
  group_by(
    contribution_date
  ) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  ggplot(
    aes(x = contribution_date, y=total)
  ) +
  geom_col() +
  labs(title='Daily contributions, all candidates')

```


```{r echo=FALSE, include=FALSE, results = 'hide'}

contributions.individuals %>% 
  group_by(
    party,
    contribution_date
  ) %>%
  summarise(total = sum(contribution_amount)) %>%
  mutate(cum_total = cumsum(total)) %>% 
  ggplot(
    aes(x = contribution_date, y=cum_total, color=party)
  ) +
  geom_line() +
  labs(title='Cumulative contributions, by party')

```



***

## Questions

### *Total*

### How much money has been contributed total?
```{r echo=FALSE}
contributions %>% 
  summarise(total = sum(contribution_amount))
```

### What groups or individuals are the top donors to each party?

```{r echo=FALSE}
contributions %>% 
  filter(contributor_name != 'Total of Contributions not exceeding $100') %>% 
  group_by(contributor_name, party) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
```


### What groups or people donated to candidates from both parties?

```{r echo=FALSE}
contributions %>%
  filter(contributor_name != 'Total of Contributions not exceeding $100') %>% 
  select(
    contributor_name, party
  ) %>% 
  distinct() %>% 
  group_by(contributor_name) %>%
  summarise(numParties = n()) %>% 
  filter( numParties > 1) %>% 
  arrange(desc(numParties)) %>% 
  datatable(options = list(pageLength = 10))

```



### Contributions where `contributor_name` contains "Police"
```{r echo=FALSE}
contributions %>% 
  filter(grepl("Police", contributor_name, ignore.case=TRUE)) %>% 
  datatable(options = list(pageLength = 10))
  
```



### *Individuals*

### How much money has been contributed by individuals total?
```{r echo=FALSE}
contributions.individuals %>% 
  summarise(total = sum(contribution_amount))
```

### How much money has been contributed by individuals to each party
```{r}
contributions.individuals %>% 
  group_by(party) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  datatable(options = list(pageLength = 10))
```

### Who the top donors among individuals?

```{r}
contributions.individuals %>% 
  group_by(contributor_name) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
```

### Who the top donors by party among individuals?

```{r}
contributions.individuals %>% 
  group_by(contributor_name, party) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
```

### How much money has been contributed to each office (primary and general) by individuals?
```{r}
contributions.individuals %>% 
  group_by(office, party) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
```

### How much money has been contributed to each candidate by individuals?
```{r}
contributions.individuals %>% 
  group_by(ballotName, party) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
```


### How much money has been contributed to each general election candidate by individuals?
```{r}
contributions.individuals %>%
  filter(inGeneral == 1) %>% 
  group_by(ballotName) %>% 
  summarise(total = sum(contribution_amount)) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
```
### How many people donated to multiple candidates?
```{r}

contributions.individuals %>% 
  select(
    contributor_name, committee
  ) %>% 
  distinct() %>% 
  group_by(contributor_name) %>%
  summarise(numCandidates = n()) %>% 
  ungroup() %>% 
  group_by(numCandidates) %>% 
  summarise(group_count = n()) %>% 
  datatable(options = list(pageLength = 10))


```


### How many people donated to candidates from both parties?

```{r}
contributions.individuals %>% 
  select(
    contributor_name, party 
  ) %>% 
  distinct() %>% 
  group_by(contributor_name) %>%
  summarise(numParties = n()) %>% 
  ungroup() %>% 
  group_by(numParties) %>% 
  summarise(group_count = n()) %>% 
  datatable(options = list(pageLength = 10))

```


***

```{r include=FALSE}

outside_groups <- c("Out-of-State or Federal Committee","Individual", "Business/Group/Organization", "Political Action Committee", "Labor Union", "Non-Profit Organization")

carney_murray_group <- contributions %>% 
  filter(
      contribution_type %in% c("Check", "Electronic Fund Transfer", "Credit Card", "Cash", "Total of Contributions not exceeding $100"),
      contributor_type %in% outside_groups,
      receiving_committee %in% c('Friends for John Carney', 'Murray for Delaware')
      # contribution_type %in% c("Check", "Electronic Fund Transfer", "Credit Card", "Cash", "Total of Contributions not exceeding $100")
    )
```



### How much money John Carney and Julianne Murray received in donations from individuals
```{r echo=FALSE}
carney_murray_group %>%
  filter(contributor_type %in% c("Individual","Total of Contributions not exceeding $100")) %>% 
  group_by(receiving_committee) %>% 
  summarise(total = sum(contribution_amount) )
```

### How much money John Carney and Julianne Murray received in donations from PACS, business groups, labor uniions, and non-profit organizations
```{r echo=FALSE}
carney_murray_group %>%
  filter(contributor_type %!in% c("Individual","Total of Contributions not exceeding $100")) %>% 
  group_by(receiving_committee) %>% 
  summarise(total = sum(contribution_amount) )
```

### John Carney and Julianne Murray donations from PACS, business groups, labor uniions, and non-profit organizations broken down
```{r echo=FALSE}
carney_murray_group %>%
  filter(contributor_type %!in% c("Individual","Total of Contributions not exceeding $100")) %>% 
  group_by(receiving_committee, contributor_name) %>% 
  summarise(total = sum(contribution_amount) ) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))
```


### How much money John Carney and Julianne Murray received in donations from individuals, PACS, business groups, labor uniions, and non-profit organizations (This is everything except Candidate Committee, Self (Candidate), Political Committee, , and Dem or Rep National Sub-Committees)
```{r echo=FALSE}
carney_murray_group %>%
  group_by(receiving_committee) %>% 
  summarise(total = sum(contribution_amount) )
```



***
### How much did legislative candidates receive?

```{r}

contributions %>% 
  filter(
    str_detect(office, 'State'),
    contribution_type %in% c("Check", "Electronic Fund Transfer", "Credit Card", "Cash", "Total of Contributions not exceeding $100")
  ) %>% 
  select(
    contributor_name,
    contributor_type,
    contribution_type,
    contribution_amount,
    ballotName
  ) %>% 
  mutate(
    contributor_type_group = case_when(
      contributor_type %in% c("Individual","Total of Contributions not exceeding $100") ~ 'individual',
      contributor_type == 'Candidate Committee' ~ 'Candidate Committee',
      contributor_type %in% outside_groups ~ 'outside group',
      contributor_type == 'Self (Candidate)' ~ 'self',
      TRUE ~ 'other'
    )
  ) %>% 
  group_by(
    ballotName,
    contributor_type_group
  ) %>% 
  summarise(
    total = round(sum(contribution_amount), 0)
  ) %>%
  pivot_wider(
    id_cols = ballotName,
    names_from = contributor_type_group,
    values_from = total
  ) %>%
  mutate(
    total = round(sum(c(individual, `Candidate Committee`, `outside group`, other, self), na.rm=T), 0)
  ) %>% 
  arrange(desc(total)) %>% 
  datatable(options = list(pageLength = 10))


```



