Assignment Week 10

Including Plots

You can also embed plots, for example:

nrc_joy <- get_sentiments("nrc") %>% 
  filter(sentiment == "joy")

tidy_books %>%
  filter(book == "Emma") %>%
  inner_join(nrc_joy) %>%
  count(word, sort = TRUE)

## Joining with `by = join_by(word)`

## # A tibble: 301 × 2
##    word          n
##    <chr>     <int>
##  1 good        359
##  2 friend      166
##  3 hope        143
##  4 happy       125
##  5 love        117
##  6 deal         92
##  7 found        92
##  8 present      89
##  9 kind         82
## 10 happiness    76
## # ℹ 291 more rows

Note that the echo = FALSE parameter was added to the code chunk to prevent printing of the R code that generated the plot.

jane_austen_sentiment <- tidy_books %>%
  inner_join(get_sentiments("bing"))  |> 
  count(book, index = linenumber %/% 80, sentiment) |>
  pivot_wider(names_from = sentiment, values_from =n, values_fill = 0) |>
  mutate(sentiment = positive - negative)

## Joining with `by = join_by(word)`

## Warning in inner_join(., get_sentiments("bing")): Detected an unexpected many-to-many relationship between `x` and `y`.
## ℹ Row 435434 of `x` matches multiple rows in `y`.
## ℹ Row 5051 of `y` matches multiple rows in `x`.
## ℹ If a many-to-many relationship is expected, set `relationship =
##   "many-to-many"` to silence this warning.

pride_prejudice <- tidy_books |>
                   filter(book == "Pride & Prejudice")

afinn <- pride_prejudice |>
         inner_join(get_sentiments("afinn")) |>
         group_by(index = linenumber %/% 80) |>
         summarise(sentiment = sum(value)) |>
         mutate(method = "AFINN")

## Joining with `by = join_by(word)`

bing_and_nrc <- bind_rows(
  pride_prejudice |>
    inner_join(get_sentiments("bing"))|>
    mutate(method = "Bing et al."),
  pride_prejudice |> 
    inner_join(get_sentiments("nrc") |>
                 filter(sentiment %in% c("positive",
                                          "negative"))
    ) |>
    mutate(method = "NRC")) |>
    count(method, index = linenumber %/% 80, sentiment) |>
  pivot_wider(names_from = sentiment,
              values_from = n,
              values_fill = 0) |>
  mutate(sentiment = positive - negative)

## Joining with `by = join_by(word)`
## Joining with `by = join_by(word)`

## Warning in inner_join(pride_prejudice, filter(get_sentiments("nrc"), sentiment %in% : Detected an unexpected many-to-many relationship between `x` and `y`.
## ℹ Row 215 of `x` matches multiple rows in `y`.
## ℹ Row 5178 of `y` matches multiple rows in `x`.
## ℹ If a many-to-many relationship is expected, set `relationship =
##   "many-to-many"` to silence this warning.

book_lines <- tidy_books |>
                   filter(book == "Pride & Prejudice")

sents <- c("positive", "negative")
lou_and_nrc <- bind_rows(
  book_lines |>
    inner_join(get_sentiments("nrc")) |>
    filter(sentiment %in% sents ),
  book_lines |>
    inner_join(get_sentiments("loughran")) |>
    filter(sentiment %in% sents )
) |> 
  group_by(book, chapter, sentiment) |>
  summarise(n = n()) |>
   pivot_wider(names_from = sentiment,
              values_from = n,
              values_fill = 0) |>
  mutate(sentiment = positive - negative)

## Joining with `by = join_by(word)`

## Warning in inner_join(book_lines, get_sentiments("nrc")): Detected an unexpected many-to-many relationship between `x` and `y`.
## ℹ Row 1 of `x` matches multiple rows in `y`.
## ℹ Row 12737 of `y` matches multiple rows in `x`.
## ℹ If a many-to-many relationship is expected, set `relationship =
##   "many-to-many"` to silence this warning.

## Joining with `by = join_by(word)`

## Warning in inner_join(book_lines, get_sentiments("loughran")): Detected an unexpected many-to-many relationship between `x` and `y`.
## ℹ Row 3 of `x` matches multiple rows in `y`.
## ℹ Row 2826 of `y` matches multiple rows in `x`.
## ℹ If a many-to-many relationship is expected, set `relationship =
##   "many-to-many"` to silence this warning.

## `summarise()` has grouped output by 'book', 'chapter'. You can override using
## the `.groups` argument.

book_lines |>
  filter(chapter == 36) |>
  count(word) |>
  wordcloud2(size = 1.5)

Assignment Week 10

Jonathan Cruz

2024-03-31

Including Plots