How to create advanced plots

Wordcloud

# load Packages
require(RColorBrewer)

## Loading required package: RColorBrewer

require(tidyverse)

## Loading required package: tidyverse

## ── Attaching packages ─────────────────────────────────────── tidyverse 1.3.1 ──

## ✔ tibble  3.1.6     ✔ dplyr   1.0.8
## ✔ tidyr   1.2.0     ✔ stringr 1.4.0
## ✔ readr   2.1.2     ✔ forcats 0.5.1
## ✔ purrr   0.3.4

## ── Conflicts ────────────────────────────────────────── tidyverse_conflicts() ──
## ✖ dplyr::filter() masks stats::filter()
## ✖ dplyr::lag()    masks stats::lag()

require(magrittr)

## Loading required package: magrittr

## 
## Attaching package: 'magrittr'

## The following object is masked from 'package:purrr':
## 
##     set_names

## The following object is masked from 'package:tidyr':
## 
##     extract

require(ggwordcloud)

## Loading required package: ggwordcloud

library(SnowballC)
library(tm)

## Loading required package: NLP

## 
## Attaching package: 'NLP'

## The following object is masked from 'package:ggplot2':
## 
##     annotate

# Load the King James Version verses and keep only the rows whose `book`
# code is "joh", retaining just the `text` column.
# The `sacred` package is installed from GitHub:
# devtools::install_github("JohnCoene/sacred")
scripture <- sacred::king_james_version

john <- dplyr::select(
  dplyr::filter(scripture, book == "joh"),
  text
)

# Wrap the selected text in a tm volatile corpus.
# NOTE(review): `john` is a one-column data frame rather than a character
# vector, so VectorSource() presumably sees a single element (the whole
# `text` column) and the corpus holds one document. The later
# rename(word = 1, freq = 2) step depends on the term-document matrix having
# exactly one document column -- confirm before switching to john$text.
john.corpus <- tm::VCorpus(tm::VectorSource(john))

# Transformer that substitutes a single space for every match of `pattern`
# (a regular expression handed to gsub()).
toSpace <- content_transformer(function(x, pattern) {
  gsub(pattern, " ", x)
})

# Blank out separator characters, one pattern per pass.
# NOTE(review): the second pattern replaces a space with a space, which looks
# like a no-op; possibly another character was intended here -- confirm.
john.corpus <- tm_map(john.corpus, toSpace, "/")
john.corpus <- tm_map(john.corpus, toSpace, " ")
john.corpus <- tm_map(john.corpus, toSpace, "\\|")

# Normalise the corpus text before counting words.
# The steps run in this order:
#   1. lower-case everything,
#   2. drop digits,
#   3. drop standard English stopwords,
#   4. drop a hand-picked list of archaic / uninformative words,
#   5. strip punctuation,
#   6. collapse runs of whitespace.
# Because lower-casing happens first and removeWords() matches
# case-sensitively, every entry in the custom list must be lower case
# (hence "o", not "O").
john.corpus <- john.corpus %>%
  tm_map(content_transformer(tolower)) %>%
  tm_map(removeNumbers) %>%
  tm_map(removeWords, stopwords("english")) %>%
  tm_map(
    removeWords,
    c(
      "ye", "o", "unto", "yet", "thee", "wherein", "neither", "shall",
      "saith", "host", "will", "offer", "say"
    )
  ) %>%
  tm_map(removePunctuation) %>%
  tm_map(stripWhitespace)

 

# Count how often each term occurs.
# The corpus is turned into a term-document matrix (numbers and stopwords
# removed, terms stemmed), then into a data frame whose row names (the terms)
# become the first column `word`; the second column is renamed `freq`.
# Rows are ordered from most to least frequent.
john.corpus.tb <- john.corpus %>%
  tm::TermDocumentMatrix(
    control = list(
      removeNumbers = TRUE,
      stopwords = TRUE,
      stemming = TRUE
    )
  ) %>%
  as.matrix() %>%
  as.data.frame() %>%
  tibble::rownames_to_column(var = "word") %>%
  dplyr::rename(freq = 2) %>%
  dplyr::arrange(dplyr::desc(freq))


# Draw the word cloud, shaped by a PNG mask image.

# Relabel the first row's term for display.
# NOTE(review): this overwrites whichever word is in row 1 (the most frequent
# term after sorting) without checking what it is -- confirm that is the
# intended term.
john.corpus.tb[1, "word"] <- "Yeshua"

# Location of the mask image. Kept in one place so it is easy to adapt on
# another machine, and checked up front so a missing file produces a clear
# error instead of a failure from inside the plotting call.
mask_path <- "C:\\Users\\hed2\\Downloads\\mask.png"
if (!file.exists(mask_path)) {
  stop("Word-cloud mask image not found: ", mask_path, call. = FALSE)
}

# Fix the RNG state: the rotation angles below are drawn with sample().
set.seed(42)
ggplot(
  john.corpus.tb,
  aes(label = word, size = freq, color = freq)
) +
  geom_text_wordcloud_area(
    # Each word gets an angle that is a multiple of 45 degrees in
    # [-90, 90]; the weights make 0 degrees four times as likely as any
    # other angle.
    aes(
      angle = 45 * sample(
        -2:2, nrow(john.corpus.tb),
        replace = TRUE,
        prob = c(1, 1, 4, 1, 1)
      )
    ),
    mask = png::readPNG(mask_path),
    rm_outside = TRUE
  ) +
  scale_size_area(max_size = 20) +
  theme_minimal() +
  # Alternative palette:
  # scale_color_brewer(palette = "Paired", direction = -1)
  scale_color_gradient(low = "blue", high = "darkred")

## Some words could not fit on page. They have been removed.

Map using shinyapps.io

Map

[click here](https://pl8ev5-dian-he.shinyapps.io/map_x/)

GIF using PPT

Starry sky

Fish

How to create advanced plots

Daniel

9-12-2022

How to create advanced plots

Animated chart

Wordcloud

Map using shinyapps.io

GIF using PPT