Randomly fetch threads from the subreddits r/politics, r/PoliticalHumor, and r/PoliticalDiscussion, where they appear in the top 10 pages of each subreddit's search results - Search date: Apr 2nd, 2021
# Top 20 pages of threads in r/politics, searched on Apr 2nd, 2021; duplicate comments are removed
#politics <- get_reddit(search_terms = "China", subreddit = "politics", cn_threshold = 10, sort_by = "comments", page_threshold = 1)
#politics_1 <- get_reddit(search_terms = "Chinese", subreddit = "politics", cn_threshold = 10, sort_by = "comments", page_threshold = 1)
#keyword_china_1 <- rbind(politics,politics_1)
#keyword_china_1 <- keyword_china_1 %>% distinct(comment, .keep_all= TRUE)
#write.csv(keyword_china_1,"keyword_china_1.csv", row.names = TRUE)
# Top 10 pages of threads in r/PoliticalHumor, searched on Apr 2nd, 2021; duplicate comments are removed
#PoliticalHumor <- get_reddit(search_terms = "China", subreddit = "PoliticalHumor", cn_threshold = 10, sort_by = "comments", page_threshold = 1)
#PoliticalHumor_1 <- get_reddit(search_terms = "Chinese", subreddit = "PoliticalHumor", cn_threshold = 10, sort_by = "comments", page_threshold = 1)
#keyword_china_2 <- rbind(PoliticalHumor,PoliticalHumor_1)
#keyword_china_2 <- keyword_china_2 %>% distinct(comment, .keep_all= TRUE)
#write.csv(keyword_china_2,"keyword_china_2.csv", row.names = TRUE)
# Top 10 pages of threads in r/PoliticalDiscussion, searched on Apr 2nd, 2021; duplicate comments are removed
#PoliticalDiscussion <- get_reddit(search_terms = "China", subreddit = "PoliticalDiscussion", cn_threshold = 10, sort_by = "comments", page_threshold = 1)
#PoliticalDiscussion_1 <- get_reddit(search_terms = "Chinese", subreddit = "PoliticalDiscussion", cn_threshold = 10, sort_by = "comments", page_threshold = 1)
#keyword_china_3 <- rbind(PoliticalDiscussion,PoliticalDiscussion_1)
#keyword_china_3 <- keyword_china_3 %>% distinct(comment, .keep_all= TRUE)
#write.csv(keyword_china_3,"keyword_china_3.csv", row.names = TRUE)
#combine data from three subreddits into one
#keyword_china_combine <- rbind(keyword_china_1,keyword_china_2,keyword_china_3)
# Remove rows with NA values in the comment, comm_date, or post_date columns
#keyword_china_combine <- keyword_china_combine %>% drop_na(comment)
#keyword_china_combine <- keyword_china_combine %>% drop_na(comm_date)
#keyword_china_combine <- keyword_china_combine %>% drop_na(post_date)
#write.csv(keyword_china_combine,"keyword_china_combine.csv", row.names = TRUE)
#saveRDS(keyword_china_combine, file = "keyword_china_combine.rds")
# Load the combined comment data from its cached .rds file (the file written
# by the commented-out saveRDS() call above) rather than re-running the
# disabled scraping steps.
keyword_china_combine <- readRDS("keyword_china_combine.rds")