library(tidyverse)
data <- read_csv("youtube.csv")
Rows: 130390 Columns: 16
── Column specification ────────────────────────────────────────────────────────────────────────────────────────
Delimiter: ","
chr  (7): video_id, title, channelId, channelTitle, tags, thumbnail_link, description
dbl  (5): categoryId, view_count, likes, dislikes, comment_count
lgl  (2): comments_disabled, ratings_disabled
dttm (2): publishedAt, trending_date

ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
data <- unique(data)

General

Data

data

Like/Dislike ratios

head(data$likes / data$dislikes)
[1]  26.79898  52.51933 134.62215  12.52748  47.51245 103.86997
mean(head(data$likes / data$dislikes, n=1000))
[1] 67.98741

Most disliked

videos <- data %>%
  arrange(dislikes)
tail(videos, n=1)

Most Common

videos <- data %>%
  arrange(view_count)
tail(videos, n=1)

Spam checking

Comments

Videos with lots of comments are likely filled of spam.

Music videos for some reason keeps getting hit in the data, so let’s exclude it.

Big channels are showing up, lets limit the view count

This part of the report is not useful

videos <- data %>%
  filter(categoryId != 10) %>%
  filter(view_count < 100000) %>%
  filter(!comments_disabled) %>%
  select(title, comment_count) %>%
  arrange(comment_count)
tail(videos, n = 16)

Gaming

Everyone loves gaming, including me, so lets find some info about that. Gaming videos are popular, so we should find some results

Minecraft

Everyone loves MC.

videos <- data %>%
  filter(categoryId == 20) %>%
  filter(grepl("Minecraft", title))
videos
LS0tDQp0aXRsZTogIllvdXR1YmUgRURBIg0Kb3V0cHV0OiBodG1sX25vdGVib29rDQotLS0NCg0KYGBge3Igc2V0dXB9DQpsaWJyYXJ5KHRpZHl2ZXJzZSkNCmRhdGEgPC0gcmVhZF9jc3YoInlvdXR1YmUuY3N2IikNCmRhdGEgPC0gdW5pcXVlKGRhdGEpDQpgYGANCg0KIyBHZW5lcmFsDQoNCiMjIERhdGENCg0KYGBge3J9DQpkYXRhDQpgYGANCg0KIyMgTGlrZS9EaXNsaWtlIHJhdGlvcw0KDQpgYGB7cn0NCmhlYWQoZGF0YSRsaWtlcyAvIGRhdGEkZGlzbGlrZXMpDQptZWFuKGhlYWQoZGF0YSRsaWtlcyAvIGRhdGEkZGlzbGlrZXMsIG49MTAwMCkpDQpgYGANCg0KIyMgTW9zdCBkaXNsaWtlZA0KDQpgYGB7cn0NCnZpZGVvcyA8LSBkYXRhICU+JQ0KICBhcnJhbmdlKGRpc2xpa2VzKQ0KdGFpbCh2aWRlb3MsIG49MSkNCmBgYA0KDQojIyBNb3N0IENvbW1vbg0KDQpgYGB7cn0NCnZpZGVvcyA8LSBkYXRhICU+JQ0KICBhcnJhbmdlKHZpZXdfY291bnQpDQp0YWlsKHZpZGVvcywgbj0xKQ0KYGBgDQoNCiMgU3BhbSBjaGVja2luZw0KDQojIyBDb21tZW50cw0KDQpWaWRlb3Mgd2l0aCBsb3RzIG9mIGNvbW1lbnRzIGFyZSBsaWtlbHkgZmlsbGVkIG9mIHNwYW0uDQoNCk11c2ljIHZpZGVvcyBmb3Igc29tZSByZWFzb24ga2VlcHMgZ2V0dGluZyBoaXQgaW4gdGhlIGRhdGEsIHNvIGxldCdzIGV4Y2x1ZGUgaXQuDQoNCkJpZyBjaGFubmVscyBhcmUgc2hvd2luZyB1cCwgbGV0cyBsaW1pdCB0aGUgdmlldyBjb3VudA0KDQpUaGlzIHBhcnQgb2YgdGhlIHJlcG9ydCBpcyBub3QgdXNlZnVsDQoNCmBgYHtyfQ0KdmlkZW9zIDwtIGRhdGEgJT4lDQogIGZpbHRlcihjYXRlZ29yeUlkICE9IDEwKSAlPiUNCiAgZmlsdGVyKHZpZXdfY291bnQgPCAxMDAwMDApICU+JQ0KICBmaWx0ZXIoIWNvbW1lbnRzX2Rpc2FibGVkKSAlPiUNCiAgc2VsZWN0KHRpdGxlLCBjb21tZW50X2NvdW50KSAlPiUNCiAgYXJyYW5nZShjb21tZW50X2NvdW50KQ0KdGFpbCh2aWRlb3MsIG4gPSAxNikNCmBgYA0KDQojIEdhbWluZw0KDQpFdmVyeW9uZSBsb3ZlcyBnYW1pbmcsIGluY2x1ZGluZyBtZSwgc28gbGV0cyBmaW5kIHNvbWUgaW5mbyBhYm91dCB0aGF0LiBHYW1pbmcgdmlkZW9zIGFyZSBwb3B1bGFyLCBzbyB3ZSBzaG91bGQgZmluZCBzb21lIHJlc3VsdHMNCg0KIyMgTWluZWNyYWZ0DQpFdmVyeW9uZSBsb3ZlcyBNQy4NCg0KYGBge3J9DQp2aWRlb3MgPC0gZGF0YSAlPiUNCiAgZmlsdGVyKGNhdGVnb3J5SWQgPT0gMjApICU+JQ0KICBmaWx0ZXIoZ3JlcGwoIk1pbmVjcmFmdCIsIHRpdGxlKSkNCnZpZGVvcw0KYGBg