library(RMySQL)
## Loading required package: DBI
# Connection settings for the local MySQL instance that holds the survey data.
dbuser <- "data607"
# NOTE(review): a credential in source control is a security risk. The password
# can be supplied through the MOVIES_DB_PASSWORD environment variable; the
# original literal is kept only as a backward-compatible fallback.
dbpassword <- Sys.getenv("MOVIES_DB_PASSWORD", unset = "password1!")
db_name <- "movies"
db_table <- "rankings"
db_host <- "127.0.0.1"
db_port <- 3306

mydb <- dbConnect(
  MySQL(),
  user = dbuser,
  password = dbpassword,
  dbname = db_name,
  host = db_host,
  port = db_port
)

# Build the query from db_table so the configured table name is actually used
# (it was previously defined but ignored in favour of a hard-coded name).
rs <- dbSendQuery(mydb, paste("select * from", db_table))

# n = -1 retrieves every pending row. dbFetch() is the DBI-recommended
# replacement for the legacy fetch().
data <- dbFetch(rs, n = -1)

# Release the server-side result set and close the connection: everything
# below works on the in-memory data frame only, so keeping them open just
# leaks resources. invisible() suppresses the TRUE these calls return.
invisible(dbClearResult(rs))
invisible(dbDisconnect(mydb))
# Summarise the survey per movie: how many respondents gave a rating and what
# the mean rating was. A missing (NA) rating is counted as "not seen".
data_rows <- nrow(data)

# Ratings per movie with the NA entries dropped.
dumbo_scores <- na.omit(data[, "dumbo_2019"])
aladdin_scores <- na.omit(data[, "aladdin_2019"])
lionking_scores <- na.omit(data[, "lionking_2019"])
toystory4_scores <- na.omit(data[, "toystory4"])
ralphbreaks_scores <- na.omit(data[, "ralphbreaks"])
incredible2_scores <- na.omit(data[, "incredibles2"])

# Number of respondents who rated each movie.
dumbo_seen <- length(dumbo_scores)
aladdin_seen <- length(aladdin_scores)
lionking_seen <- length(lionking_scores)
toystory4_seen <- length(toystory4_scores)
ralphbreaks_seen <- length(ralphbreaks_scores)
incredible2_seen <- length(incredible2_scores)

# Display titles, in the same order as the statistics below.
titles <- c(
  "Dumbo(2019)",
  "Aladdin(2019)",
  "The Lion King (2019)",
  "Toy Story 4",
  "Ralph Breaks The Internet",
  "The Incredibles 2"
)

# Fraction of all respondents who rated each movie.
perc_seen <- c(
  dumbo_seen,
  aladdin_seen,
  lionking_seen,
  toystory4_seen,
  ralphbreaks_seen,
  incredible2_seen
) / data_rows

# Mean rating among the respondents who rated each movie.
avg_score <- vapply(
  list(
    dumbo_scores,
    aladdin_scores,
    lionking_scores,
    toystory4_scores,
    ralphbreaks_scores,
    incredible2_scores
  ),
  mean,
  numeric(1)
)

# data.frame() turns the quoted names into syntactic ones, so the resulting
# columns are Movie.Titles, Percentage.Seen and Avg.Score.
calc_df <- data.frame(
  "Movie Titles" = titles,
  "Percentage Seen" = perc_seen,
  "Avg Score" = avg_score
)
print(calc_df)
##                Movie.Titles Percentage.Seen Avg.Score
## 1               Dumbo(2019)       0.6666667  3.250000
## 2             Aladdin(2019)       0.8333333  3.800000
## 3      The Lion King (2019)       0.6666667  3.500000
## 4               Toy Story 4       0.8333333  3.800000
## 5 Ralph Breaks The Internet       0.6666667  4.500000
## 6         The Incredibles 2       1.0000000  4.166667
# Bar chart of the mean rating per movie. las = 2 draws the axis labels
# perpendicular to the axis. names.arg is spelled out in full rather than
# relying on partial matching of the abbreviated `names`.
barplot(
  calc_df$Avg.Score,
  names.arg = calc_df$Movie.Titles,
  main = "Avg Score of Movies",
  xlab = "Movie",
  las = 2
)

# Pie charts of respondents who did / did not rate a given movie; the second
# slice is the remainder of the survey population.
pie(
  c(dumbo_seen, data_rows - dumbo_seen),
  labels = c("Seen Dumbo", "Did Not See Dumbo"),
  main = "Survey Takers Who Saw Dumbo (2019)"
)
pie(
  c(toystory4_seen, data_rows - toystory4_seen),
  labels = c("Seen Toy Story 4", "Did Not See Toy Story 4"),
  main = "Survey Takers Who Saw Toy Story 4"
)