Q1

q1  <- movies %>%  
  rename(movie_title = Film , release_year = Year)

print(head(q1))

Q2

selected_movies <- q1 %>%
  select(movie_title, release_year, Genre, Profitability)

print(selected_movies)

Q3

filtered_movies <- movies %>%
  filter(Year > 2000, `Rotten Tomatoes %` > 80)

print(filtered_movies)

Q4

movies_with_profitability <- movies %>%
  mutate(Profitability_millions = Profitability * 1000000)

print(movies_with_profitability)

Q5

sorted_movies <- movies_with_profitability %>%
  arrange(desc(`Rotten Tomatoes %`), desc(Profitability_millions))

print(sorted_movies)

Q6

final_dataframe <- movies %>%
  rename(
    movie_title = Film,
    release_year = Year
  ) %>%
  filter(release_year > 2000, `Rotten Tomatoes %` > 80) %>%
  mutate(Profitability_millions = Profitability * 1000000) %>%
  arrange(desc(`Rotten Tomatoes %`), desc(Profitability_millions))

print(final_dataframe)

Q7

# while some of the movies with high rotten tomatoes % have high audience score %, 
# there are also movies with low rotten tomatoes % and high audience score (like twilight)
# some also have high rotten tomatoes % and low audience score % (rachel getting married)

Extra Credit

summary_dataframe <- movies %>%
  rename(
    movie_title = Film,
    release_year = Year
  ) %>%
  mutate(Profitability_millions = Profitability * 1000000) %>%
  group_by(Genre) %>%
  summarize(
    average_rating = mean(`Rotten Tomatoes %`, na.rm = TRUE),
    average_profitability = mean(Profitability_millions, na.rm = TRUE)
  )

  print(summary_dataframe)