# Scrape the HTML tables from Wikipedia's "2024 in film" page and preview the
# first one.
#
# Steps:
#   1. Make sure the robotstxt package is available.
#   2. Check the site's robots.txt to confirm the page may be fetched.
#   3. Download the page and parse every <table> element into a data frame.
#   4. Preview the first parsed table.

# Install robotstxt only when it is missing, so re-running the script does not
# reinstall the package every time.
if (!requireNamespace("robotstxt", quietly = TRUE)) {
  install.packages("robotstxt")
}

library(robotstxt)
library(rvest)

url <- "https://en.wikipedia.org/wiki/2024_in_film"

# Query robots.txt once and reuse the answer, both for display and as a gate.
is_allowed <- paths_allowed(url)
is_allowed

# Do not fetch the page unless robots.txt explicitly permits it. isTRUE() also
# treats NA (e.g. robots.txt could not be retrieved) as "not allowed".
if (!isTRUE(is_allowed)) {
  stop("robots.txt does not permit scraping: ", url, call. = FALSE)
}

webpage <- read_html(url)

# Select every <table> node on the page and convert each to a data frame.
tables <- html_nodes(webpage, "table")
film_tables <- lapply(tables, html_table, fill = TRUE)

# Fail with a clear message instead of an opaque "subscript out of bounds".
if (length(film_tables) == 0L) {
  stop("No tables found at: ", url, call. = FALSE)
}

# NOTE(review): assumes the first table on the page is the highest-grossing
# films table; the page layout may change, so confirm before relying on it.
highest_grossing <- film_tables[[1]]
head(highest_grossing)