1. Scrape the table tall buildings (300m+) currently under construction from https://en.wikipedia.org/wiki/List_of_tallest_buildings_in_the_world Table: Denotes building that is or was once the tallest in the world.
url <-  "https://en.wikipedia.org/wiki/List_of_tallest_buildings_in_the_world"
 h <- read_html(url)
 tab <- h %>% html_nodes("table")
 tab <- tab[[2]] %>% html_table
#tab <- tab %>% setNames(c("Rank", "Name","Image" , "City","Country","Height (m)", "Height (ft)"  ,"Floors", "Years" , "Notes"))

names(tab) <- tab[1,]
tab <- tab[-1,]

tab
  1. Scrape the table tall buildings (300m+) currently under construction from https://en.wikipedia.org/wiki/List_of_tallest_buildings_in_the_world Table: Denotes building with pinnacle height higher than architectural.
url <-  "https://en.wikipedia.org/wiki/List_of_tallest_buildings_in_the_world"
 h <- read_html(url)
 tab <- h %>% html_nodes("table")
 tab <- tab[[4]] %>% html_table
tab <- tab %>% setNames(c("Rank", "Building", "City" ,"Country", "Height (m)", "Height (ft)", "Floors" ,"Built"))
tab
  1. Scrape the table tall buildings (300m+) currently under construction from https://en.wikipedia.org/wiki/List_of_tallest_buildings_in_the_world Table: Height to occupied floor
url <-  "https://en.wikipedia.org/wiki/List_of_tallest_buildings_in_the_world"
 h <- read_html(url)
 tab <- h %>% html_nodes("table")
 tab <- tab[[5]] %>% html_table
tab <- tab %>% setNames(c("Rank", "Building", "City" ,"Country", "Height ", "Floors" ,"Built"))
tab
  1. Scrape the table tall buildings (300m+) currently under construction from https://en.wikipedia.org/wiki/List_of_tallest_buildings_in_the_world Table: Buildings under construction
url <-  "https://en.wikipedia.org/wiki/List_of_tallest_buildings_in_the_world"
 h <- read_html(url)
 tab <- h %>% html_nodes("table")
 tab <- tab[[6]] %>% html_table
tab <- tab %>% setNames(c("Building", "Planned architectural height", "Floors", "Planned completion" 
                           ,   "Country", "City" , "Ref."))
tab
  1. Scrape the table tall buildings (300m+) currently under construction from https://en.wikipedia.org/wiki/List_of_tallest_buildings_in_the_world Table: List by continent
url <-  "https://en.wikipedia.org/wiki/List_of_tallest_buildings_in_the_world"
 h <- read_html(url)
 tab <- h %>% html_nodes("table")
 tab <- tab[[7]] %>% html_table
tab <- tab %>% setNames(c("Countinent", "Building", "height" , "Floors Count", "Completed" ,   "Country", "City" ))
tab
  1. Scrape the table for editorial-board-members from http://www.ijeais.org/ijeais/index.php/editorial-board-members/
url <-  "http://www.ijeais.org/ijeais/index.php/editorial-board-members/"
 h <- read_html(url)
 tab <- h %>% html_nodes("table")
 tab <- tab[[1]] %>% html_table
tab <- tab %>% setNames(c("Name","Branch","Institution/Affiliation","Country" ))
tab
  1. Scrap titles from this webpage https://www.imdb.com/search/title/?title_type=feature&num_votes=25000,&genres=adventure
 html_Content <- read_html("https://www.imdb.com/search/title/?title_type=feature&num_votes=25000,&genres=adventure") 
  
titles <-  html_Content %>% html_nodes(".lister-item-header") %>% html_node("a") %>%
    html_text()

library(stringr)
titles <- str_replace_all(titles, "[\r\n]" , "")
titles <- str_replace_all(titles, " " , "")


titles_data <- class.df<- data.frame(titles)
titles_data
  1. Scrap Years from this webpage https://www.imdb.com/search/title/?title_type=feature&num_votes=25000,&genres=adventure
 
years <-  html_Content %>% html_nodes(".lister-item-year") %>%
    html_text()


  years_data <- class.df<- data.frame(years)
years_data
  1. Scrap Ratings from this webpage https://www.imdb.com/search/title/?title_type=feature&num_votes=25000,&genres=adventure
 
 
ratings <-  html_Content %>% html_nodes(".ratings-imdb-rating") %>%
    html_text()

ratings <- str_replace_all(ratings, "[\r\n]" , "")
ratings <- str_replace_all(ratings, " " , "")

  ratings_data <- class.df<- data.frame(ratings)
ratings_data
  1. Scrap the synopsis of the movies from this webpage https://www.imdb.com/search/title/?title_type=feature&num_votes=25000,&genres=adventure Use: .ratings-bar+ .text-muted
synopsis <-  html_Content %>% html_nodes(".ratings-bar+ .text-muted") %>%
    html_text()

synopsis <- str_replace_all(synopsis, "[\r\n]" , "")
synopsis <- str_replace_all(synopsis, " " , "")

synopsis_data <- class.df<- data.frame(synopsis)
synopsis_data
NA
  1. Create a data frame using our variables as a column from #7…..#10
complete_data <- class.df<- data.frame(titles , years ,ratings ,  synopsis )
complete_data
NA
LS0tDQp0aXRsZTogIkludHJvZHVjdGlvbiB0byBEYXRhIFNjaWVuY2UgSG9tZXdvcmsxIg0Kb3V0cHV0OiBodG1sX25vdGVib29rDQotLS0NCg0KDQpgYGB7ciB3YXJuaW5nPUZBTFNFLGVjaG89RkFMU0V9DQpsaWJyYXJ5KHJ2ZXN0KQ0KDQpgYGANCg0KDQoqDQoxLiBTY3JhcGUgdGhlIHRhYmxlIHRhbGwgYnVpbGRpbmdzICgzMDBtKykgY3VycmVudGx5IHVuZGVyIGNvbnN0cnVjdGlvbiBmcm9tIGh0dHBzOi8vZW4ud2lraXBlZGlhLm9yZy93aWtpL0xpc3Rfb2ZfdGFsbGVzdF9idWlsZGluZ3NfaW5fdGhlX3dvcmxkDQpUYWJsZTogRGVub3RlcyBidWlsZGluZyB0aGF0IGlzIG9yIHdhcyBvbmNlIHRoZSB0YWxsZXN0IGluIHRoZSB3b3JsZC4NCiogDQpgYGB7ciB3YXJuaW5nPUZBTFNFfQ0KdXJsIDwtICAiaHR0cHM6Ly9lbi53aWtpcGVkaWEub3JnL3dpa2kvTGlzdF9vZl90YWxsZXN0X2J1aWxkaW5nc19pbl90aGVfd29ybGQiDQogaCA8LSByZWFkX2h0bWwodXJsKQ0KIHRhYiA8LSBoICU+JSBodG1sX25vZGVzKCJ0YWJsZSIpDQogdGFiIDwtIHRhYltbMl1dICU+JSBodG1sX3RhYmxlDQojdGFiIDwtIHRhYiAlPiUgc2V0TmFtZXMoYygiUmFuayIsICJOYW1lIiwiSW1hZ2UiICwgIkNpdHkiLCJDb3VudHJ5IiwiSGVpZ2h0IChtKSIsICJIZWlnaHQgKGZ0KSIgICwiRmxvb3JzIiwgIlllYXJzIiAsICJOb3RlcyIpKQ0KDQpuYW1lcyh0YWIpIDwtIHRhYlsxLF0NCnRhYiA8LSB0YWJbLTEsXQ0KDQp0YWINCmBgYA0KIA0KDQoNCg0KKg0KMi4gU2NyYXBlIHRoZSB0YWJsZSB0YWxsIGJ1aWxkaW5ncyAoMzAwbSspIGN1cnJlbnRseSB1bmRlciBjb25zdHJ1Y3Rpb24gZnJvbSBodHRwczovL2VuLndpa2lwZWRpYS5vcmcvd2lraS9MaXN0X29mX3RhbGxlc3RfYnVpbGRpbmdzX2luX3RoZV93b3JsZA0KVGFibGU6IERlbm90ZXMgYnVpbGRpbmcgd2l0aCBwaW5uYWNsZSBoZWlnaHQgaGlnaGVyIHRoYW4gYXJjaGl0ZWN0dXJhbC4NCiogDQpgYGB7cn0NCnVybCA8LSAgImh0dHBzOi8vZW4ud2lraXBlZGlhLm9yZy93aWtpL0xpc3Rfb2ZfdGFsbGVzdF9idWlsZGluZ3NfaW5fdGhlX3dvcmxkIg0KIGggPC0gcmVhZF9odG1sKHVybCkNCiB0YWIgPC0gaCAlPiUgaHRtbF9ub2RlcygidGFibGUiKQ0KIHRhYiA8LSB0YWJbWzRdXSAlPiUgaHRtbF90YWJsZQ0KdGFiIDwtIHRhYiAlPiUgc2V0TmFtZXMoYygiUmFuayIsICJCdWlsZGluZyIsICJDaXR5IiAsIkNvdW50cnkiLCAiSGVpZ2h0IChtKSIsICJIZWlnaHQgKGZ0KSIsICJGbG9vcnMiICwiQnVpbHQiKSkNCnRhYg0KYGBgDQogDQogDQoqDQozLiBTY3JhcGUgdGhlIHRhYmxlIHRhbGwgYnVpbGRpbmdzICgzMDBtKykgY3VycmVudGx5IHVuZGVyIGNvbnN0cnVjdGlvbiBmcm9tIA0KaHR0cHM6Ly9lbi53aWtpcGVkaWEub3JnL3dpa2kvTGlzdF9vZl90YWxsZXN0X2J1aWxkaW5nc19pbl90aGVfd29ybGQNClRhYmxlOiBIZWlnaHQgdG8gb2NjdXBpZWQgZmxvb3INCg0KKiANCmBgYHtyfQ0KdXJsIDwtICAiaHR0cHM6Ly9lbi53aWtpcGVkaWEub3JnL3dpa2kvTGlzdF9vZl90YWxsZXN0X2J1aWxkaW5nc19pbl90aGVfd29ybGQiDQogaCA8LSByZWFkX2h0bWwodXJsKQ0KIHRhYiA8LSBoICU+JSBodG1sX25vZGVzKCJ0YWJsZSIpDQogdGFiIDwtIHRhYltbNV1dICU+JSBodG1sX3RhYmxlDQp0YWIgPC0gdGFiICU+JSBzZXROYW1lcyhjKCJSYW5rIiwgIkJ1aWxkaW5nIiwgIkNpdHkiICwiQ291bnRyeSIsICJIZWlnaHQgIiwgIkZsb29ycyIgLCJCdWlsdCIpKQ0KdGFiDQpgYGANCg0KDQoqDQo0LiBTY3JhcGUgdGhlIHRhYmxlIHRhbGwgYnVpbGRpbmdzICgzMDBtKykgY3VycmVudGx5IHVuZGVyIGNvbnN0cnVjdGlvbiANCmZyb20gaHR0cHM6Ly9lbi53aWtpcGVkaWEub3JnL3dpa2kvTGlzdF9vZl90YWxsZXN0X2J1aWxkaW5nc19pbl90aGVfd29ybGQNClRhYmxlOiAgQnVpbGRpbmdzIHVuZGVyIGNvbnN0cnVjdGlvbg0KKiANCmBgYHtyfQ0KdXJsIDwtICAiaHR0cHM6Ly9lbi53aWtpcGVkaWEub3JnL3dpa2kvTGlzdF9vZl90YWxsZXN0X2J1aWxkaW5nc19pbl90aGVfd29ybGQiDQogaCA8LSByZWFkX2h0bWwodXJsKQ0KIHRhYiA8LSBoICU+JSBodG1sX25vZGVzKCJ0YWJsZSIpDQogdGFiIDwtIHRhYltbNl1dICU+JSBodG1sX3RhYmxlDQp0YWIgPC0gdGFiICU+JSBzZXROYW1lcyhjKCJCdWlsZGluZyIsICJQbGFubmVkIGFyY2hpdGVjdHVyYWwgaGVpZ2h0IiwgIkZsb29ycyIsICJQbGFubmVkIGNvbXBsZXRpb24iIA0KICAgICAgICAgICAgICAgICAgICAgICAgICAgLCAgICJDb3VudHJ5IiwgIkNpdHkiICwgIlJlZi4iKSkNCnRhYg0KYGBgDQoNCioNCjUuIFNjcmFwZSB0aGUgdGFibGUgdGFsbCBidWlsZGluZ3MgKDMwMG0rKSBjdXJyZW50bHkgdW5kZXIgY29uc3RydWN0aW9uIA0KZnJvbSBodHRwczovL2VuLndpa2lwZWRpYS5vcmcvd2lraS9MaXN0X29mX3RhbGxlc3RfYnVpbGRpbmdzX2luX3RoZV93b3JsZA0KVGFibGU6IExpc3QgYnkgY29udGluZW50DQoqDQoNCmBgYHtyfQ0KdXJsIDwtICAiaHR0cHM6Ly9lbi53aWtpcGVkaWEub3JnL3dpa2kvTGlzdF9vZl90YWxsZXN0X2J1aWxkaW5nc19pbl90aGVfd29ybGQiDQogaCA8LSByZWFkX2h0bWwodXJsKQ0KIHRhYiA8LSBoICU+JSBodG1sX25vZGVzKCJ0YWJsZSIpDQogdGFiIDwtIHRhYltbN11dICU+JSBodG1sX3RhYmxlDQp0YWIgPC0gdGFiICU+JSBzZXROYW1lcyhjKCJDb3VudGluZW50IiwgIkJ1aWxkaW5nIiwgImhlaWdodCIgLCAiRmxvb3JzIENvdW50IiwgIkNvbXBsZXRlZCIgLCAgICJDb3VudHJ5IiwgIkNpdHkiICkpDQp0YWINCmBgYA0KDQoqDQo2LiBTY3JhcGUgdGhlIHRhYmxlIGZvciBlZGl0b3JpYWwtYm9hcmQtbWVtYmVycyANCmZyb20gaHR0cDovL3d3dy5pamVhaXMub3JnL2lqZWFpcy9pbmRleC5waHAvZWRpdG9yaWFsLWJvYXJkLW1lbWJlcnMvDQoqDQoNCmBgYHtyfQ0KdXJsIDwtICAiaHR0cDovL3d3dy5pamVhaXMub3JnL2lqZWFpcy9pbmRleC5waHAvZWRpdG9yaWFsLWJvYXJkLW1lbWJlcnMvIg0KIGggPC0gcmVhZF9odG1sKHVybCkNCiB0YWIgPC0gaCAlPiUgaHRtbF9ub2RlcygidGFibGUiKQ0KIHRhYiA8LSB0YWJbWzFdXSAlPiUgaHRtbF90YWJsZQ0KdGFiIDwtIHRhYiAlPiUgc2V0TmFtZXMoYygiTmFtZSIsIkJyYW5jaCIsIkluc3RpdHV0aW9uL0FmZmlsaWF0aW9uIiwiQ291bnRyeSIgKSkNCnRhYg0KYGBgDQoNCg0KKg0KNy4gU2NyYXAgdGl0bGVzIGZyb20gdGhpcyB3ZWJwYWdlIA0KaHR0cHM6Ly93d3cuaW1kYi5jb20vc2VhcmNoL3RpdGxlLz90aXRsZV90eXBlPWZlYXR1cmUmbnVtX3ZvdGVzPTI1MDAwLCZnZW5yZXM9YWR2ZW50dXJlIA0KKg0KDQpgYGB7cn0NCiBodG1sX0NvbnRlbnQgPC0gcmVhZF9odG1sKCJodHRwczovL3d3dy5pbWRiLmNvbS9zZWFyY2gvdGl0bGUvP3RpdGxlX3R5cGU9ZmVhdHVyZSZudW1fdm90ZXM9MjUwMDAsJmdlbnJlcz1hZHZlbnR1cmUiKSANCiAgDQp0aXRsZXMgPC0gIGh0bWxfQ29udGVudCAlPiUgaHRtbF9ub2RlcygiLmxpc3Rlci1pdGVtLWhlYWRlciIpICU+JSBodG1sX25vZGUoImEiKSAlPiUNCiAgICBodG1sX3RleHQoKQ0KDQpsaWJyYXJ5KHN0cmluZ3IpDQp0aXRsZXMgPC0gc3RyX3JlcGxhY2VfYWxsKHRpdGxlcywgIltcclxuXSIgLCAiIikNCnRpdGxlcyA8LSBzdHJfcmVwbGFjZV9hbGwodGl0bGVzLCAiICIgLCAiIikNCg0KDQp0aXRsZXNfZGF0YSA8LSBjbGFzcy5kZjwtIGRhdGEuZnJhbWUodGl0bGVzKQ0KdGl0bGVzX2RhdGENCmBgYA0KDQoNCioNCjguIFNjcmFwIFllYXJzIGZyb20gdGhpcyB3ZWJwYWdlIA0KaHR0cHM6Ly93d3cuaW1kYi5jb20vc2VhcmNoL3RpdGxlLz90aXRsZV90eXBlPWZlYXR1cmUmbnVtX3ZvdGVzPTI1MDAwLCZnZW5yZXM9YWR2ZW50dXJlDQoNCiAqDQoNCmBgYHtyfQ0KIA0KeWVhcnMgPC0gIGh0bWxfQ29udGVudCAlPiUgaHRtbF9ub2RlcygiLmxpc3Rlci1pdGVtLXllYXIiKSAlPiUNCiAgICBodG1sX3RleHQoKQ0KDQoNCiAgeWVhcnNfZGF0YSA8LSBjbGFzcy5kZjwtIGRhdGEuZnJhbWUoeWVhcnMpDQp5ZWFyc19kYXRhDQpgYGANCg0KDQoqDQo5LiBTY3JhcCBSYXRpbmdzIGZyb20gdGhpcyB3ZWJwYWdlIA0KaHR0cHM6Ly93d3cuaW1kYi5jb20vc2VhcmNoL3RpdGxlLz90aXRsZV90eXBlPWZlYXR1cmUmbnVtX3ZvdGVzPTI1MDAwLCZnZW5yZXM9YWR2ZW50dXJlDQoNCg0KICoNCg0KYGBge3J9DQogDQogDQpyYXRpbmdzIDwtICBodG1sX0NvbnRlbnQgJT4lIGh0bWxfbm9kZXMoIi5yYXRpbmdzLWltZGItcmF0aW5nIikgJT4lDQogICAgaHRtbF90ZXh0KCkNCg0KcmF0aW5ncyA8LSBzdHJfcmVwbGFjZV9hbGwocmF0aW5ncywgIltcclxuXSIgLCAiIikNCnJhdGluZ3MgPC0gc3RyX3JlcGxhY2VfYWxsKHJhdGluZ3MsICIgIiAsICIiKQ0KDQogIHJhdGluZ3NfZGF0YSA8LSBjbGFzcy5kZjwtIGRhdGEuZnJhbWUocmF0aW5ncykNCnJhdGluZ3NfZGF0YQ0KYGBgDQoNCg0KKg0KMTAuICBTY3JhcCB0aGUgc3lub3BzaXMgb2YgdGhlIG1vdmllcyBmcm9tIHRoaXMgd2VicGFnZQ0KaHR0cHM6Ly93d3cuaW1kYi5jb20vc2VhcmNoL3RpdGxlLz90aXRsZV90eXBlPWZlYXR1cmUmbnVtX3ZvdGVzPTI1MDAwLCZnZW5yZXM9YWR2ZW50dXJlDQpVc2U6IC5yYXRpbmdzLWJhcisgLnRleHQtbXV0ZWQNCg0KKg0KDQoNCmBgYHtyfQ0Kc3lub3BzaXMgPC0gIGh0bWxfQ29udGVudCAlPiUgaHRtbF9ub2RlcygiLnJhdGluZ3MtYmFyKyAudGV4dC1tdXRlZCIpICU+JQ0KICAgIGh0bWxfdGV4dCgpDQoNCnN5bm9wc2lzIDwtIHN0cl9yZXBsYWNlX2FsbChzeW5vcHNpcywgIltcclxuXSIgLCAiIikNCnN5bm9wc2lzIDwtIHN0cl9yZXBsYWNlX2FsbChzeW5vcHNpcywgIiAiICwgIiIpDQoNCnN5bm9wc2lzX2RhdGEgPC0gY2xhc3MuZGY8LSBkYXRhLmZyYW1lKHN5bm9wc2lzKQ0Kc3lub3BzaXNfZGF0YQ0KICANCmBgYA0KDQoNCioNCjExLiBDcmVhdGUgYSBkYXRhIGZyYW1lIHVzaW5nIG91ciB2YXJpYWJsZXMgYXMgYSBjb2x1bW4gZnJvbSAjN+KApi4uIzEwDQoqDQoNCg0KYGBge3J9DQpjb21wbGV0ZV9kYXRhIDwtIGNsYXNzLmRmPC0gZGF0YS5mcmFtZSh0aXRsZXMgLCB5ZWFycyAscmF0aW5ncyAsICBzeW5vcHNpcyApDQpjb21wbGV0ZV9kYXRhDQoNCmBgYA0KDQoNCg==