In this research we’re analyzing 227,496 (`nrow(hflights)`) data entries from the hflights data package, which contains commercial domestic flights that departed Houston (IAH and HOU) in 2011. The data comes from the Research and Innovative Technology Administration at the Bureau of Transportation Statistics.
## libraries
library(dplyr)
library(hflights)
library(scales)

## Cleaning data
# Snake-case replacement names for the hflights columns (21 entries).
# They are applied positionally below, so the order here must match the
# column order of the data frame.
column <- c(
  "year", "month", "day_of_month", "day_of_week",
  "dep_time", "arr_time",
  "unique_carrier", "flight_num", "tail_num",
  "actual_elapsed_time", "air_time",
  "arr_delay", "dep_delay",
  "origin", "destination", "distance",
  "taxi_in", "taxi_out",
  "cancelled", "cancellation_code", "diverted"
)

# Rename every column of hflights in one assignment.
names(hflights) <- column
Display a summary with the variables min_distance and max_distance:
# Smallest and largest value of the distance column.
hflights %>%
  summarise(
    min_distance = min(distance),
    max_distance = max(distance)
  )
##   min_distance max_distance
## 1           79         3904
# Mean and standard deviation of the distance column.
hflights %>%
  summarise(
    avg_distance = mean(distance),
    standard_dev = sd(distance)
  )
##   avg_distance standard_dev
## 1     787.7832     453.6806