Import data

## [1] "/Users/taylornelson/Desktop/PSU_DAT3000_IntroToDA/03_module6"
## function (..., list = character(), package = NULL, lib.loc = NULL, 
##     verbose = getOption("verbose"), envir = .GlobalEnv, overwrite = TRUE) 
## {
##     fileExt <- function(x) {
##         db <- grepl("\\.[^.]+\\.(gz|bz2|xz)$", x)
##         ans <- sub(".*\\.", "", x)
##         ans[db] <- sub(".*\\.([^.]+\\.)(gz|bz2|xz)$", "\\1\\2", 
##             x[db])
##         ans
##     }
##     my_read_table <- function(...) {
##         lcc <- Sys.getlocale("LC_COLLATE")
##         on.exit(Sys.setlocale("LC_COLLATE", lcc))
##         Sys.setlocale("LC_COLLATE", "C")
##         read.table(...)
##     }
##     stopifnot(is.character(list))
##     names <- c(as.character(substitute(list(...))[-1L]), list)
##     if (!is.null(package)) {
##         if (!is.character(package)) 
##             stop("'package' must be a character vector or NULL")
##     }
##     paths <- find.package(package, lib.loc, verbose = verbose)
##     if (is.null(lib.loc)) 
##         paths <- c(path.package(package, TRUE), if (!length(package)) getwd(), 
##             paths)
##     paths <- unique(normalizePath(paths[file.exists(paths)]))
##     paths <- paths[dir.exists(file.path(paths, "data"))]
##     dataExts <- tools:::.make_file_exts("data")
##     if (length(names) == 0L) {
##         db <- matrix(character(), nrow = 0L, ncol = 4L)
##         for (path in paths) {
##             entries <- NULL
##             packageName <- if (file_test("-f", file.path(path, 
##                 "DESCRIPTION"))) 
##                 basename(path)
##             else "."
##             if (file_test("-f", INDEX <- file.path(path, "Meta", 
##                 "data.rds"))) {
##                 entries <- readRDS(INDEX)
##             }
##             else {
##                 dataDir <- file.path(path, "data")
##                 entries <- tools::list_files_with_type(dataDir, 
##                   "data")
##                 if (length(entries)) {
##                   entries <- unique(tools::file_path_sans_ext(basename(entries)))
##                   entries <- cbind(entries, "")
##                 }
##             }
##             if (NROW(entries)) {
##                 if (is.matrix(entries) && ncol(entries) == 2L) 
##                   db <- rbind(db, cbind(packageName, dirname(path), 
##                     entries))
##                 else warning(gettextf("data index for package %s is invalid and will be ignored", 
##                   sQuote(packageName)), domain = NA, call. = FALSE)
##             }
##         }
##         colnames(db) <- c("Package", "LibPath", "Item", "Title")
##         footer <- if (missing(package)) 
##             paste0("Use ", sQuote(paste("data(package =", ".packages(all.available = TRUE))")), 
##                 "\n", "to list the data sets in all *available* packages.")
##         else NULL
##         y <- list(title = "Data sets", header = NULL, results = db, 
##             footer = footer)
##         class(y) <- "packageIQR"
##         return(y)
##     }
##     paths <- file.path(paths, "data")
##     for (name in names) {
##         found <- FALSE
##         for (p in paths) {
##             tmp_env <- if (overwrite) 
##                 envir
##             else new.env()
##             if (file_test("-f", file.path(p, "Rdata.rds"))) {
##                 rds <- readRDS(file.path(p, "Rdata.rds"))
##                 if (name %in% names(rds)) {
##                   found <- TRUE
##                   if (verbose) 
##                     message(sprintf("name=%s:\t found in Rdata.rds", 
##                       name), domain = NA)
##                   objs <- rds[[name]]
##                   lazyLoad(file.path(p, "Rdata"), envir = tmp_env, 
##                     filter = function(x) x %in% objs)
##                   break
##                 }
##                 else if (verbose) 
##                   message(sprintf("name=%s:\t NOT found in names() of Rdata.rds, i.e.,\n\t%s\n", 
##                     name, paste(names(rds), collapse = ",")), 
##                     domain = NA)
##             }
##             files <- list.files(p, full.names = TRUE)
##             files <- files[grep(name, files, fixed = TRUE)]
##             if (length(files) > 1L) {
##                 o <- match(fileExt(files), dataExts, nomatch = 100L)
##                 paths0 <- dirname(files)
##                 paths0 <- factor(paths0, levels = unique(paths0))
##                 files <- files[order(paths0, o)]
##             }
##             if (length(files)) {
##                 for (file in files) {
##                   if (verbose) 
##                     message("name=", name, ":\t file= ...", .Platform$file.sep, 
##                       basename(file), "::\t", appendLF = FALSE, 
##                       domain = NA)
##                   ext <- fileExt(file)
##                   if (basename(file) != paste0(name, ".", ext)) 
##                     found <- FALSE
##                   else {
##                     found <- TRUE
##                     switch(ext, R = , r = {
##                       library("utils")
##                       sys.source(file, chdir = TRUE, envir = tmp_env)
##                     }, RData = , rdata = , rda = load(file, envir = tmp_env), 
##                       TXT = , txt = , tab = , tab.gz = , tab.bz2 = , 
##                       tab.xz = , txt.gz = , txt.bz2 = , txt.xz = assign(name, 
##                         my_read_table(file, header = TRUE, as.is = FALSE), 
##                         envir = tmp_env), CSV = , csv = , csv.gz = , 
##                       csv.bz2 = , csv.xz = assign(name, my_read_table(file, 
##                         header = TRUE, sep = ";", as.is = FALSE), 
##                         envir = tmp_env), found <- FALSE)
##                   }
##                   if (found) 
##                     break
##                 }
##                 if (verbose) 
##                   message(if (!found) 
##                     "*NOT* ", "found", domain = NA)
##             }
##             if (found) 
##                 break
##         }
##         if (!found) {
##             warning(gettextf("data set %s not found", sQuote(name)), 
##                 domain = NA)
##         }
##         else if (!overwrite) {
##             for (o in ls(envir = tmp_env, all.names = TRUE)) {
##                 if (exists(o, envir = envir, inherits = FALSE)) 
##                   warning(gettextf("an object named %s already exists and will not be overwritten", 
##                     sQuote(o)))
##                 else assign(o, get(o, envir = tmp_env, inherits = FALSE), 
##                   envir = envir)
##             }
##             rm(tmp_env)
##         }
##     }
##     invisible(names)
## }
## <bytecode: 0x10f5a2e30>
## <environment: namespace:utils>

Apply the following dplyr verbs to your data

Filter rows

## # A tibble: 662 × 31
##    town11cd  town11nm population_2011 size_flag rgn11nm coastal coastal_detailed
##    <chr>     <chr>              <dbl> <chr>     <chr>   <chr>   <chr>           
##  1 E34000007 Carlton…            5456 Small To… East M… Non-co… Smaller non-coa…
##  2 E34000016 Dorches…           19060 Small To… South … Non-co… Smaller non-coa…
##  3 E34000020 Ely BUA            19090 Small To… East o… Non-co… Smaller non-coa…
##  4 E34000026 Market …            6429 Small To… Yorksh… Non-co… Smaller non-coa…
##  5 E34000027 Downham…           10884 Small To… East o… Non-co… Smaller non-coa…
##  6 E34000039 Penrith…           15181 Small To… North … Non-co… Smaller non-coa…
##  7 E34000048 Bolsove…           11754 Small To… East M… Non-co… Smaller non-coa…
##  8 E34000056 Southam…            6567 Small To… West M… Non-co… Smaller non-coa…
##  9 E34000067 Royston…           15781 Small To… East o… Non-co… Smaller non-coa…
## 10 E34000068 Studley…            6203 Small To… West M… Non-co… Smaller non-coa…
## # ℹ 652 more rows
## # ℹ 24 more variables: ttwa11cd <chr>, ttwa11nm <chr>,
## #   ttwa_classification <chr>, job_density_flag <chr>, income_flag <chr>,
## #   university_flag <chr>, level4qual_residents35_64_2011 <chr>,
## #   ks4_2012_2013_counts <dbl>,
## #   key_stage_2_attainment_school_year_2007_to_2008 <dbl>,
## #   key_stage_4_attainment_school_year_2012_to_2013 <dbl>, …

Arrange rows

## # A tibble: 1,104 × 31
##    town11cd  town11nm population_2011 size_flag rgn11nm coastal coastal_detailed
##    <chr>     <chr>              <dbl> <chr>     <chr>   <chr>   <chr>           
##  1 E34000007 Carlton…            5456 Small To… East M… Non-co… Smaller non-coa…
##  2 E34000016 Dorches…           19060 Small To… South … Non-co… Smaller non-coa…
##  3 E34000020 Ely BUA            19090 Small To… East o… Non-co… Smaller non-coa…
##  4 E34000026 Market …            6429 Small To… Yorksh… Non-co… Smaller non-coa…
##  5 E34000027 Downham…           10884 Small To… East o… Non-co… Smaller non-coa…
##  6 E34000039 Penrith…           15181 Small To… North … Non-co… Smaller non-coa…
##  7 E34000048 Bolsove…           11754 Small To… East M… Non-co… Smaller non-coa…
##  8 E34000056 Southam…            6567 Small To… West M… Non-co… Smaller non-coa…
##  9 E34000067 Royston…           15781 Small To… East o… Non-co… Smaller non-coa…
## 10 E34000068 Studley…            6203 Small To… West M… Non-co… Smaller non-coa…
## # ℹ 1,094 more rows
## # ℹ 24 more variables: ttwa11cd <chr>, ttwa11nm <chr>,
## #   ttwa_classification <chr>, job_density_flag <chr>, income_flag <chr>,
## #   university_flag <chr>, level4qual_residents35_64_2011 <chr>,
## #   ks4_2012_2013_counts <dbl>,
## #   key_stage_2_attainment_school_year_2007_to_2008 <dbl>,
## #   key_stage_4_attainment_school_year_2012_to_2013 <dbl>, …

Select columns

## # A tibble: 1,104 × 1
##    size_flag   
##    <chr>       
##  1 Small Towns 
##  2 Small Towns 
##  3 Small Towns 
##  4 Small Towns 
##  5 Small Towns 
##  6 Small Towns 
##  7 Small Towns 
##  8 Medium Towns
##  9 Small Towns 
## 10 Small Towns 
## # ℹ 1,094 more rows

Summarize by groups

## # A tibble: 8 × 2
##   size_flag        avg_population
##   <chr>                     <dbl>
## 1 City                    395611 
## 2 Inner London BUA            NA 
## 3 Large Towns             117599.
## 4 Medium Towns             36899.
## 5 Not BUA                     NA 
## 6 Other Small BUAs            NA 
## 7 Outer london BUA            NA 
## 8 Small Towns              10393.