library(tidyverse)

## ── Attaching core tidyverse packages ──────────────────────── tidyverse 2.0.0 ──
## ✔ dplyr     1.1.4     ✔ readr     2.1.5
## ✔ forcats   1.0.0     ✔ stringr   1.5.1
## ✔ ggplot2   3.5.1     ✔ tibble    3.2.1
## ✔ lubridate 1.9.3     ✔ tidyr     1.3.1
## ✔ purrr     1.0.2     
## ── Conflicts ────────────────────────────────────────── tidyverse_conflicts() ──
## ✖ dplyr::filter() masks stats::filter()
## ✖ dplyr::lag()    masks stats::lag()
## ℹ Use the conflicted package (<http://conflicted.r-lib.org/>) to force all conflicts to become errors

library(tmap)

## Breaking News: tmap 3.x is retiring. Please test v4, e.g. with
## remotes::install_github('r-tmap/tmap')

library(units)

## udunits database from /Library/Frameworks/R.framework/Versions/4.3-arm64/Resources/library/units/share/udunits/udunits2.xml

library(sf)

## Linking to GEOS 3.11.0, GDAL 3.5.3, PROJ 9.1.0; sf_use_s2() is TRUE

library(leaflet)
library(dbscan)

## 
## Attaching package: 'dbscan'
## 
## The following object is masked from 'package:stats':
## 
##     as.dendrogram

library(sfnetworks)
library(tigris)

## To enable caching of data, set `options(tigris_use_cache = TRUE)`
## in your R script or .Rprofile.

library(tidygraph)

## 
## Attaching package: 'tidygraph'
## 
## The following object is masked from 'package:stats':
## 
##     filter

library(plotly)

## 
## Attaching package: 'plotly'
## 
## The following object is masked from 'package:ggplot2':
## 
##     last_plot
## 
## The following object is masked from 'package:stats':
## 
##     filter
## 
## The following object is masked from 'package:graphics':
## 
##     layout

library(osmdata)

## Data (c) OpenStreetMap contributors, ODbL 1.0. https://www.openstreetmap.org/copyright

library(here)

## here() starts at /Users/jaeglee/Library/CloudStorage/OneDrive-GeorgiaInstituteofTechnology/2024 Fall/UA/UA_R

library(tidytransit)
library(tidycensus)
library(leafsync)

epsg <- 4326

Step 1. Download Required data from GTFS.

# TASK ////////////////////////////////////////////////////////////////////////
# Download MARTA (Metropolitan Atlanta Rapid Transit Authority) GTFS data using `read_gtfs()` function and assign it to `gtfs` object
gtfs <- read_gtfs("https://www.itsmarta.com/google_transit_feed/google_transit.zip")
# //TASK //////////////////////////////////////////////////////////////////////



# =========== NO MODIFICATION ZONE STARTS HERE ===============================
# Edit stop_name to append serial numbers (1, 2, etc.) to remove duplicate names
stop_dist <- stop_group_distances(gtfs$stops, by='stop_name') %>%
  filter(dist_max > 200)

gtfs$stops <- gtfs$stops %>% 
  group_by(stop_name) %>% 
  mutate(stop_name = case_when(stop_name %in% stop_dist$stop_name ~ paste0(stop_name, " (", seq(1,n()), ")"),
                               TRUE ~ stop_name))

# Create a transfer table
gtfs <- gtfsrouter::gtfs_transfer_table(gtfs, 
                                        d_limit = 200, 
                                        min_transfer_time = 120)

## Registered S3 method overwritten by 'gtfsrouter':
##   method       from  
##   summary.gtfs gtfsio

# NOTE: Converting to sf format uses stop_lat and stop_lon columns contained in gtfs$stops.
#       In the conversion process, stop_lat and stop_lon are converted into a geometry column, and
#       the output sf object do not have the lat lon column anymore.
#       But many other functions in tidytransit look for stop_lat and stop_lon.
#       So I re-create them using mutate().
gtfs <- gtfs %>% gtfs_as_sf(crs = epsg)

gtfs$stops <- gtfs$stops %>% 
  ungroup() %>% 
  mutate(stop_lat = st_coordinates(.)[,2],
         stop_lon = st_coordinates(.)[,1]) 

# Get stop_id for Subway or Metro
rail_stops <- gtfs$routes %>% 
  filter(route_type %in% c(1)) %>% 
  inner_join(gtfs$trips, by = "route_id") %>% 
  inner_join(gtfs$stop_times, by = "trip_id") %>% 
  inner_join(gtfs$stops, by = "stop_id") %>% 
  group_by(stop_id) %>% 
  slice(1) %>% 
  pull(stop_id)

# Extract MARTA rail stations
station <- gtfs$stops %>% filter(stop_id %in% rail_stops)

# Extract Midtown Station
midtown <- gtfs$stops %>% filter(stop_id == "134")

# Create a bounding box to which we limit our analysis
bbox <- st_bbox(c(xmin = -84.45241, ymin = 33.72109, xmax = -84.35009, ymax = 33.80101), 
                 crs = st_crs(4326)) %>% 
  st_as_sfc()

# =========== NO MODIFY ZONE ENDS HERE ========================================

Step 2. Download Required data from Census

# TASK ////////////////////////////////////////////////////////////////////////
# Specify Census API key whichever you prefer using census_api_key() function
census_api_key(Sys.getenv("census_api"))

## To install your API key for use in future sessions, run this function with `install = TRUE`.

# //TASK //////////////////////////////////////////////////////////////////////

# TASK ////////////////////////////////////////////////////////////////////////
# Using get_acs() function, download Census Tract level data for 2022 for Fulton, DeKalb, and Clayton in GA.
# and assign it to `census` object.
# Make sure you set geometry = TRUE.

# Required data from the Census ACS:
#  1) Median Household Income (name the column `hhinc`)
#  2) Minority Population (%) (name the column `pct_minority`)
# Note: You may need to download two or more Census ACS variables to calculate minority population (%). "Minority" here can refer to either racial minorities or racial+ethnic minorities -- it's your choice.
census_var <- c(
  hhincome = 'B19019_001',
  pop = "B02001_001",
  race.white = "B02001_002",
  race.black = 'B02001_003',
  race.american_indian = 'B02001_004',
  race.asian = 'B02001_005',
  race.pacific_islander = 'B02001_006',
  hispanic_or_latino = 'B03003_003') # hispanic or latino is more of ethnicity rather than race, but I included them to calculate the proportion of minority populations

census <- get_acs(geography = "tract", state = "GA", county = c("Fulton", "DeKalb", "Clayton"),
                 output = "wide", geometry = TRUE, year = 2022,
                 variables = census_var)

## Getting data from the 2018-2022 5-year ACS

## Downloading feature geometry from the Census website.  To cache shapefiles for use in future sessions, set `options(tigris_use_cache = TRUE)`.

##   |                                                                              |                                                                      |   0%  |                                                                              |=                                                                     |   1%  |                                                                              |==                                                                    |   2%  |                                                                              |==                                                                    |   3%  |                                                                              |===                                                                   |   4%  |                                                                              |====                                                                  |   5%  |                                                                              |====                                                                  |   6%  |                                                                              |=====                                                                 |   7%  |                                                                              |======                                                                |   8%  |                                                                              |======                                                                |   9%  |                                                                              |=======                                                               |  10%  |                                                                              |========                                                              |  11%  |                                                                              |========                                                              |  12%  |                                                                              |=========                                                             |  12%  |                                                                              |=========                                                             |  13%  |                                                                              |==========                                                            |  14%  |                                                                              |==========                                                            |  15%  |                                                                              |===========                                                           |  15%  |                                                                              |===========                                                           |  16%  |                                                                              |============                                                          |  17%  |                                                                              |============                                                          |  18%  |                                                                              |=============                                                         |  18%  |                                                                              |=============                                                         |  19%  |                                                                              |==============                                                        |  20%  |                                                                              |==============                                                        |  21%  |                                                                              |===============                                                       |  21%  |                                                                              |===============                                                       |  22%  |                                                                              |================                                                      |  23%  |                                                                              |=================                                                     |  24%  |                                                                              |=================                                                     |  25%  |                                                                              |==================                                                    |  26%  |                                                                              |===================                                                   |  26%  |                                                                              |===================                                                   |  27%  |                                                                              |====================                                                  |  28%  |                                                                              |====================                                                  |  29%  |                                                                              |=====================                                                 |  29%  |                                                                              |=====================                                                 |  30%  |                                                                              |======================                                                |  31%  |                                                                              |======================                                                |  32%  |                                                                              |=======================                                               |  32%  |                                                                              |=======================                                               |  33%  |                                                                              |========================                                              |  34%  |                                                                              |========================                                              |  35%  |                                                                              |=========================                                             |  35%  |                                                                              |=========================                                             |  36%  |                                                                              |==========================                                            |  37%  |                                                                              |==========================                                            |  38%  |                                                                              |===========================                                           |  38%  |                                                                              |===========================                                           |  39%  |                                                                              |============================                                          |  40%  |                                                                              |=============================                                         |  41%  |                                                                              |=============================                                         |  42%  |                                                                              |==============================                                        |  43%  |                                                                              |===============================                                       |  44%  |                                                                              |===============================                                       |  45%  |                                                                              |================================                                      |  46%  |                                                                              |=================================                                     |  48%  |                                                                              |==================================                                    |  49%  |                                                                              |===================================                                   |  49%  |                                                                              |===================================                                   |  50%  |                                                                              |====================================                                  |  51%  |                                                                              |====================================                                  |  52%  |                                                                              |=====================================                                 |  52%  |                                                                              |=====================================                                 |  53%  |                                                                              |======================================                                |  54%  |                                                                              |=======================================                               |  55%  |                                                                              |=======================================                               |  56%  |                                                                              |========================================                              |  57%  |                                                                              |=========================================                             |  58%  |                                                                              |=========================================                             |  59%  |                                                                              |==========================================                            |  60%  |                                                                              |===========================================                           |  61%  |                                                                              |===========================================                           |  62%  |                                                                              |============================================                          |  63%  |                                                                              |=============================================                         |  64%  |                                                                              |=============================================                         |  65%  |                                                                              |==============================================                        |  66%  |                                                                              |===============================================                       |  67%  |                                                                              |===============================================                       |  68%  |                                                                              |================================================                      |  69%  |                                                                              |=================================================                     |  70%  |                                                                              |==================================================                    |  71%  |                                                                              |===================================================                   |  72%  |                                                                              |===================================================                   |  73%  |                                                                              |====================================================                  |  74%  |                                                                              |=====================================================                 |  75%  |                                                                              |=====================================================                 |  76%  |                                                                              |======================================================                |  77%  |                                                                              |=======================================================               |  78%  |                                                                              |=======================================================               |  79%  |                                                                              |========================================================              |  80%  |                                                                              |=========================================================             |  81%  |                                                                              |=========================================================             |  82%  |                                                                              |==========================================================            |  83%  |                                                                              |===========================================================           |  84%  |                                                                              |===========================================================           |  85%  |                                                                              |============================================================          |  85%  |                                                                              |============================================================          |  86%  |                                                                              |=============================================================         |  87%  |                                                                              |=============================================================         |  88%  |                                                                              |==============================================================        |  88%  |                                                                              |==============================================================        |  89%  |                                                                              |===============================================================       |  90%  |                                                                              |===============================================================       |  91%  |                                                                              |================================================================      |  91%  |                                                                              |================================================================      |  92%  |                                                                              |=================================================================     |  93%  |                                                                              |==================================================================    |  94%  |                                                                              |===================================================================   |  95%  |                                                                              |===================================================================   |  96%  |                                                                              |====================================================================  |  97%  |                                                                              |===================================================================== |  98%  |                                                                              |===================================================================== |  99%  |                                                                              |======================================================================|  99%  |                                                                              |======================================================================| 100%

census <- census %>%
  dplyr::select(!dplyr::ends_with("M")) %>%
  rename(hhinc = hhincomeE) %>%
  mutate(pct_minority = (race.blackE + race.american_indianE + race.asianE + race.pacific_islanderE + hispanic_or_latinoE) / popE * 100) %>%
  select(GEOID, NAME, hhinc, pct_minority)

# //TASK //////////////////////////////////////////////////////////////////////

# =========== NO MODIFICATION ZONE STARTS HERE ===============================
census <- census %>% 
  st_transform(crs = 4326) %>% 
  separate(col = NAME, into = c("tract", "county", "state"), sep = "; ")

# Convert it to POINT at polygon centroids and extract those that fall into bbox
# and assign it into `home` object
home <- census %>% st_centroid() %>% .[bbox,]

## Warning: st_centroid assumes attributes are constant over geometries

# =========== NO MODIFY ZONE ENDS HERE ========================================

Step 3. Download Required data from OSM.

# TASK ////////////////////////////////////////////////////////////////////////
# 1. Get OSM data using opq() function and bbox object defined in the previous code chunk.
# 2. Specify arguments for add_osm_feature() function using 
#    key = 'highway' and 
#    value = c("motorway", "trunk", "primary", "secondary", "tertiary", "residential", 
#              "motorway_link", "trunk_link", "primary_link", "secondary_link", 
#              "tertiary_link", "residential_link", "unclassified")
# 3. Convert the OSM data into an sf object using osmdata_sf() function
# 4. Convert osmdata polygons into lines using osm_poly2line() function

osm_road <- opq(bbox = bbox) %>%
  add_osm_feature(key = 'highway', 
                  value = c("motorway", "trunk", "primary", "secondary", "tertiary", "residential", 
                            "motorway_link", "trunk_link", "primary_link", "secondary_link", 
                            "tertiary_link", "residential_link", "unclassified")) %>%
  osmdata_sf() %>% 
  osm_poly2line()

tm_shape(osm_road$osm_lines) + tm_lines(col = "highway")

# //TASK //////////////////////////////////////////////////////////////////////


# TASK ////////////////////////////////////////////////////////////////////////
# 1. Convert osm_road$osm_lines into sfnetwork using as_sfnetwork() function
# 2. Activate edges
# 3. Clean the network using edge_is_multiple(), edge_is_loop(), to_spatial_subdivision(), to_spatial_smooth()
# 4. Assign the cleaned network to an object named 'osm'

osm <- osm_road$osm_line %>% 
  select(osm_id, highway) %>%
  sfnetworks::as_sfnetwork(directed = F) %>%
  activate("edges") %>%
  filter(!edge_is_multiple()) %>%
  filter(!edge_is_loop()) %>% 
  convert(., sfnetworks::to_spatial_subdivision) %>% 
  convert(., sfnetworks::to_spatial_smooth)

## Warning: to_spatial_subdivision assumes attributes are constant over geometries

# //TASK //////////////////////////////////////////////////////////////////////



# TASK ////////////////////////////////////////////////////////////////////////
# Add a new column named 'length' to the edges part of the object `osm`.
osm <- osm %>% 
  st_transform(4326) %>% activate("edges") %>% 
  mutate(length = edge_length())
# //TASK //////////////////////////////////////////////////////////////////////

Step 4. Simulate a park-and-ride trip (home -> closest station -> Midtown station).

# =========== NO MODIFICATION ZONE STARTS HERE ===============================
# Extract the first row from `home` object and store it `home_1`
home_1 <- home[1,]
# =========== NO MODIFY ZONE ENDS HERE ========================================


# TASK ////////////////////////////////////////////////////////////////////////
# Find the shortest path from `home_1` to all other stations
# using st_network_paths() function.
rail_stops_point <- gtfs$stops %>% filter(stop_id %in% rail_stops) %>% st_geometry()
paths <- st_network_paths(osm, from = home_1, to = rail_stops_point, type = "shortest")
# //TASK //////////////////////////////////////////////////////////////////////

  
# =========== NO MODIFICATION ZONE STARTS HERE ===============================
# Using the `paths` object, get network distances from `home_1` to all other stations.
dist_all <- map_dbl(1:nrow(paths), function(x){
  osm %>%
    activate("nodes") %>% 
    slice(paths$node_paths[[x]]) %>% 
    st_as_sf("edges") %>% 
    pull(length) %>% 
    sum()   # osm has a list structure
}) %>% unlist() 

# Replace zeros with a large value.
if (any(dist_all == 0)){
  dist_all[dist_all == 0] <- max(dist_all)
}

# Find the closest station.
closest_index <- which.min(dist_all)
closest_station <- station[closest_index,]

# Find the distance to the closest station.
closest_dist <- min(dist_all)

# Calculate how long it takes to traverse `closest_dist` 
# assuming we drive at 30 miles/hour speed.
# Store the output in trvt_osm_m.
car_speed <- set_units(30, mile/h)
trvt_osm_m <- closest_dist/set_units(car_speed, m/min) %>%  # Distance divided by 30 mile/h
  as.vector(.)
# =========== NO MODIFY ZONE ENDS HERE ========================================


# TASK ////////////////////////////////////////////////////////////////////////
# 1. From `osm` object, activate nodes part and
# 2. use `closest_index` to extract the selected path
paths_closest <- osm %>%
  activate("nodes") %>%
  slice(paths$node_paths[[closest_index]])
# //TASK //////////////////////////////////////////////////////////////////////


# TASK ////////////////////////////////////////////////////////////////////////
# Use filter_stop_times() function to create a subset of stop_times data table
# for date = 2024-11-14, minimum departure time of 7AM, maximum departure time of 10AM.
# Assign the output to `am_stop_time` object
am_stop_time <- filter_stop_times(gtfs_obj = gtfs, 
                                  extract_date = "2024-11-14",
                                  min_departure_time = 3600*7, 
                                  max_arrival_time = 3600*10) 
# //TASK //////////////////////////////////////////////////////////////////////



# TASK ////////////////////////////////////////////////////////////////////////
# 1. Use travel_times() function to calculate travel times from the `closest_station` 
#    to all other stations during time specified in am_stop_time. Allow ONE transfer.
# 2. Filter the row for which the value of 'to_stop_name' column 
#    equals midtown$stop_name. Assign it into `trvt` object.
trvt <- travel_times(filtered_stop_times = am_stop_time,
                     stop_name = closest_station$stop_name, # ASHBY STATION
                     time_range = 3600,
                     arrival = FALSE, # if TRUE, all journeys end at Midtown station.
                     max_transfers = 1,
                     return_coords = TRUE) %>%
  filter(to_stop_name == midtown$stop_name)
trvt

## # A tibble: 1 × 12
##   from_stop_name to_stop_name    travel_time journey_departure_time
##   <chr>          <chr>                 <dbl> <time>                
## 1 ASHBY STATION  MIDTOWN STATION         840 07:02                 
## # ℹ 8 more variables: journey_arrival_time <time>, transfers <int>,
## #   from_stop_id <chr>, to_stop_id <chr>, from_stop_lon <dbl>,
## #   from_stop_lat <dbl>, to_stop_lon <dbl>, to_stop_lat <dbl>

# //TASK //////////////////////////////////////////////////////////////////////



# =========== NO MODIFICATION ZONE STARTS HERE ===============================
# Divide the calculated travel time by 60 to convert the unit from seconds to minutes.
trvt_gtfs_m <- trvt$travel_time/60

# Add the travel time from home to the nearest station and
# the travel time from the nearest station to Midtown station
total_trvt <- trvt_osm_m + trvt_gtfs_m
# =========== NO MODIFY ZONE ENDS HERE ========================================

Step 5. Convert Step 4 into a function

# Function definition (do not modify other parts of the code in this code chunk except for those inside the TASK section)

get_trvt <- function(home, osm, station, midtown){
  
  rail_stops_point <- gtfs$stops %>% filter(stop_id %in% rail_stops) %>% st_geometry()
  paths <- st_network_paths(osm, from = home, to = rail_stops_point, type = "shortest")

  # Using the `paths` object, get network distances from `home` to all other stations.
  dist_all <- map_dbl(1:nrow(paths), function(x){
    osm %>%
      activate("nodes") %>% 
      slice(paths$node_paths[[x]]) %>% 
      st_as_sf("edges") %>% 
      pull(length) %>% 
      sum()   # osm has a list structure
  }) %>% unlist() 
  
  # Replace zeros with a large value.
  if (any(dist_all == 0)){
    dist_all[dist_all == 0] <- max(dist_all)
  }
  
  # Find the closest station.
  closest_index <- which.min(dist_all)
  closest_station <- station[closest_index,]
  
  # Find the distance to the closest station.
  closest_dist <- min(dist_all)
  
  # Calculate how long it takes to traverse `closest_dist` 
  # assuming we drive at 30 miles/hour speed.
  # Store the output in trvt_osm_m.
  car_speed <- set_units(30, mile/h)
  trvt_osm_m <- closest_dist/set_units(car_speed, m/min) %>%  # Distance divided by 30 mile/h
    as.vector(.)

  # 1. From `osm` object, activate nodes part and
  # 2. use `closest_index` to extract the selected path
  paths_closest <- osm %>%
    activate("nodes") %>%
    slice(paths$node_paths[[closest_index]])

  # Use filter_stop_times() function to create a subset of stop_times data table
  # for date = 2024-11-14, minimum departure time of 7AM, maximum departure time of 10AM.
  # Assign the output to `am_stop_time` object
  am_stop_time <- filter_stop_times(gtfs_obj = gtfs, 
                                    extract_date = "2024-11-14",
                                    min_departure_time = 3600*7, 
                                    max_arrival_time = 3600*10) 

  # 1. Use travel_times() function to calculate travel times from the `closest_station` 
  #    to all other stations during time specified in am_stop_time. Allow ONE transfer.
  # 2. Filter the row for which the value of 'to_stop_name' column 
  #    equals midtown$stop_name. Assign it into `trvt` object.
  trvt <- travel_times(filtered_stop_times = am_stop_time,
                       stop_name = closest_station$stop_name, # ASHBY STATION
                       time_range = 3600,
                       arrival = FALSE, # if TRUE, all journeys end at Midtown station.
                       max_transfers = 1,
                       return_coords = TRUE) %>%
    filter(to_stop_name == midtown$stop_name)
  trvt

  # Divide the calculated travel time by 60 to convert the unit from seconds to minutes.
  trvt_gtfs_m <- trvt$travel_time/60
  
  # Add the travel time from home to the nearest station and
  # the travel time from the nearest station to Midtown station
  total_trvt <- trvt_osm_m + trvt_gtfs_m

  if (length(total_trvt) == 0) {total_trvt = 0}

  return(total_trvt)
}

Step 6. Apply the function for the whole study area

# Prepare an empty vector
total_trvt <- vector("numeric", nrow(home))

# Apply the function for all Census Tracts
# Fill `total_trvt` object with the calculated time
for (i in 1:nrow(home)){
  total_trvt[i] <- get_trvt(home[i,], osm, station, midtown)
}

# Cbind the calculated travel time back to `home`
home_done <- home %>% 
  cbind(trvt = total_trvt)

Step 7. Create maps and plots

Run the code below to generate thematic maps and plots

Write a short description of what you observe from the maps and plots

# Join routes table with trips table with shapes table
trip_routes <- gtfs$trips %>% 
  full_join(gtfs$routes, by = "route_id")

trip_shape <- gtfs$shapes %>% 
  full_join(gtfs$trips %>% 
              select(shape_id, trip_id), 
            by = "shape_id")

# Merging the two into one and then taking only one row for each
# unique combination of route_id and shape_id.
route_trip_shape <- trip_shape %>% 
  select(-shape_id) %>% 
  full_join(trip_routes, by = c("trip_id")) %>% 
  group_by(shape_id, route_id) %>% 
  slice(1)

# Route type is not really intuitive - let's fix that
route_shape <- route_trip_shape %>% 
  mutate(route_type = case_when(
    route_type == "0" ~ 'Tram, Streetcar',
    route_type == "1" ~ 'Subway, Metro',
    route_type == "2" ~ 'Rail',
    route_type == "3" ~ 'Bus'
  ))

tmap_mode('view')

## tmap mode set to interactive viewing

tm_shape(route_shape %>%
           filter(route_type == 'Subway, Metro')) + 
  tm_lines()

# Map
tmap_mode('view')

## tmap mode set to interactive viewing

tm_shape(census[census$GEOID %in% home$GEOID,]) + 
  tm_polygons(col = "hhinc", palette = 'GnBu', title = "Household Income", alpha = 0.5) + 
  tm_shape(home_done) + 
  tm_dots(col = "trvt", palette = 'Reds', size = 0.1, title = "Travel Time") + 
  tm_shape(midtown) + 
  tm_dots(col = "black", size = 0.1,) +
  tm_shape(route_shape %>%
              filter(route_type == 'Subway, Metro')) + 
  tm_lines(size = 0.1, alpha = 0.3)

tm_shape(census[census$GEOID %in% home$GEOID,]) + 
  tm_polygons(col = "pct_minority", palette = 'GnBu', title = "Percentage of minorities", alpha = 0.5) + 
  tm_shape(home_done) + 
  tm_dots(col = "trvt", palette = 'Reds', size = 0.1, title = "Travel Time") + 
  tm_shape(midtown) + 
  tm_dots(col = "black", size = 0.1,) +
  tm_shape(route_shape %>%
              filter(route_type == 'Subway, Metro')) + 
  tm_lines(size = 0.1, alpha = 0.3)

# ggplot
inc <- ggplot(data = home_done,
              aes(x = hhinc, y = trvt)) +
  geom_point() +
  geom_smooth(method = "lm", se = FALSE) +
  labs(x = "Median Annual Household Income",
       y = "Park-and-ride Travel Time from Home to Midtown Station") +
  theme_bw()

minority <- ggplot(data = home_done,
                   aes(x = pct_minority, y = trvt)) +
  geom_point() +
  geom_smooth(method = "lm", se = FALSE) +
  labs(x = "Minority Population (%)",
       y = "Park-and-ride Travel Time from Home to Midtown Station") +
  theme_bw()


ggpubr::ggarrange(inc, minority)

## `geom_smooth()` using formula = 'y ~ x'

## Warning: Removed 6 rows containing non-finite outside the scale range
## (`stat_smooth()`).

## Warning: Removed 6 rows containing missing values or values outside the scale range
## (`geom_point()`).

## `geom_smooth()` using formula = 'y ~ x'

I added the location of the Midtown station and the route of subway lines on the top of the provided maps. I do not notice a statistical correlation that is noteworthy from the scatterplots. Rather, it is interesting that in each of the scatterplot there are two clusters that are devided in terms of the total travel time. At the same time, both when we see the distribution of travel times across median annual household income and minority population percentage, there is a cluster of travel times regardless of the level of each explanatory variable. I guess that these census tracts with short travel times to the Midtown station are mostly the ones geographically close to the Midtown station.

That being said, I feel that the issue of equity in travel times takes more place among the census tracts quite far from the Midtown station, which are likely to be consisting either the upward or the slightly downward association in the two scatterplots. First, census tracts with higher income seem to take longer time to get to the Midtown station. Those tracts are far from the city center and also do not have subway stations nearby. Historically, when the Marta subway system was developed, affluent neighborhoods were not interested in having subway stations nearby and occasionally even opposed to having them. Meanwhile, excluding some of the census tracts located on the eastern side of the study area with both high income level and lower minority level, generally speaking, census tracts with higher percentages of racial and ethnic minorities seem to take longer times to get to the Midtown station. This pattern stems from the fact that census tracts with higher percentages of minority are largely located in the southern and western part of Atlanta, being far from the Midtown station.

Besides this descriptive interpretation, we can also discuss how helpful the park-and-ride policy has been for the socioeconomic and demographic minorities. Despite the distance from the South Atlanta to the Midtown station, some of them take moderate amount of time to get to the Midtown station, which I guess is possible due to the subway lines running through from south to north. However, among the census tracts in the South Atlanta, I see that census tracts farther away from subway lines have longer times to travel to the Midtown station. This indicates that the subway line still does not fully cover the underprivileged neighborhoods in the South Atlanta. A more pressing issue is that many of the residents in those neighborhoods do not own car and therefore, in reality, will need to spend longer times than the ones calculated through our analysis to get to the Midtown station.

Major_assignment_1_template

Originally written by Bon Woo Koo & Subhro Guhathakurta; modified by Uijeong Hwang

2024-10-16