# ==============================================================================
# COPY/PASTE READY REFERENCE VALUES - GYNECOLOGIC ONCOLOGY ACCESSIBILITY PROJECT
# WITH OFFICIAL SOURCES AND CITATIONS
# ==============================================================================
# TAXONOMY CODES FOR OBGYN SUBSPECIALISTS
# Source: National Uniform Claim Committee (NUCC) Health Care Provider Taxonomy
# URL: https://taxonomy.nucc.org/
# Last Updated: Version 23.1 (July 2023)
# Character vector of the NUCC taxonomy codes in the 207V (Obstetrics &
# Gynecology) family that this project tracks. Element order is significant
# only in that it is kept exactly as originally listed.
obgyn_taxonomy_codes <- c(
  "207V00000X",  # Obstetrics & Gynecology, no subspecialty
  "207VX0201X",  # Gynecologic Oncology -- the project's primary focus
  "207VE0102X",  # Reproductive Endocrinology and Infertility
  "207VG0400X",  # Gynecology
  "207VM0101X",  # Maternal & Fetal Medicine
  "207VF0040X",  # Female Pelvic Medicine / Urogynecology
  "207VB0002X",  # Bariatric Medicine (NUCC may now title this Obesity
                 # Medicine -- TODO confirm against the current code set)
  "207VC0200X",  # Critical Care Medicine
  "207VC0300X",  # Complex Family Planning
  "207VH0002X",  # Hospice and Palliative Medicine
  "207VX0000X"   # Obstetrics
)
# RUCA CODES (RURAL-URBAN COMMUTING AREAS)
# Source: USDA Economic Research Service
# URL: https://www.ers.usda.gov/data-products/rural-urban-commuting-area-codes/
# Publication: "Rural-Urban Commuting Area Codes" (2010 Census-based, most recent)
# Citation: USDA ERS. Rural-Urban Commuting Area Codes. Washington, DC: Economic Research Service; 2013.
# Every RUCA secondary code the project recognises, in ascending order.
# Fix: 4.0 (micropolitan core, no secondary flow) was missing, so any tract
# carrying the plain micropolitan-core code fell outside every category below.
# NOTE(review): the list appears to mix codes from more than one RUCA vintage
# and omits 99 ("not coded") -- confirm against the vintage actually joined.
ruca_codes_all <- c(
  1.0, 1.1, 2.0, 2.1, 3.0,
  4.0, 4.1, 4.2, 5.0, 5.1, 6.0, 6.1,
  7.0, 7.1, 7.2, 7.3, 7.4, 8.0, 8.1, 8.2, 8.3, 8.4,
  9.0, 10.0, 10.1, 10.2, 10.3, 10.4, 10.5, 10.6
)
# RUCA SIMPLIFIED CATEGORIES
# Source: Hart LG, Larson EH, Lishner DM. Rural definitions for health policy research.
# Am J Public Health. 2005;95(7):1149-1155.
# Also: Morrill R, Cromartie J, Hart G. Metropolitan, urban, and rural commuting areas:
# toward a better depiction of the United States settlement system. Urban Geography. 1999;20(8):727-748.
# The four vectors below partition ruca_codes_all: each code appears in
# exactly one category.
ruca_metropolitan <- c(1.0, 1.1, 2.0, 2.1, 3.0) # Large metro areas
ruca_micropolitan <- c(4.0, 4.1, 4.2, 5.0, 5.1, 6.0, 6.1) # Mid-size cities
ruca_small_town <- c(7.0, 7.1, 7.2, 7.3, 7.4, 8.0, 8.1, 8.2, 8.3, 8.4) # Small towns
ruca_rural <- c(9.0, 10.0, 10.1, 10.2, 10.3, 10.4, 10.5, 10.6) # Rural areas
# US CENSUS REGIONS AND DIVISIONS
# Source: US Census Bureau Geography Division
# URL: https://www2.census.gov/geo/pdfs/maps-data/maps/reference/us_regdiv.pdf
# Publication: "Geographic Areas Reference Manual" Chapter 6
# Citation: US Census Bureau. Geographic Areas Reference Manual. Washington, DC: US Census Bureau; 1994.
# Official Definition: Title 13, United States Code, Section 4
# Names of the four Census regions.
census_regions <- c(
  "Northeast",
  "Midwest",
  "South",
  "West"
)
# Names of the nine Census divisions, three per row below.
census_divisions <- c(
  "New England", "Middle Atlantic", "East North Central",
  "West North Central", "South Atlantic", "East South Central",
  "West South Central", "Mountain", "Pacific"
)
# STATE ABBREVIATIONS BY CENSUS REGION
# Source: US Census Bureau, Geography Division
# URL: https://www.census.gov/geographies/reference-files/2010/geo/state-area.html
# Note: Two-letter state abbreviations follow Federal Information Processing Standards (FIPS) Publication 5-2
# Two-letter postal abbreviations for each Census region. Within a region
# the states are laid out one Census division per row; the element order is
# unchanged from the original single-line vectors. Together the four vectors
# hold 51 entries (50 states plus DC).
northeast_states <- c(
  "CT", "ME", "MA", "NH", "RI", "VT",  # New England
  "NJ", "NY", "PA"                     # Middle Atlantic
)
midwest_states <- c(
  "IL", "IN", "MI", "OH", "WI",              # East North Central
  "IA", "KS", "MN", "MO", "NE", "ND", "SD"   # West North Central
)
south_states <- c(
  "DE", "FL", "GA", "MD", "NC", "SC", "VA", "WV", "DC",  # South Atlantic
  "AL", "KY", "MS", "TN",                                # East South Central
  "AR", "LA", "OK", "TX"                                 # West South Central
)
west_states <- c(
  "AZ", "CO", "ID", "MT", "NV", "NM", "UT", "WY",  # Mountain
  "AK", "CA", "HI", "OR", "WA"                     # Pacific
)
# ACOG DISTRICTS BY STATE
# Source: American College of Obstetricians and Gynecologists
# URL: https://www.acog.org/about/districts-and-sections
# Publication: ACOG Organization Manual, current as of 2023
# Citation: American College of Obstetricians and Gynecologists. District Organization. Washington, DC: ACOG; 2023.
# US states (plus DC) belonging to each ACOG district, one vector per
# district number.
# Fix: the earlier grouping did not match ACOG's published districts (for
# example it placed TX in District X, FL in District V, and paired MI with NC
# as District XI). Texas is its own district (XI), Florida is its own district
# (XII), California alone forms District IX, and District X is the Armed
# Forces District, which is not defined by state.
# Only the 50 states and DC are listed; ACOG's non-US sections and US
# territories are left out. Every state appears in exactly one vector.
# NOTE(review): verify against the ACOG districts page cited above before
# publishing results that depend on this grouping.
acog_district_1 <- c("CT", "ME", "MA", "NH", "RI", "VT") # District I
acog_district_2 <- c("NY") # District II
acog_district_3 <- c("DE", "NJ", "PA") # District III
acog_district_4 <- c("DC", "GA", "MD", "NC", "SC", "VA", "WV") # District IV
acog_district_5 <- c("IN", "KY", "MI", "OH") # District V
acog_district_6 <- c("IL", "IA", "MN", "NE", "ND", "SD", "WI") # District VI
acog_district_7 <- c("AL", "AR", "KS", "LA", "MS", "MO", "OK", "TN") # District VII
acog_district_8 <- c("AK", "AZ", "CO", "HI", "ID", "MT", "NV", "NM", "OR", "UT", "WA", "WY") # District VIII
acog_district_9 <- c("CA") # District IX
acog_district_10 <- character(0) # Armed Forces District: no state membership
acog_district_11 <- c("TX") # District XI
acog_district_12 <- c("FL") # District XII
# ALL US STATES AND TERRITORIES
# Source: Federal Information Processing Standards (FIPS) Publication 5-2
# URL: https://www.census.gov/library/reference/code-lists/ansi.html
# Citation: National Institute of Standards and Technology. FIPS PUB 5-2: Codes for the Identification of the States. Gaithersburg, MD: NIST; 1987.
# Postal abbreviations for the 50 states in alphabetical order of state
# name, with DC appended as the 51st element.
all_states <- c(
  "AL", "AK", "AZ", "AR", "CA", "CO", "CT", "DE", "FL", "GA",
  "HI", "ID", "IL", "IN", "IA", "KS", "KY", "LA", "ME", "MD",
  "MA", "MI", "MN", "MS", "MO", "MT", "NE", "NV", "NH", "NJ",
  "NM", "NY", "NC", "ND", "OH", "OK", "OR", "PA", "RI", "SC",
  "SD", "TN", "TX", "UT", "VT", "VA", "WA", "WV", "WI", "WY",
  "DC"
)
# Territory abbreviations, kept separate from all_states.
us_territories <- c(
  "AS",  # American Samoa
  "GU",  # Guam
  "MP",  # Northern Mariana Islands
  "PR",  # Puerto Rico
  "VI"   # Virgin Islands
)
# STATE FIPS CODES
# Source: Federal Information Processing Standards (FIPS) Publication 5-2
# URL: https://www.census.gov/library/reference/code-lists/ansi.html
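# Citation: National Institute of Standards and Technology. FIPS PUB 5-2: Codes for the Identification of the States. Gaithersburg, MD: NIST; 1987.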
# Two-digit state FIPS codes stored as zero-padded strings (so "01" keeps
# its leading zero). The order parallels all_states: states alphabetical by
# name, with DC ("11") last rather than in numeric position.
state_fips <- c(
  "01", "02", "04", "05", "06", "08", "09", "10", "12", "13",
  "15", "16", "17", "18", "19", "20", "21", "22", "23", "24",
  "25", "26", "27", "28", "29", "30", "31", "32", "33", "34",
  "35", "36", "37", "38", "39", "40", "41", "42", "44", "45",
  "46", "47", "48", "49", "50", "51", "53", "54", "55", "56",
  "11"
)
# REFERENCE DATES - THIRD FRIDAY OCTOBER 9AM (2013-2023)
# Source: Project methodology decision
# Rationale: Standardized weekday morning time to avoid rush hour peaks and ensure consistency
# Citation: Muffly T. Gynecologic Oncology Accessibility Project Methodology. 2024.
# One "YYYY-MM-DD" string per study year, each the third Friday of October.
reference_dates_2013_2023 <- c(
  "2013-10-18",
  "2014-10-17",
  "2015-10-16",
  "2016-10-21",
  "2017-10-20",
  "2018-10-19",
  "2019-10-18",
  "2020-10-16",
  "2021-10-15",
  "2022-10-21",
  "2023-10-20"
)
# ISO DATETIME FORMAT FOR API CALLS
# Source: ISO 8601 Standard for date/time representation
# URL: https://www.iso.org/iso-8601-date-and-time-format.html
# Same eleven dates with the fixed 09:00:00 time-of-day appended. The strings
# carry no UTC offset or zone designator.
iso_datetime_2013_2023 <- paste0(reference_dates_2013_2023, "T09:00:00")
# DRIVE TIME THRESHOLDS
# Source: Healthcare accessibility literature standards
# Citations:
# - Penchansky R, Thomas JW. The concept of access: definition and relationship to consumer satisfaction. Med Care. 1981;19(2):127-140.
# - Wang F, Luo W. Assessing spatial and nonspatial factors for healthcare access: towards an integrated approach to defining health professional shortage areas. Health Place. 2005;11(2):131-146.
# Drive-time cut-offs in minutes (half an hour up to three hours).
drive_times_minutes <- c(30, 60, 120, 180)
# The same cut-offs expressed in seconds, the unit passed to the HERE API.
drive_times_seconds <- drive_times_minutes * 60
# COORDINATE REFERENCE SYSTEMS (EPSG CODES)
# Source: European Petroleum Survey Group (EPSG) Geodetic Parameter Dataset
# URL: https://epsg.org/
# Citation: EPSG. EPSG Geodetic Parameter Dataset. Oil & Gas Producers Association; 2023.
# Numeric CRS identifiers, one per use in the pipeline.
# Geographic lon/lat used for input coordinates.
epsg_wgs84 <- 4326
# Web Mercator, used for web map display.
epsg_web_mercator <- 3857
# US Albers Equal Area, used for analysis.
epsg_us_albers <- 5070
# Alaska Albers.
epsg_alaska_albers <- 3338
# Labelled "Hawaii Albers" by the project.
# NOTE(review): EPSG:4135 appears to be the "Old Hawaiian" geographic
# (lon/lat) CRS rather than an Albers projection. A Hawaii Albers Equal Area
# Conic definition is published under the ESRI authority ("ESRI:102007"),
# not as a numeric EPSG code -- confirm which CRS is intended before using
# this value for area or distance work.
epsg_hawaii_albers <- 4135
# CENSUS VARIABLES (ACS 5-YEAR)
# Source: US Census Bureau American Community Survey
# URL: https://www.census.gov/programs-surveys/acs/guidance/subjects.html
# Publication: American Community Survey Subject Definitions
# Citation: US Census Bureau. American Community Survey Subject Definitions. Washington, DC: US Census Bureau; 2021.
# ACS 5-year variable IDs, stored as strings in "<table>_<cell>" form.
# Population totals.
census_total_population  <- "B01003_001"
census_female_population <- "B01001_026"
# Race cells, all drawn from table B03002.
# NOTE(review): B03002 is the Hispanic-origin-by-race table, so cells
# _003 to _006 are presumably the *non-Hispanic* "alone" counts -- confirm
# that is the definition the analysis intends.
census_white_alone <- "B03002_003"
census_black_alone <- "B03002_004"
census_asian_alone <- "B03002_006"
census_aian_alone  <- "B03002_005"  # American Indian / Alaska Native
# Income and housing.
census_median_income <- "B19013_001"
census_housing_units <- "B25001_001"
# HERE API ENDPOINTS
# Source: HERE Technologies Developer Documentation
# URL: https://developer.here.com/documentation/
# Citation: HERE Technologies. HERE Platform Developer Guide. Eindhoven, Netherlands: HERE; 2023.
# Full request URLs for the three HERE services the project calls.
# NOTE(review): the paths name service versions 6.2 (geocoder) and 7.2
# (routing); confirm these versions are still served before relying on them.
# Forward geocoding: address -> coordinates.
here_geocoding_url <-
  "https://geocoder.ls.hereapi.com/6.2/geocode.json"
# Reverse geocoding: coordinates -> address.
here_reverse_geocoding_url <-
  "https://reverse.geocoder.ls.hereapi.com/6.2/reversegeocode.json"
# Isoline (drive-time polygon) calculation.
here_isoline_url <-
  "https://isoline.route.ls.hereapi.com/routing/7.2/calculateisoline.json"
# HERE API PARAMETERS
# Source: HERE Routing API Documentation
# URL: https://developer.here.com/documentation/routing-api/dev_guide/topics/resource-calculate-isoline.html
# Default request parameters for HERE isoline calls.
# String-valued options.
here_isoline_mode      <- "car"
here_isoline_traffic   <- "enabled"
here_isoline_rangetype <- "time"
# Numeric options. The project treats 1 as the highest setting for both
# resolution and quality, and caps each polygon at 1000 points.
here_isoline_resolution <- 1
here_isoline_maxpoints  <- 1000
here_isoline_quality    <- 1
# US TIMEZONES
# Source: Internet Assigned Numbers Authority (IANA) Time Zone Database
# URL: https://www.iana.org/time-zones
# Citation: IANA. Time Zone Database. Internet Assigned Numbers Authority; 2023.
# IANA zone identifiers and their display names, held as parallel vectors:
# timezone_names[i] is the label for us_timezones[i].
us_timezones <- c(
  "America/New_York",
  "America/Chicago",
  "America/Denver",
  "America/Los_Angeles",
  "America/Anchorage",
  "Pacific/Honolulu"
)
timezone_names <- c(
  "Eastern",
  "Central",
  "Mountain",
  "Pacific",
  "Alaska",
  "Hawaii"
)
# MAJOR METROPOLITAN AREAS (CBSAs)
# Source: Office of Management and Budget
# URL: https://www.whitehouse.gov/omb/management/office-federal-financial-management/
# Publication: OMB Bulletin No. 20-01 (March 6, 2020)
# Citation: Office of Management and Budget. Revised Delineations of Metropolitan Statistical Areas, Micropolitan Statistical Areas, and Combined Statistical Areas. Washington, DC: OMB; 2020.
# CBSA codes and MSA titles are parallel vectors: major_cbsa_codes[i] is the
# code for major_msa_names[i].
# Fix: two codes did not identify the area named at the same position.
#   position 6:  33460 is Minneapolis-St. Paul-Bloomington; Miami is 33100.
#   position 13: 41740 is San Diego-Carlsbad; San Antonio is 41700.
# The codes were changed to match the listed titles; the titles are untouched.
# NOTE(review): several titles (e.g. "San Francisco-Oakland-Hayward") look
# like pre-2020 delineation names -- confirm against the bulletin cited above
# if the strings are used for matching.
major_cbsa_codes <- c(
  "35620",  # New York-Newark-Jersey City
  "31080",  # Los Angeles-Long Beach-Anaheim
  "16980",  # Chicago-Naperville-Elgin
  "19100",  # Dallas-Fort Worth-Arlington
  "26420",  # Houston-The Woodlands-Sugar Land
  "33100",  # Miami-Fort Lauderdale-West Palm Beach
  "37980",  # Philadelphia-Camden-Wilmington
  "40140",  # Riverside-San Bernardino-Ontario
  "41860",  # San Francisco-Oakland-Hayward
  "47900",  # Washington-Arlington-Alexandria
  "12060",  # Atlanta-Sandy Springs-Roswell
  "14460",  # Boston-Cambridge-Newton
  "41700",  # San Antonio-New Braunfels
  "38060"   # Phoenix-Mesa-Scottsdale
)
major_msa_names <- c(
  "New York-Newark-Jersey City, NY-NJ-PA",
  "Los Angeles-Long Beach-Anaheim, CA",
  "Chicago-Naperville-Elgin, IL-IN-WI",
  "Dallas-Fort Worth-Arlington, TX",
  "Houston-The Woodlands-Sugar Land, TX",
  "Miami-Fort Lauderdale-West Palm Beach, FL",
  "Philadelphia-Camden-Wilmington, PA-NJ-DE-MD",
  "Riverside-San Bernardino-Ontario, CA",
  "San Francisco-Oakland-Hayward, CA",
  "Washington-Arlington-Alexandria, DC-VA-MD-WV",
  "Atlanta-Sandy Springs-Roswell, GA",
  "Boston-Cambridge-Newton, MA-NH",
  "San Antonio-New Braunfels, TX",
  "Phoenix-Mesa-Scottsdale, AZ"
)
# MAJOR INTERSTATE HIGHWAYS
# Source: Federal Highway Administration
# URL: https://www.fhwa.dot.gov/planning/national_highway_system/
# Publication: National Highway System
# Citation: Federal Highway Administration. National Highway System. Washington, DC: US Department of Transportation; 2023.
# East-West Interstates
# Route labels are built by prefixing each route number with "I-".
interstate_east_west <- paste0("I-", c(10, 20, 30, 40, 70, 80, 90))
# North-South Interstates
interstate_north_south <- paste0("I-", c(5, 15, 25, 35, 65, 75, 85, 95))
# All Major Interstates
# East-west routes first, then north-south, each in the order given above.
all_major_interstates <- c(interstate_east_west, interstate_north_south)
# VALIDATION THRESHOLDS
# Source: Project quality control standards based on literature review
# Citations:
# - Baldwin LM, et al. Access to specialty health care for rural American Indians in the northwest. Med Care. 2008;46(12):1218-1224.
# - Onega T, et al. Geographic access to cancer care in the U.S. Cancer. 2008;112(4):909-918.
# Lower bounds used as pipeline sanity checks.
# Record counts (absolute numbers).
min_provider_count <- 40000  # fewest NPPES providers expected
min_gyn_onc_count  <- 1000   # fewest gynecologic oncologists expected
# Success and coverage rates (proportions between 0 and 1).
min_geocoding_success   <- 0.85  # share of addresses geocoded
min_isochrone_success   <- 0.90  # share of isochrones generated
min_population_coverage <- 0.95  # share of census population covered
# QUALITY CONTROL RANGES
# Source: US Geological Survey Geographic Names Information System
# URL: https://geonames.usgs.gov/domestic/
# Citation: US Geological Survey. Geographic Names Information System. Reston, VA: USGS; 2023.
# Bounding box (decimal degrees) used to sanity-check coordinates.
# Latitude limits.
max_coordinate_lat <- 71.5  # northern limit, Alaska
min_coordinate_lat <- 18.9  # southern limit, Hawaii
# Longitude limits (negative = west of Greenwich).
max_coordinate_lon <- -66.9   # eastern limit, Maine
min_coordinate_lon <- -179.1  # western limit, Alaska
# NOTE(review): the box appears to cover the 50 states only. Alaska's
# Aleutian chain crosses the 180th meridian into positive longitudes, and
# the territories lie outside these limits -- confirm whether such points
# should pass the check.
# CENSUS GEOGRAPHY COUNTS (2020 Census)
# Source: US Census Bureau Geography Division
# URL: https://www.census.gov/geographies/reference-files/2020/geo/tallies/
# Publication: 2020 Census Geographic Tallies
# Citation: US Census Bureau. 2020 Census Geographic Tallies. Washington, DC: US Census Bureau; 2021.
# Expected feature counts per 2020 Census geography level, from the largest
# unit down to the smallest.
census_2020_states <- 51  # the 50 states plus DC
census_2020_counties <- 3143  # counties
census_2020_tracts <- 84414  # census tracts
# NOTE(review): confirm the block-group tally uses the same universe
# (50 states + DC) as the three counts above; it may include Puerto Rico.
census_2020_block_groups <- 242335  # block groups
# API RATE LIMITS
# Source: HERE Technologies Developer Portal
# URL: https://developer.here.com/pricing
# Current as of: 2023
# Request quotas the project budgets against.
# HERE free-tier allowances, counted per month.
here_geocoding_free_limit <- 30000
here_isoline_free_limit   <- 2500
# Census API allowance per day when no API key is supplied.
census_api_daily_limit <- 500
# DIRECTORY STRUCTURE
# Source: Project organization standards following best practices
# Citation: Wilson G, et al. Good enough practices in scientific computing. PLoS Comput Biol. 2017;13(6):e1005510.
# Relative directory paths used by the project. Every path ends with a
# trailing "/" so a file name can be appended directly.
# Data stages, all under data/.
dir_data_raw       <- "data/raw/"
dir_data_processed <- "data/processed/"
dir_data_geocoded  <- "data/geocoded/"
dir_data_spatial   <- "data/spatial/"
# Outputs and scratch space.
dir_results <- "results/"
dir_figures <- "figures/"
dir_cache   <- "cache/"