# Load data sets.
hh <- read.csv("C:\\Users\\amuchene\\Downloads\\R training\\R training\\WS2\\hhpub.csv")
trip <-read.csv("C:\\Users\\amuchene\\Downloads\\R training\\R training\\WS2\\trippub.csv")
#merge the household and trip data sets
x <-merge(hh,trip)
head(x)
## HOUSEID TRAVDAY HOMEOWN HHSIZE HHVEHCNT HHFAMINC DRVRCNT HHSTATE HHSTFIPS
## 1 30000007 2 1 3 5 7 3 NC 37
## 2 30000007 2 1 3 5 7 3 NC 37
## 3 30000007 2 1 3 5 7 3 NC 37
## 4 30000007 2 1 3 5 7 3 NC 37
## 5 30000007 2 1 3 5 7 3 NC 37
## 6 30000007 2 1 3 5 7 3 NC 37
## NUMADLT WRKCOUNT TDAYDATE HHRESP LIF_CYC MSACAT MSASIZE RAIL URBAN URBANSIZE
## 1 3 1 201608 1 10 3 1 2 1 1
## 2 3 1 201608 1 10 3 1 2 1 1
## 3 3 1 201608 1 10 3 1 2 1 1
## 4 3 1 201608 1 10 3 1 2 1 1
## 5 3 1 201608 1 10 3 1 2 1 1
## 6 3 1 201608 1 10 3 1 2 1 1
## URBRUR CENSUS_D CENSUS_R CDIVMSAR HH_RACE HH_HISP HH_CBSA SMPLSRCE SAMPSTRAT
## 1 1 5 3 53 2 2 XXXXX 2 3
## 2 1 5 3 53 2 2 XXXXX 2 3
## 3 1 5 3 53 2 2 XXXXX 2 3
## 4 1 5 3 53 2 2 XXXXX 2 3
## 5 1 5 3 53 2 2 XXXXX 2 3
## 6 1 5 3 53 2 2 XXXXX 2 3
## PC SPHONE TAB WALK BIKE CAR TAXI BUS TRAIN PARA PRICE PLACE WALK2SAVE
## 1 2 1 2 5 5 1 5 4 5 5 1 2 4
## 2 2 1 2 5 5 1 5 4 5 5 1 2 4
## 3 2 1 2 5 5 1 5 4 5 5 1 2 4
## 4 2 1 2 5 5 1 5 4 5 5 1 2 4
## 5 2 1 2 5 5 1 5 4 5 5 1 2 4
## 6 2 1 2 5 5 1 5 4 5 5 1 2 4
## BIKE2SAVE PTRANS HHRELATD CNTTDHH YOUNGCHILD SCRESP RESP_CNT WEBUSE17
## 1 4 4 1 6 0 1 3 1
## 2 4 4 1 6 0 1 3 1
## 3 4 4 1 6 0 1 3 1
## 4 4 4 1 6 0 1 3 1
## 5 4 4 1 6 0 1 3 1
## 6 4 4 1 6 0 1 3 1
## WTHHFIN HBHUR HTHTNRNT HTPPOPDN HTRESDN HTEEMPDN HBHTNRNT HBPPOPDN HBRESDN
## 1 187.3143 T 50 1500 750 750 20 750 300
## 2 187.3143 T 50 1500 750 750 20 750 300
## 3 187.3143 T 50 1500 750 750 20 750 300
## 4 187.3143 T 50 1500 750 750 20 750 300
## 5 187.3143 T 50 1500 750 750 20 750 300
## 6 187.3143 T 50 1500 750 750 20 750 300
## PERSONID TDTRPNUM STRTTIME ENDTIME TRVLCMIN TRPMILES TRPTRANS TRPACCMP
## 1 1 1 1000 1015 15 5.244 3 0
## 2 1 2 1510 1530 20 5.149 3 0
## 3 2 1 700 900 120 84.004 6 0
## 4 2 2 1800 2030 150 81.628 6 0
## 5 3 1 845 900 15 2.250 3 0
## 6 3 2 1430 1445 15 2.243 3 0
## TRPHHACC VEHID TRWAITTM NUMTRANS TRACCTM DROP_PRK TREGRTM WHODROVE WHYFROM
## 1 0 3 -1 -1 -1 -1 -1 1 1
## 2 0 3 -1 -1 -1 -1 -1 1 19
## 3 0 5 -1 -1 -1 -1 -1 2 3
## 4 0 5 -1 -1 -1 -1 -1 2 1
## 5 0 1 -1 -1 -1 -1 -1 3 1
## 6 0 1 -1 -1 -1 -1 -1 3 8
## LOOP_TRIP TRPHHVEH HHMEMDRV HH_ONTD NONHHCNT NUMONTRP PSGR_FLG PUBTRANS
## 1 2 1 1 1 0 1 2 2
## 2 2 1 1 1 0 1 2 2
## 3 2 1 1 1 0 1 2 2
## 4 2 1 1 1 0 1 2 2
## 5 2 1 1 1 0 1 2 2
## 6 2 1 1 1 0 1 2 2
## TRIPPURP DWELTIME TDWKND VMT_MILE DRVR_FLG WHYTRP1S ONTD_P1 ONTD_P2 ONTD_P3
## 1 HBO 295 2 5.244 1 20 1 2 2
## 2 HBO -9 2 5.149 1 1 1 2 2
## 3 HBW 540 2 84.004 1 1 2 1 2
## 4 HBW -9 2 81.628 1 10 2 1 2
## 5 HBO 330 2 2.250 1 20 2 2 1
## 6 HBO -9 2 2.243 1 1 2 2 1
## ONTD_P4 ONTD_P5 ONTD_P6 ONTD_P7 ONTD_P8 ONTD_P9 ONTD_P10 ONTD_P11 ONTD_P12
## 1 -1 -1 -1 -1 -1 -1 -1 -1 -1
## 2 -1 -1 -1 -1 -1 -1 -1 -1 -1
## 3 -1 -1 -1 -1 -1 -1 -1 -1 -1
## 4 -1 -1 -1 -1 -1 -1 -1 -1 -1
## 5 -1 -1 -1 -1 -1 -1 -1 -1 -1
## 6 -1 -1 -1 -1 -1 -1 -1 -1 -1
## ONTD_P13 TDCASEID TRACC_WLK TRACC_POV TRACC_BUS TRACC_CRL TRACC_SUB
## 1 -1 300000070101 -1 -1 -1 -1 -1
## 2 -1 300000070102 -1 -1 -1 -1 -1
## 3 -1 300000070201 -1 -1 -1 -1 -1
## 4 -1 300000070202 -1 -1 -1 -1 -1
## 5 -1 300000070301 -1 -1 -1 -1 -1
## 6 -1 300000070302 -1 -1 -1 -1 -1
## TRACC_OTH TREGR_WLK TREGR_POV TREGR_BUS TREGR_CRL TREGR_SUB TREGR_OTH WHYTO
## 1 -1 -1 -1 -1 -1 -1 -1 19
## 2 -1 -1 -1 -1 -1 -1 -1 1
## 3 -1 -1 -1 -1 -1 -1 -1 1
## 4 -1 -1 -1 -1 -1 -1 -1 3
## 5 -1 -1 -1 -1 -1 -1 -1 8
## 6 -1 -1 -1 -1 -1 -1 -1 1
## GASPRICE R_AGE EDUC R_SEX PRMACT PROXY WORKER DRIVER WTTRDFIN WHYTRP90
## 1 228.4 67 3 2 6 1 2 1 75441.91 5
## 2 228.4 67 3 2 6 1 2 1 75441.91 5
## 3 228.4 66 3 1 1 2 1 1 71932.65 1
## 4 228.4 66 3 1 1 2 1 1 71932.65 1
## 5 228.4 28 2 2 5 2 2 1 80122.69 5
## 6 228.4 28 2 2 5 2 2 1 80122.69 5
## TRPMILAD R_AGE_IMP R_SEX_IMP VEHTYPE OBHUR DBHUR OTHTNRNT OTPPOPDN OTRESDN
## 1 5.847584 67 2 1 T T 50 1500 750
## 2 5.741650 67 2 1 T T 50 750 300
## 3 90.178294 66 1 4 S T 40 1500 750
## 4 87.627658 66 1 4 T S 50 1500 750
## 5 2.508975 28 2 1 T T 50 1500 750
## 6 2.501169 28 2 1 T T 50 750 300
## OTEEMPDN OBHTNRNT OBPPOPDN OBRESDN DTHTNRNT DTPPOPDN DTRESDN DTEEMPDN
## 1 750 20 750 300 50 750 300 350
## 2 350 30 300 300 50 1500 750 750
## 3 750 40 1500 750 50 1500 750 750
## 4 750 20 750 300 40 1500 750 750
## 5 750 20 750 300 50 750 300 350
## 6 350 60 750 300 50 1500 750 750
## DBHTNRNT DBPPOPDN DBRESDN
## 1 30 300 300
## 2 20 750 300
## 3 20 750 300
## 4 40 1500 750
## 5 60 750 300
## 6 20 750 300
#subset of Vermont data records
vt <- subset(x,HHSTATE =="VT")
head(vt)
## HOUSEID TRAVDAY HOMEOWN HHSIZE HHVEHCNT HHFAMINC DRVRCNT HHSTATE HHSTFIPS
## 1811 30002242 7 1 3 2 10 2 VT 50
## 1812 30002242 7 1 3 2 10 2 VT 50
## 1813 30002242 7 1 3 2 10 2 VT 50
## 1814 30002242 7 1 3 2 10 2 VT 50
## 1815 30002242 7 1 3 2 10 2 VT 50
## 1816 30002242 7 1 3 2 10 2 VT 50
## NUMADLT WRKCOUNT TDAYDATE HHRESP LIF_CYC MSACAT MSASIZE RAIL URBAN
## 1811 2 1 201608 1 6 3 1 2 1
## 1812 2 1 201608 1 6 3 1 2 1
## 1813 2 1 201608 1 6 3 1 2 1
## 1814 2 1 201608 1 6 3 1 2 1
## 1815 2 1 201608 1 6 3 1 2 1
## 1816 2 1 201608 1 6 3 1 2 1
## URBANSIZE URBRUR CENSUS_D CENSUS_R CDIVMSAR HH_RACE HH_HISP HH_CBSA
## 1811 1 1 1 1 13 1 2 XXXXX
## 1812 1 1 1 1 13 1 2 XXXXX
## 1813 1 1 1 1 13 1 2 XXXXX
## 1814 1 1 1 1 13 1 2 XXXXX
## 1815 1 1 1 1 13 1 2 XXXXX
## 1816 1 1 1 1 13 1 2 XXXXX
## SMPLSRCE SAMPSTRAT PC SPHONE TAB WALK BIKE CAR TAXI BUS TRAIN PARA PRICE
## 1811 1 3 1 1 3 1 3 1 4 5 5 5 2
## 1812 1 3 1 1 3 1 3 1 4 5 5 5 2
## 1813 1 3 1 1 3 1 3 1 4 5 5 5 2
## 1814 1 3 1 1 3 1 3 1 4 5 5 5 2
## 1815 1 3 1 1 3 1 3 1 4 5 5 5 2
## 1816 1 3 1 1 3 1 3 1 4 5 5 5 2
## PLACE WALK2SAVE BIKE2SAVE PTRANS HHRELATD CNTTDHH YOUNGCHILD SCRESP
## 1811 3 4 4 4 1 9 0 1
## 1812 3 4 4 4 1 9 0 1
## 1813 3 4 4 4 1 9 0 1
## 1814 3 4 4 4 1 9 0 1
## 1815 3 4 4 4 1 9 0 1
## 1816 3 4 4 4 1 9 0 1
## RESP_CNT WEBUSE17 WTHHFIN HBHUR HTHTNRNT HTPPOPDN HTRESDN HTEEMPDN
## 1811 3 1 407.8716 T 30 3000 1500 1500
## 1812 3 1 407.8716 T 30 3000 1500 1500
## 1813 3 1 407.8716 T 30 3000 1500 1500
## 1814 3 1 407.8716 T 30 3000 1500 1500
## 1815 3 1 407.8716 T 30 3000 1500 1500
## 1816 3 1 407.8716 T 30 3000 1500 1500
## HBHTNRNT HBPPOPDN HBRESDN PERSONID TDTRPNUM STRTTIME ENDTIME TRVLCMIN
## 1811 5 3000 1500 1 1 700 800 60
## 1812 5 3000 1500 1 2 1430 1545 75
## 1813 5 3000 1500 1 3 2200 2250 50
## 1814 5 3000 1500 2 1 920 940 20
## 1815 5 3000 1500 2 2 1315 1335 20
## 1816 5 3000 1500 2 3 1430 1455 25
## TRPMILES TRPTRANS TRPACCMP TRPHHACC VEHID TRWAITTM NUMTRANS TRACCTM
## 1811 1.222 1 1 0 -1 -1 -1 -1
## 1812 2.000 1 1 0 -1 -1 -1 -1
## 1813 0.889 1 1 0 -1 -1 -1 -1
## 1814 4.228 4 0 0 1 -1 -1 -1
## 1815 4.259 4 0 0 1 -1 -1 -1
## 1816 7.995 4 1 1 1 -1 -1 -1
## DROP_PRK TREGRTM WHODROVE WHYFROM LOOP_TRIP TRPHHVEH HHMEMDRV HH_ONTD
## 1811 -1 -1 -1 1 1 2 -1 1
## 1812 -1 -1 -1 1 1 2 -1 1
## 1813 -1 -1 -1 1 1 2 -1 1
## 1814 -1 -1 2 1 2 1 1 1
## 1815 -1 -1 2 5 2 1 1 1
## 1816 -1 -1 2 1 2 1 1 2
## NONHHCNT NUMONTRP PSGR_FLG PUBTRANS TRIPPURP DWELTIME TDWKND VMT_MILE
## 1811 1 2 -1 2 HBO 390 1 -1.000
## 1812 1 2 -1 2 HBO 375 1 -1.000
## 1813 1 2 -1 2 HBO -9 1 -1.000
## 1814 0 1 2 2 HBO 215 1 4.228
## 1815 0 1 2 2 HBO 55 1 4.259
## 1816 0 2 2 2 HBSHOP 140 1 7.995
## DRVR_FLG WHYTRP1S ONTD_P1 ONTD_P2 ONTD_P3 ONTD_P4 ONTD_P5 ONTD_P6 ONTD_P7
## 1811 -1 1 1 2 2 -1 -1 -1 -1
## 1812 -1 1 1 2 2 -1 -1 -1 -1
## 1813 -1 1 1 2 2 -1 -1 -1 -1
## 1814 1 97 2 1 2 -1 -1 -1 -1
## 1815 1 1 2 1 2 -1 -1 -1 -1
## 1816 1 40 2 1 1 -1 -1 -1 -1
## ONTD_P8 ONTD_P9 ONTD_P10 ONTD_P11 ONTD_P12 ONTD_P13 TDCASEID TRACC_WLK
## 1811 -1 -1 -1 -1 -1 -1 300022420101 -1
## 1812 -1 -1 -1 -1 -1 -1 300022420102 -1
## 1813 -1 -1 -1 -1 -1 -1 300022420103 -1
## 1814 -1 -1 -1 -1 -1 -1 300022420201 -1
## 1815 -1 -1 -1 -1 -1 -1 300022420202 -1
## 1816 -1 -1 -1 -1 -1 -1 300022420203 -1
## TRACC_POV TRACC_BUS TRACC_CRL TRACC_SUB TRACC_OTH TREGR_WLK TREGR_POV
## 1811 -1 -1 -1 -1 -1 -1 -1
## 1812 -1 -1 -1 -1 -1 -1 -1
## 1813 -1 -1 -1 -1 -1 -1 -1
## 1814 -1 -1 -1 -1 -1 -1 -1
## 1815 -1 -1 -1 -1 -1 -1 -1
## 1816 -1 -1 -1 -1 -1 -1 -1
## TREGR_BUS TREGR_CRL TREGR_SUB TREGR_OTH WHYTO GASPRICE R_AGE EDUC R_SEX
## 1811 -1 -1 -1 -1 1 223.7 58 5 1
## 1812 -1 -1 -1 -1 1 223.7 58 5 1
## 1813 -1 -1 -1 -1 1 223.7 58 5 1
## 1814 -1 -1 -1 -1 5 223.7 52 3 2
## 1815 -1 -1 -1 -1 1 223.7 52 3 2
## 1816 -1 -1 -1 -1 11 223.7 52 3 2
## PRMACT PROXY WORKER DRIVER WTTRDFIN WHYTRP90 TRPMILAD R_AGE_IMP R_SEX_IMP
## 1811 1 1 1 1 161532.5 10 1.222000 58 1
## 1812 1 1 1 1 161532.5 10 2.000000 58 1
## 1813 1 1 1 1 161532.5 10 0.889000 58 1
## 1814 4 1 2 1 138311.3 4 4.714643 52 2
## 1815 4 1 2 1 138311.3 4 4.749211 52 2
## 1816 4 1 2 1 138311.3 3 8.915225 52 2
## VEHTYPE OBHUR DBHUR OTHTNRNT OTPPOPDN OTRESDN OTEEMPDN OBHTNRNT OBPPOPDN
## 1811 -1 T T 30 3000 1500 1500 5 3000
## 1812 -1 T T 30 3000 1500 1500 5 3000
## 1813 -1 T T 30 3000 1500 1500 5 3000
## 1814 3 T S 30 3000 1500 1500 5 3000
## 1815 3 S T 30 300 300 150 70 7000
## 1816 3 T S 30 3000 1500 1500 5 3000
## OBRESDN DTHTNRNT DTPPOPDN DTRESDN DTEEMPDN DBHTNRNT DBPPOPDN DBRESDN
## 1811 1500 30 3000 1500 1500 5 3000 1500
## 1812 1500 30 3000 1500 1500 5 3000 1500
## 1813 1500 30 3000 1500 1500 5 3000 1500
## 1814 1500 30 300 300 150 70 7000 1500
## 1815 1500 30 3000 1500 1500 5 3000 1500
## 1816 1500 40 3000 1500 1500 50 1500 750
library(readxl)
IncCodes=read_excel("C:\\Users\\amuchene\\Downloads\\R training\\R training\\WS2\\Income Codes.xlsx")
TripCodes=read_excel("C:\\Users\\amuchene\\Downloads\\R training\\R training\\WS2\\Trip Codes.xlsx")
vt = merge(vt, IncCodes)
vt = merge(vt, TripCodes)
#create new data.frame with just the data we need
vt2=data.frame(vt$HHINC, vt$TRIPPUR, vt$TRPMILES)
#rename the columns to better organize things
names(vt2) = c("Income", "Trip_Purpose", "Miles")
head(vt2)
## Income Trip_Purpose Miles
## 1 I don't know Home 26.935
## 2 $125,000 to $149,999 Home 3.402
## 3 $50,000 to $74,999 Home 2.695
## 4 I don't know Home 1.143
## 5 I don't know Home 2.844
## 6 $35,000 to $49,999 Home 0.677