# Load data sets.

hh <- read.csv("C:\\Users\\amuchene\\Downloads\\R training\\R training\\WS2\\hhpub.csv")

trip <-read.csv("C:\\Users\\amuchene\\Downloads\\R training\\R training\\WS2\\trippub.csv")

#merge the household and trip data sets

x <-merge(hh,trip)

head(x)
##    HOUSEID TRAVDAY HOMEOWN HHSIZE HHVEHCNT HHFAMINC DRVRCNT HHSTATE HHSTFIPS
## 1 30000007       2       1      3        5        7       3      NC       37
## 2 30000007       2       1      3        5        7       3      NC       37
## 3 30000007       2       1      3        5        7       3      NC       37
## 4 30000007       2       1      3        5        7       3      NC       37
## 5 30000007       2       1      3        5        7       3      NC       37
## 6 30000007       2       1      3        5        7       3      NC       37
##   NUMADLT WRKCOUNT TDAYDATE HHRESP LIF_CYC MSACAT MSASIZE RAIL URBAN URBANSIZE
## 1       3        1   201608      1      10      3       1    2     1         1
## 2       3        1   201608      1      10      3       1    2     1         1
## 3       3        1   201608      1      10      3       1    2     1         1
## 4       3        1   201608      1      10      3       1    2     1         1
## 5       3        1   201608      1      10      3       1    2     1         1
## 6       3        1   201608      1      10      3       1    2     1         1
##   URBRUR CENSUS_D CENSUS_R CDIVMSAR HH_RACE HH_HISP HH_CBSA SMPLSRCE SAMPSTRAT
## 1      1        5        3       53       2       2   XXXXX        2         3
## 2      1        5        3       53       2       2   XXXXX        2         3
## 3      1        5        3       53       2       2   XXXXX        2         3
## 4      1        5        3       53       2       2   XXXXX        2         3
## 5      1        5        3       53       2       2   XXXXX        2         3
## 6      1        5        3       53       2       2   XXXXX        2         3
##   PC SPHONE TAB WALK BIKE CAR TAXI BUS TRAIN PARA PRICE PLACE WALK2SAVE
## 1  2      1   2    5    5   1    5   4     5    5     1     2         4
## 2  2      1   2    5    5   1    5   4     5    5     1     2         4
## 3  2      1   2    5    5   1    5   4     5    5     1     2         4
## 4  2      1   2    5    5   1    5   4     5    5     1     2         4
## 5  2      1   2    5    5   1    5   4     5    5     1     2         4
## 6  2      1   2    5    5   1    5   4     5    5     1     2         4
##   BIKE2SAVE PTRANS HHRELATD CNTTDHH YOUNGCHILD SCRESP RESP_CNT WEBUSE17
## 1         4      4        1       6          0      1        3        1
## 2         4      4        1       6          0      1        3        1
## 3         4      4        1       6          0      1        3        1
## 4         4      4        1       6          0      1        3        1
## 5         4      4        1       6          0      1        3        1
## 6         4      4        1       6          0      1        3        1
##    WTHHFIN HBHUR HTHTNRNT HTPPOPDN HTRESDN HTEEMPDN HBHTNRNT HBPPOPDN HBRESDN
## 1 187.3143     T       50     1500     750      750       20      750     300
## 2 187.3143     T       50     1500     750      750       20      750     300
## 3 187.3143     T       50     1500     750      750       20      750     300
## 4 187.3143     T       50     1500     750      750       20      750     300
## 5 187.3143     T       50     1500     750      750       20      750     300
## 6 187.3143     T       50     1500     750      750       20      750     300
##   PERSONID TDTRPNUM STRTTIME ENDTIME TRVLCMIN TRPMILES TRPTRANS TRPACCMP
## 1        1        1     1000    1015       15    5.244        3        0
## 2        1        2     1510    1530       20    5.149        3        0
## 3        2        1      700     900      120   84.004        6        0
## 4        2        2     1800    2030      150   81.628        6        0
## 5        3        1      845     900       15    2.250        3        0
## 6        3        2     1430    1445       15    2.243        3        0
##   TRPHHACC VEHID TRWAITTM NUMTRANS TRACCTM DROP_PRK TREGRTM WHODROVE WHYFROM
## 1        0     3       -1       -1      -1       -1      -1        1       1
## 2        0     3       -1       -1      -1       -1      -1        1      19
## 3        0     5       -1       -1      -1       -1      -1        2       3
## 4        0     5       -1       -1      -1       -1      -1        2       1
## 5        0     1       -1       -1      -1       -1      -1        3       1
## 6        0     1       -1       -1      -1       -1      -1        3       8
##   LOOP_TRIP TRPHHVEH HHMEMDRV HH_ONTD NONHHCNT NUMONTRP PSGR_FLG PUBTRANS
## 1         2        1        1       1        0        1        2        2
## 2         2        1        1       1        0        1        2        2
## 3         2        1        1       1        0        1        2        2
## 4         2        1        1       1        0        1        2        2
## 5         2        1        1       1        0        1        2        2
## 6         2        1        1       1        0        1        2        2
##   TRIPPURP DWELTIME TDWKND VMT_MILE DRVR_FLG WHYTRP1S ONTD_P1 ONTD_P2 ONTD_P3
## 1      HBO      295      2    5.244        1       20       1       2       2
## 2      HBO       -9      2    5.149        1        1       1       2       2
## 3      HBW      540      2   84.004        1        1       2       1       2
## 4      HBW       -9      2   81.628        1       10       2       1       2
## 5      HBO      330      2    2.250        1       20       2       2       1
## 6      HBO       -9      2    2.243        1        1       2       2       1
##   ONTD_P4 ONTD_P5 ONTD_P6 ONTD_P7 ONTD_P8 ONTD_P9 ONTD_P10 ONTD_P11 ONTD_P12
## 1      -1      -1      -1      -1      -1      -1       -1       -1       -1
## 2      -1      -1      -1      -1      -1      -1       -1       -1       -1
## 3      -1      -1      -1      -1      -1      -1       -1       -1       -1
## 4      -1      -1      -1      -1      -1      -1       -1       -1       -1
## 5      -1      -1      -1      -1      -1      -1       -1       -1       -1
## 6      -1      -1      -1      -1      -1      -1       -1       -1       -1
##   ONTD_P13     TDCASEID TRACC_WLK TRACC_POV TRACC_BUS TRACC_CRL TRACC_SUB
## 1       -1 300000070101        -1        -1        -1        -1        -1
## 2       -1 300000070102        -1        -1        -1        -1        -1
## 3       -1 300000070201        -1        -1        -1        -1        -1
## 4       -1 300000070202        -1        -1        -1        -1        -1
## 5       -1 300000070301        -1        -1        -1        -1        -1
## 6       -1 300000070302        -1        -1        -1        -1        -1
##   TRACC_OTH TREGR_WLK TREGR_POV TREGR_BUS TREGR_CRL TREGR_SUB TREGR_OTH WHYTO
## 1        -1        -1        -1        -1        -1        -1        -1    19
## 2        -1        -1        -1        -1        -1        -1        -1     1
## 3        -1        -1        -1        -1        -1        -1        -1     1
## 4        -1        -1        -1        -1        -1        -1        -1     3
## 5        -1        -1        -1        -1        -1        -1        -1     8
## 6        -1        -1        -1        -1        -1        -1        -1     1
##   GASPRICE R_AGE EDUC R_SEX PRMACT PROXY WORKER DRIVER WTTRDFIN WHYTRP90
## 1    228.4    67    3     2      6     1      2      1 75441.91        5
## 2    228.4    67    3     2      6     1      2      1 75441.91        5
## 3    228.4    66    3     1      1     2      1      1 71932.65        1
## 4    228.4    66    3     1      1     2      1      1 71932.65        1
## 5    228.4    28    2     2      5     2      2      1 80122.69        5
## 6    228.4    28    2     2      5     2      2      1 80122.69        5
##    TRPMILAD R_AGE_IMP R_SEX_IMP VEHTYPE OBHUR DBHUR OTHTNRNT OTPPOPDN OTRESDN
## 1  5.847584        67         2       1     T     T       50     1500     750
## 2  5.741650        67         2       1     T     T       50      750     300
## 3 90.178294        66         1       4     S     T       40     1500     750
## 4 87.627658        66         1       4     T     S       50     1500     750
## 5  2.508975        28         2       1     T     T       50     1500     750
## 6  2.501169        28         2       1     T     T       50      750     300
##   OTEEMPDN OBHTNRNT OBPPOPDN OBRESDN DTHTNRNT DTPPOPDN DTRESDN DTEEMPDN
## 1      750       20      750     300       50      750     300      350
## 2      350       30      300     300       50     1500     750      750
## 3      750       40     1500     750       50     1500     750      750
## 4      750       20      750     300       40     1500     750      750
## 5      750       20      750     300       50      750     300      350
## 6      350       60      750     300       50     1500     750      750
##   DBHTNRNT DBPPOPDN DBRESDN
## 1       30      300     300
## 2       20      750     300
## 3       20      750     300
## 4       40     1500     750
## 5       60      750     300
## 6       20      750     300
#subset of Vermont data records

vt <- subset(x,HHSTATE =="VT")

head(vt)
##       HOUSEID TRAVDAY HOMEOWN HHSIZE HHVEHCNT HHFAMINC DRVRCNT HHSTATE HHSTFIPS
## 1811 30002242       7       1      3        2       10       2      VT       50
## 1812 30002242       7       1      3        2       10       2      VT       50
## 1813 30002242       7       1      3        2       10       2      VT       50
## 1814 30002242       7       1      3        2       10       2      VT       50
## 1815 30002242       7       1      3        2       10       2      VT       50
## 1816 30002242       7       1      3        2       10       2      VT       50
##      NUMADLT WRKCOUNT TDAYDATE HHRESP LIF_CYC MSACAT MSASIZE RAIL URBAN
## 1811       2        1   201608      1       6      3       1    2     1
## 1812       2        1   201608      1       6      3       1    2     1
## 1813       2        1   201608      1       6      3       1    2     1
## 1814       2        1   201608      1       6      3       1    2     1
## 1815       2        1   201608      1       6      3       1    2     1
## 1816       2        1   201608      1       6      3       1    2     1
##      URBANSIZE URBRUR CENSUS_D CENSUS_R CDIVMSAR HH_RACE HH_HISP HH_CBSA
## 1811         1      1        1        1       13       1       2   XXXXX
## 1812         1      1        1        1       13       1       2   XXXXX
## 1813         1      1        1        1       13       1       2   XXXXX
## 1814         1      1        1        1       13       1       2   XXXXX
## 1815         1      1        1        1       13       1       2   XXXXX
## 1816         1      1        1        1       13       1       2   XXXXX
##      SMPLSRCE SAMPSTRAT PC SPHONE TAB WALK BIKE CAR TAXI BUS TRAIN PARA PRICE
## 1811        1         3  1      1   3    1    3   1    4   5     5    5     2
## 1812        1         3  1      1   3    1    3   1    4   5     5    5     2
## 1813        1         3  1      1   3    1    3   1    4   5     5    5     2
## 1814        1         3  1      1   3    1    3   1    4   5     5    5     2
## 1815        1         3  1      1   3    1    3   1    4   5     5    5     2
## 1816        1         3  1      1   3    1    3   1    4   5     5    5     2
##      PLACE WALK2SAVE BIKE2SAVE PTRANS HHRELATD CNTTDHH YOUNGCHILD SCRESP
## 1811     3         4         4      4        1       9          0      1
## 1812     3         4         4      4        1       9          0      1
## 1813     3         4         4      4        1       9          0      1
## 1814     3         4         4      4        1       9          0      1
## 1815     3         4         4      4        1       9          0      1
## 1816     3         4         4      4        1       9          0      1
##      RESP_CNT WEBUSE17  WTHHFIN HBHUR HTHTNRNT HTPPOPDN HTRESDN HTEEMPDN
## 1811        3        1 407.8716     T       30     3000    1500     1500
## 1812        3        1 407.8716     T       30     3000    1500     1500
## 1813        3        1 407.8716     T       30     3000    1500     1500
## 1814        3        1 407.8716     T       30     3000    1500     1500
## 1815        3        1 407.8716     T       30     3000    1500     1500
## 1816        3        1 407.8716     T       30     3000    1500     1500
##      HBHTNRNT HBPPOPDN HBRESDN PERSONID TDTRPNUM STRTTIME ENDTIME TRVLCMIN
## 1811        5     3000    1500        1        1      700     800       60
## 1812        5     3000    1500        1        2     1430    1545       75
## 1813        5     3000    1500        1        3     2200    2250       50
## 1814        5     3000    1500        2        1      920     940       20
## 1815        5     3000    1500        2        2     1315    1335       20
## 1816        5     3000    1500        2        3     1430    1455       25
##      TRPMILES TRPTRANS TRPACCMP TRPHHACC VEHID TRWAITTM NUMTRANS TRACCTM
## 1811    1.222        1        1        0    -1       -1       -1      -1
## 1812    2.000        1        1        0    -1       -1       -1      -1
## 1813    0.889        1        1        0    -1       -1       -1      -1
## 1814    4.228        4        0        0     1       -1       -1      -1
## 1815    4.259        4        0        0     1       -1       -1      -1
## 1816    7.995        4        1        1     1       -1       -1      -1
##      DROP_PRK TREGRTM WHODROVE WHYFROM LOOP_TRIP TRPHHVEH HHMEMDRV HH_ONTD
## 1811       -1      -1       -1       1         1        2       -1       1
## 1812       -1      -1       -1       1         1        2       -1       1
## 1813       -1      -1       -1       1         1        2       -1       1
## 1814       -1      -1        2       1         2        1        1       1
## 1815       -1      -1        2       5         2        1        1       1
## 1816       -1      -1        2       1         2        1        1       2
##      NONHHCNT NUMONTRP PSGR_FLG PUBTRANS TRIPPURP DWELTIME TDWKND VMT_MILE
## 1811        1        2       -1        2      HBO      390      1   -1.000
## 1812        1        2       -1        2      HBO      375      1   -1.000
## 1813        1        2       -1        2      HBO       -9      1   -1.000
## 1814        0        1        2        2      HBO      215      1    4.228
## 1815        0        1        2        2      HBO       55      1    4.259
## 1816        0        2        2        2   HBSHOP      140      1    7.995
##      DRVR_FLG WHYTRP1S ONTD_P1 ONTD_P2 ONTD_P3 ONTD_P4 ONTD_P5 ONTD_P6 ONTD_P7
## 1811       -1        1       1       2       2      -1      -1      -1      -1
## 1812       -1        1       1       2       2      -1      -1      -1      -1
## 1813       -1        1       1       2       2      -1      -1      -1      -1
## 1814        1       97       2       1       2      -1      -1      -1      -1
## 1815        1        1       2       1       2      -1      -1      -1      -1
## 1816        1       40       2       1       1      -1      -1      -1      -1
##      ONTD_P8 ONTD_P9 ONTD_P10 ONTD_P11 ONTD_P12 ONTD_P13     TDCASEID TRACC_WLK
## 1811      -1      -1       -1       -1       -1       -1 300022420101        -1
## 1812      -1      -1       -1       -1       -1       -1 300022420102        -1
## 1813      -1      -1       -1       -1       -1       -1 300022420103        -1
## 1814      -1      -1       -1       -1       -1       -1 300022420201        -1
## 1815      -1      -1       -1       -1       -1       -1 300022420202        -1
## 1816      -1      -1       -1       -1       -1       -1 300022420203        -1
##      TRACC_POV TRACC_BUS TRACC_CRL TRACC_SUB TRACC_OTH TREGR_WLK TREGR_POV
## 1811        -1        -1        -1        -1        -1        -1        -1
## 1812        -1        -1        -1        -1        -1        -1        -1
## 1813        -1        -1        -1        -1        -1        -1        -1
## 1814        -1        -1        -1        -1        -1        -1        -1
## 1815        -1        -1        -1        -1        -1        -1        -1
## 1816        -1        -1        -1        -1        -1        -1        -1
##      TREGR_BUS TREGR_CRL TREGR_SUB TREGR_OTH WHYTO GASPRICE R_AGE EDUC R_SEX
## 1811        -1        -1        -1        -1     1    223.7    58    5     1
## 1812        -1        -1        -1        -1     1    223.7    58    5     1
## 1813        -1        -1        -1        -1     1    223.7    58    5     1
## 1814        -1        -1        -1        -1     5    223.7    52    3     2
## 1815        -1        -1        -1        -1     1    223.7    52    3     2
## 1816        -1        -1        -1        -1    11    223.7    52    3     2
##      PRMACT PROXY WORKER DRIVER WTTRDFIN WHYTRP90 TRPMILAD R_AGE_IMP R_SEX_IMP
## 1811      1     1      1      1 161532.5       10 1.222000        58         1
## 1812      1     1      1      1 161532.5       10 2.000000        58         1
## 1813      1     1      1      1 161532.5       10 0.889000        58         1
## 1814      4     1      2      1 138311.3        4 4.714643        52         2
## 1815      4     1      2      1 138311.3        4 4.749211        52         2
## 1816      4     1      2      1 138311.3        3 8.915225        52         2
##      VEHTYPE OBHUR DBHUR OTHTNRNT OTPPOPDN OTRESDN OTEEMPDN OBHTNRNT OBPPOPDN
## 1811      -1     T     T       30     3000    1500     1500        5     3000
## 1812      -1     T     T       30     3000    1500     1500        5     3000
## 1813      -1     T     T       30     3000    1500     1500        5     3000
## 1814       3     T     S       30     3000    1500     1500        5     3000
## 1815       3     S     T       30      300     300      150       70     7000
## 1816       3     T     S       30     3000    1500     1500        5     3000
##      OBRESDN DTHTNRNT DTPPOPDN DTRESDN DTEEMPDN DBHTNRNT DBPPOPDN DBRESDN
## 1811    1500       30     3000    1500     1500        5     3000    1500
## 1812    1500       30     3000    1500     1500        5     3000    1500
## 1813    1500       30     3000    1500     1500        5     3000    1500
## 1814    1500       30      300     300      150       70     7000    1500
## 1815    1500       30     3000    1500     1500        5     3000    1500
## 1816    1500       40     3000    1500     1500       50     1500     750
library(readxl)

IncCodes=read_excel("C:\\Users\\amuchene\\Downloads\\R training\\R training\\WS2\\Income Codes.xlsx")

TripCodes=read_excel("C:\\Users\\amuchene\\Downloads\\R training\\R training\\WS2\\Trip Codes.xlsx")

vt = merge(vt, IncCodes)

vt = merge(vt, TripCodes)

#create new data.frame with just the data we need

vt2=data.frame(vt$HHINC, vt$TRIPPUR, vt$TRPMILES)

#rename the columns to better organize things

names(vt2) = c("Income", "Trip_Purpose", "Miles")

head(vt2)
##                 Income Trip_Purpose  Miles
## 1         I don't know         Home 26.935
## 2 $125,000 to $149,999         Home  3.402
## 3   $50,000 to $74,999         Home  2.695
## 4         I don't know         Home  1.143
## 5         I don't know         Home  2.844
## 6   $35,000 to $49,999         Home  0.677