US Census data: population data. Visualizing some facts about the demographics in the US: http://www2.census.gov/programs-surveys/acs/tech_docs/pums/data_dict/PUMSDataDict13.txt
# Point R at the folder that holds the PUMS person files read by this script.
# NOTE(review): this absolute path is machine-specific; adjust it before running elsewhere.
setwd("C:\\Users\\Minerva\\Dropbox\\Desk2015\\Rwork-Datascience\\US_census\\pums")
# Population data, file A (first block of states; the preview below starts at ST = 1)
a <- read.csv("ss13pusa.csv")
# The data frame is deliberately not attach()ed: columns are reached through the
# data frame itself (or dplyr verbs), so no bare column names are placed on the
# search path where identically named columns from the second file could mask them.
head(a)
## RT SERIALNO SPORDER PUMA ST ADJINC PWGTP AGEP CIT CITWP COW DDRS DEAR
## 1 P 84 1 2600 1 1007549 65 19 1 NA NA 2 2
## 2 P 154 1 2500 1 1007549 51 55 1 NA 1 2 2
## 3 P 154 2 2500 1 1007549 62 56 1 NA 6 2 2
## 4 P 154 3 2500 1 1007549 232 21 1 NA NA 2 2
## 5 P 154 4 2500 1 1007549 97 21 1 NA NA 1 2
## 6 P 156 1 1700 1 1007549 449 63 1 NA 3 2 2
## DEYE DOUT DPHY DRAT DRATX DREM ENG FER GCL GCM GCR HINS1 HINS2 HINS3
## 1 2 2 2 NA NA 2 NA 2 NA NA NA 1 2 2
## 2 2 2 2 NA NA 2 NA NA 2 NA NA 1 2 2
## 3 2 2 2 NA NA 2 NA NA 2 NA NA 1 2 2
## 4 2 2 2 NA NA 2 NA NA NA NA NA 1 2 2
## 5 2 1 1 NA NA 2 NA 2 NA NA NA 1 2 2
## 6 2 2 2 NA NA 2 NA NA 2 NA NA 1 2 2
## HINS4 HINS5 HINS6 HINS7 INTP JWMNP JWRIP JWTR LANX MAR MARHD MARHM MARHT
## 1 2 2 2 2 0 NA NA NA 2 5 NA NA NA
## 2 2 2 2 2 0 30 1 1 2 1 2 2 1
## 3 2 2 2 2 0 NA NA 11 2 1 2 2 1
## 4 2 2 2 2 0 NA NA NA 2 5 NA NA NA
## 5 2 2 2 2 0 NA NA NA 2 5 NA NA NA
## 6 2 2 2 2 0 15 1 1 2 3 2 2 1
## MARHW MARHYP MIG MIL MLPA MLPB MLPCD MLPE MLPFG MLPH MLPI MLPJ MLPK NWAB
## 1 NA NA 1 4 NA NA NA NA NA NA NA NA NA 2
## 2 2 1990 1 4 NA NA NA NA NA NA NA NA NA 3
## 3 2 1990 1 4 NA NA NA NA NA NA NA NA NA 3
## 4 NA NA 1 4 NA NA NA NA NA NA NA NA NA 2
## 5 NA NA 1 4 NA NA NA NA NA NA NA NA NA 2
## 6 2 1972 1 4 NA NA NA NA NA NA NA NA NA 3
## NWAV NWLA NWLK NWRE OIP PAP RELP RETP SCH SCHG SCHL SEMP SEX SSIP SSP
## 1 5 2 2 3 0 0 17 0 2 15 19 0 2 0 0
## 2 5 3 3 3 0 0 0 0 1 NA 20 0 2 0 0
## 3 5 3 3 3 0 0 1 0 1 NA 16 99000 1 0 0
## 4 5 2 2 3 0 0 2 0 2 15 19 0 1 0 0
## 5 5 2 2 3 0 0 2 0 2 15 19 0 2 0 0
## 6 5 3 3 3 0 0 0 0 1 NA 21 0 2 0 930
## WAGP WKHP WKL WKW WRK YOEP ANC ANC1P ANC2P DECADE DIS DRIVESP ESP ESR
## 1 0 NA 3 NA 2 NA 4 999 999 NA 2 NA NA 6
## 2 52000 40 1 1 1 NA 1 902 999 NA 2 1 NA 1
## 3 0 40 1 1 1 NA 1 902 999 NA 2 NA NA 1
## 4 0 NA 3 NA 2 NA 1 902 999 NA 2 NA NA 6
## 5 0 NA 3 NA 2 NA 1 902 999 NA 1 NA NA 6
## 6 39000 40 1 1 1 NA 1 902 999 NA 2 1 NA 1
## FOD1P FOD2P HICOV HISP INDP JWAP JWDP LANP MIGPUMA MIGSP MSP NAICSP
## 1 NA NA 1 1 NA NA NA NA NA NA 6
## 2 NA NA 1 1 5380 100 55 NA NA NA 1 45211
## 3 NA NA 1 1 8880 NA NA NA NA NA 1 8114
## 4 NA NA 1 1 NA NA NA NA NA NA 6
## 5 NA NA 1 1 NA NA NA NA NA NA 6
## 6 6107 NA 1 1 7860 109 67 NA NA NA 4 6111
## NATIVITY NOP OC OCCP PAOC PERNP PINCP POBP POVPIP POWPUMA POWSP PRIVCOV
## 1 1 NA 0 NA NA 0 0 28 NA NA NA 1
## 2 1 NA 0 4700 4 52000 52000 1 501 2500 1 1
## 3 1 NA 0 7240 NA 99000 99000 1 501 2500 1 1
## 4 1 NA 0 NA NA 0 0 1 501 NA NA 1
## 5 1 NA 0 NA 4 0 0 1 501 NA NA 1
## 6 1 NA 0 2310 4 39000 39930 1 330 1700 1 1
## PUBCOV QTRBIR RAC1P RAC2P RAC3P RACAIAN RACASN RACBLK RACNH RACNUM RACPI
## 1 2 1 1 1 1 0 0 0 0 1 0
## 2 2 1 2 2 2 0 0 1 0 1 0
## 3 2 4 2 2 2 0 0 1 0 1 0
## 4 2 4 2 2 2 0 0 1 0 1 0
## 5 2 4 2 2 2 0 0 1 0 1 0
## 6 2 3 2 2 2 0 0 1 0 1 0
## RACSOR RACWHT RC SCIENGP SCIENGRLP SFN SFR SOCP VPS WAOB FAGEP FANCP
## 1 0 1 0 NA NA NA NA NA 1 0 0
## 2 0 0 0 NA NA NA NA 411011 NA 1 0 0
## 3 0 0 0 NA NA NA NA 493050 NA 1 0 0
## 4 0 0 0 NA NA NA NA NA 1 0 0
## 5 0 0 0 NA NA NA NA NA 1 0 0
## 6 0 0 0 2 1 NA NA 252020 NA 1 0 0
## FCITP FCITWP FCOWP FDDRSP FDEARP FDEYEP FDISP FDOUTP FDPHYP FDRATP
## 1 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0
## 6 0 0 1 0 0 0 0 0 0 0
## FDRATXP FDREMP FENGP FESRP FFERP FFODP FGCLP FGCMP FGCRP FHINS1P FHINS2P
## 1 0 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0 0
## 6 0 0 0 0 0 0 0 0 0 0 0
## FHINS3C FHINS3P FHINS4C FHINS4P FHINS5C FHINS5P FHINS6P FHINS7P FHISP
## 1 NA 0 NA 0 NA 0 0 0 0
## 2 NA 0 NA 0 NA 0 0 0 0
## 3 NA 0 NA 0 NA 0 0 0 0
## 4 NA 0 NA 0 NA 0 0 0 0
## 5 NA 0 NA 0 NA 0 0 0 0
## 6 NA 0 NA 0 NA 0 0 0 0
## FINDP FINTP FJWDP FJWMNP FJWRIP FJWTRP FLANP FLANXP FMARHDP FMARHMP
## 1 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0
## 6 1 1 1 1 0 0 0 0 1 0
## FMARHTP FMARHWP FMARHYP FMARP FMIGP FMIGSP FMILPP FMILSP FOCCP FOIP FPAP
## 1 0 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0 0
## 6 0 1 1 1 0 0 0 0 1 1 1
## FPERNP FPINCP FPOBP FPOWSP FPRIVCOVP FPUBCOVP FRACP FRELP FRETP FSCHGP
## 1 0 0 0 0 0 0 0 0 0 0
## 2 1 1 0 0 0 0 0 0 0 0
## 3 1 1 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0
## 6 1 1 0 0 0 0 0 0 1 0
## FSCHLP FSCHP FSEMP FSEXP FSSIP FSSP FWAGP FWKHP FWKLP FWKWP FWRKP FYOEP
## 1 0 0 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 1 0 0 0 0 0
## 3 0 0 1 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0 0 0
## 6 0 0 1 0 1 1 1 1 1 1 0 0
## pwgtp1 pwgtp2 pwgtp3 pwgtp4 pwgtp5 pwgtp6 pwgtp7 pwgtp8 pwgtp9 pwgtp10
## 1 5 127 65 66 69 5 120 66 63 5
## 2 45 51 53 50 100 79 78 50 19 57
## 3 66 67 60 66 108 106 102 63 21 72
## 4 244 211 224 187 368 324 335 239 63 321
## 5 106 97 87 92 162 146 184 110 30 99
## 6 481 575 807 739 153 173 722 455 158 671
## pwgtp11 pwgtp12 pwgtp13 pwgtp14 pwgtp15 pwgtp16 pwgtp17 pwgtp18 pwgtp19
## 1 67 6 5 137 124 65 66 64 63
## 2 89 46 67 109 50 18 17 18 46
## 3 107 53 74 133 61 19 22 17 54
## 4 299 211 209 412 230 63 93 75 279
## 5 127 90 110 177 113 29 29 26 95
## 6 681 469 402 118 339 436 443 393 161
## pwgtp20 pwgtp21 pwgtp22 pwgtp23 pwgtp24 pwgtp25 pwgtp26 pwgtp27 pwgtp28
## 1 6 131 6 62 63 60 126 6 66
## 2 88 49 50 49 65 13 16 16 54
## 3 102 57 55 54 69 19 18 20 69
## 4 308 206 309 230 281 66 76 128 300
## 5 187 102 110 78 107 29 31 35 109
## 6 411 467 387 127 150 553 514 133 613
## pwgtp29 pwgtp30 pwgtp31 pwgtp32 pwgtp33 pwgtp34 pwgtp35 pwgtp36 pwgtp37
## 1 68 120 66 126 115 5 5 63 66
## 2 85 48 14 49 50 11 56 83 71
## 3 101 66 20 60 58 17 58 107 91
## 4 421 167 68 296 221 71 264 393 294
## 5 145 114 29 99 83 37 101 154 155
## 6 562 151 196 431 576 710 378 481 504
## pwgtp38 pwgtp39 pwgtp40 pwgtp41 pwgtp42 pwgtp43 pwgtp44 pwgtp45 pwgtp46
## 1 66 62 5 118 6 64 66 62 124
## 2 108 54 81 43 52 50 63 17 15
## 3 114 64 104 70 66 58 72 19 16
## 4 305 193 372 274 222 261 236 110 65
## 5 132 109 161 115 114 83 125 32 22
## 6 530 760 409 560 403 638 516 100 150
## pwgtp47 pwgtp48 pwgtp49 pwgtp50 pwgtp51 pwgtp52 pwgtp53 pwgtp54 pwgtp55
## 1 6 63 68 132 62 119 126 6 5
## 2 15 47 88 47 13 51 52 20 53
## 3 21 68 111 58 19 59 57 18 63
## 4 63 235 343 246 77 197 228 73 228
## 5 39 107 133 129 32 98 93 40 93
## 6 660 454 179 793 723 450 528 168 355
## pwgtp56 pwgtp57 pwgtp58 pwgtp59 pwgtp60 pwgtp61 pwgtp62 pwgtp63 pwgtp64
## 1 68 72 65 66 125 5 123 62 64
## 2 84 78 75 53 15 55 55 58 65
## 3 97 87 93 68 19 59 71 65 73
## 4 339 349 359 262 68 193 283 230 230
## 5 145 150 126 129 38 102 106 95 120
## 6 445 465 426 228 575 386 433 166 230
## pwgtp65 pwgtp66 pwgtp67 pwgtp68 pwgtp69 pwgtp70 pwgtp71 pwgtp72 pwgtp73
## 1 65 6 123 65 67 6 68 6 5
## 2 110 82 90 50 12 55 87 52 60
## 3 126 94 102 61 20 60 96 57 70
## 4 313 355 441 278 76 151 346 259 248
## 5 141 131 174 104 31 123 186 84 87
## 6 797 571 155 556 596 170 162 530 602
## pwgtp74 pwgtp75 pwgtp76 pwgtp77 pwgtp78 pwgtp79 pwgtp80
## 1 127 119 63 68 67 64 122
## 2 84 50 15 15 20 50 16
## 3 116 60 17 21 19 58 18
## 4 422 284 91 68 72 195 94
## 5 180 88 25 25 23 101 36
## 6 579 341 378 387 421 621 486
nrow(a)
## [1] 1613672
# Population data, file B (remaining states; the preview below starts at ST = 29)
b <- read.csv("ss13pusb.csv")
# Not attach()ed: b carries the same column names as a, so attaching it would
# make every bare column name resolve to this file's rows only. All later steps
# work on explicit data frames instead.
head(b)
## RT SERIALNO SPORDER PUMA ST ADJINC PWGTP AGEP CIT CITWP COW DDRS DEAR
## 1 P 76 1 1802 29 1007549 229 21 1 NA 1 2 2
## 2 P 76 2 1802 29 1007549 278 22 1 NA 1 2 2
## 3 P 80 1 901 29 1007549 26 21 1 NA NA 2 2
## 4 P 86 1 1600 29 1007549 161 58 1 NA 1 2 2
## 5 P 86 2 1600 29 1007549 120 52 1 NA 6 2 2
## 6 P 192 1 901 29 1007549 123 46 1 NA 1 2 2
## DEYE DOUT DPHY DRAT DRATX DREM ENG FER GCL GCM GCR HINS1 HINS2 HINS3
## 1 2 2 2 NA NA 2 NA NA NA NA NA 1 2 2
## 2 2 2 2 NA NA 2 NA NA NA NA NA 1 2 2
## 3 2 2 2 NA NA 2 NA 2 NA NA NA 1 2 2
## 4 2 2 1 NA 2 2 NA NA 2 NA NA 2 2 1
## 5 2 2 2 NA NA 2 NA NA 2 NA NA 2 1 2
## 6 2 2 2 NA NA 2 NA NA 2 NA NA 1 2 2
## HINS4 HINS5 HINS6 HINS7 INTP JWMNP JWRIP JWTR LANX MAR MARHD MARHM MARHT
## 1 2 2 2 2 0 20 1 1 2 5 NA NA NA
## 2 2 2 2 2 0 20 1 1 2 5 NA NA NA
## 3 2 2 2 2 0 NA NA NA 2 5 NA NA NA
## 4 2 2 1 2 0 NA NA NA 2 1 2 2 2
## 5 2 2 2 2 0 20 1 1 2 1 2 2 2
## 6 2 2 2 2 350 50 1 1 2 1 2 2 1
## MARHW MARHYP MIG MIL MLPA MLPB MLPCD MLPE MLPFG MLPH MLPI MLPJ MLPK NWAB
## 1 NA NA 1 4 NA NA NA NA NA NA NA NA NA 3
## 2 NA NA 1 4 NA NA NA NA NA NA NA NA NA 3
## 3 NA NA 1 4 NA NA NA NA NA NA NA NA NA 2
## 4 2 2009 1 2 0 0 0 1 0 0 0 0 0 2
## 5 2 2009 1 4 NA NA NA NA NA NA NA NA NA 3
## 6 2 1997 1 4 NA NA NA NA NA NA NA NA NA 3
## NWAV NWLA NWLK NWRE OIP PAP RELP RETP SCH SCHG SCHL SEMP SEX SSIP SSP
## 1 5 3 3 3 0 0 0 0 2 15 19 0 1 0 0
## 2 5 3 3 3 0 0 12 0 2 15 19 0 1 0 0
## 3 5 2 2 3 0 0 17 0 3 15 19 0 2 0 0
## 4 5 2 2 3 0 0 0 0 1 NA 21 0 1 0 16000
## 5 5 3 3 3 0 0 1 0 1 NA 22 60000 2 0 0
## 6 5 3 3 3 0 0 0 0 1 NA 21 0 1 0 0
## WAGP WKHP WKL WKW WRK YOEP ANC ANC1P ANC2P DECADE DIS DRIVESP ESP ESR
## 1 20400 40 1 1 1 NA 1 902 999 NA 2 1 NA 1
## 2 16700 20 1 1 1 NA 1 902 999 NA 2 1 NA 1
## 3 0 NA 3 NA 2 NA 1 51 999 NA 2 NA NA 6
## 4 0 NA 2 NA 2 NA 1 22 999 NA 1 NA NA 6
## 5 0 50 1 1 1 NA 1 32 999 NA 2 1 NA 1
## 6 65000 40 1 1 1 NA 3 996 999 NA 2 1 NA 1
## FOD1P FOD2P HICOV HISP INDP JWAP JWDP LANP MIGPUMA MIGSP MSP NAICSP
## 1 NA NA 1 1 8660 194 115 NA NA NA 6 7211
## 2 NA NA 1 1 5090 86 43 NA NA NA 6 447
## 3 NA NA 1 1 NA NA NA NA NA NA 6
## 4 6203 NA 1 1 8770 NA NA NA NA NA 1 8111Z
## 5 6203 NA 1 1 7280 230 133 NA NA NA 1 5412
## 6 6203 NA 1 1 5790 92 43 NA NA NA 1 4MS
## NATIVITY NOP OC OCCP PAOC PERNP PINCP POBP POVPIP POWPUMA POWSP PRIVCOV
## 1 1 NA 0 5120 NA 20400 20400 29 170 1900 29 1
## 2 1 NA 0 4720 NA 16700 16700 29 139 1800 29 1
## 3 1 NA 0 NA NA 0 0 20 NA NA NA 1
## 4 1 NA 0 5860 NA 0 16000 29 490 NA NA 2
## 5 1 NA 0 800 4 60000 60000 29 490 1800 29 1
## 6 1 NA 0 800 NA 65000 65350 20 501 600 20 1
## PUBCOV QTRBIR RAC1P RAC2P RAC3P RACAIAN RACASN RACBLK RACNH RACNUM RACPI
## 1 2 1 2 2 2 0 0 1 0 1 0
## 2 2 4 2 2 2 0 0 1 0 1 0
## 3 2 1 1 1 1 0 0 0 0 1 0
## 4 1 1 1 1 1 0 0 0 0 1 0
## 5 2 3 1 1 1 0 0 0 0 1 0
## 6 2 2 1 1 1 0 0 0 0 1 0
## RACSOR RACWHT RC SCIENGP SCIENGRLP SFN SFR SOCP VPS WAOB FAGEP FANCP
## 1 0 0 0 NA NA NA NA 433031 NA 1 0 0
## 2 0 0 0 NA NA NA NA 412010 NA 1 0 0
## 3 0 1 0 NA NA NA NA NA 1 0 0
## 4 0 1 0 2 2 NA NA 439061 6 1 0 0
## 5 0 1 0 2 2 NA NA 132011 NA 1 0 0
## 6 0 1 0 2 2 NA NA 132011 NA 1 0 0
## FCITP FCITWP FCOWP FDDRSP FDEARP FDEYEP FDISP FDOUTP FDPHYP FDRATP
## 1 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0
## 6 0 0 0 0 0 0 0 0 0 0
## FDRATXP FDREMP FENGP FESRP FFERP FFODP FGCLP FGCMP FGCRP FHINS1P FHINS2P
## 1 0 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 1 0
## 3 0 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0 0
## 6 0 0 0 0 0 0 0 0 0 0 0
## FHINS3C FHINS3P FHINS4C FHINS4P FHINS5C FHINS5P FHINS6P FHINS7P FHISP
## 1 NA 0 NA 0 NA 0 0 0 0
## 2 NA 0 NA 0 NA 0 0 0 0
## 3 NA 0 NA 0 NA 0 0 0 0
## 4 0 0 NA 0 NA 0 0 0 0
## 5 NA 0 NA 0 NA 0 0 0 0
## 6 NA 1 NA 1 NA 1 1 1 0
## FINDP FINTP FJWDP FJWMNP FJWRIP FJWTRP FLANP FLANXP FMARHDP FMARHMP
## 1 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0
## 6 0 0 1 0 0 0 0 0 0 0
## FMARHTP FMARHWP FMARHYP FMARP FMIGP FMIGSP FMILPP FMILSP FOCCP FOIP FPAP
## 1 0 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0 0
## 6 0 0 0 0 0 0 0 0 0 0 0
## FPERNP FPINCP FPOBP FPOWSP FPRIVCOVP FPUBCOVP FRACP FRELP FRETP FSCHGP
## 1 0 0 0 0 0 0 0 0 0 0
## 2 1 1 0 0 1 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0
## 6 0 0 0 0 1 1 0 0 0 0
## FSCHLP FSCHP FSEMP FSEXP FSSIP FSSP FWAGP FWKHP FWKLP FWKWP FWRKP FYOEP
## 1 0 0 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 1 1 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0 0 0
## 6 0 0 0 0 0 0 0 0 0 0 0 0
## pwgtp1 pwgtp2 pwgtp3 pwgtp4 pwgtp5 pwgtp6 pwgtp7 pwgtp8 pwgtp9 pwgtp10
## 1 383 64 431 340 212 211 85 69 326 167
## 2 438 70 482 465 249 279 104 92 395 221
## 3 47 25 46 4 25 47 49 26 26 27
## 4 158 52 55 48 160 275 183 57 148 140
## 5 139 33 37 27 122 187 114 43 123 114
## 6 120 117 37 224 34 109 198 213 212 113
## pwgtp11 pwgtp12 pwgtp13 pwgtp14 pwgtp15 pwgtp16 pwgtp17 pwgtp18 pwgtp19
## 1 192 243 353 251 292 202 84 281 273
## 2 232 295 431 291 313 266 96 324 342
## 3 26 25 4 26 47 4 25 4 25
## 4 45 137 231 287 303 143 134 172 163
## 5 38 114 215 196 234 89 113 131 100
## 6 44 201 120 128 110 122 37 38 129
## pwgtp20 pwgtp21 pwgtp22 pwgtp23 pwgtp24 pwgtp25 pwgtp26 pwgtp27 pwgtp28
## 1 76 419 83 435 359 241 205 52 74
## 2 92 484 100 515 429 280 245 70 87
## 3 4 47 27 47 4 27 47 53 27
## 4 283 135 46 50 57 155 271 183 48
## 5 190 106 42 34 33 103 216 128 39
## 6 37 35 234 132 123 115 195 116 145
## pwgtp29 pwgtp30 pwgtp31 pwgtp32 pwgtp33 pwgtp34 pwgtp35 pwgtp36 pwgtp37
## 1 327 286 306 253 434 227 216 229 71
## 2 463 319 350 330 504 277 286 290 86
## 3 27 28 25 27 4 26 47 5 27
## 4 147 154 46 157 237 226 301 178 143
## 5 135 131 36 94 242 173 236 113 102
## 6 134 38 139 129 213 33 189 218 122
## pwgtp38 pwgtp39 pwgtp40 pwgtp41 pwgtp42 pwgtp43 pwgtp44 pwgtp45 pwgtp46
## 1 190 217 352 86 396 93 67 260 197
## 2 237 278 425 104 464 99 100 295 277
## 3 4 27 4 48 25 47 3 26 50
## 4 172 167 53 158 297 274 272 150 40
## 5 140 129 39 102 210 269 161 104 31
## 6 134 45 137 102 140 215 40 210 136
## pwgtp47 pwgtp48 pwgtp49 pwgtp50 pwgtp51 pwgtp52 pwgtp53 pwgtp54 pwgtp55
## 1 433 411 53 183 234 175 76 242 232
## 2 492 466 64 254 242 229 83 282 294
## 3 46 27 27 26 26 26 4 26 49
## 4 183 354 158 162 245 171 43 40 63
## 5 128 245 132 112 229 107 38 31 30
## 6 41 34 35 120 220 38 122 115 122
## pwgtp56 pwgtp57 pwgtp58 pwgtp59 pwgtp60 pwgtp61 pwgtp62 pwgtp63 pwgtp64
## 1 234 402 258 250 446 78 386 72 68
## 2 324 460 307 326 536 89 498 90 79
## 3 4 26 4 25 4 47 25 49 4
## 4 155 145 170 141 60 117 269 269 279
## 5 96 117 156 132 39 95 215 182 197
## 6 149 193 216 114 211 220 42 148 139
## pwgtp65 pwgtp66 pwgtp67 pwgtp68 pwgtp69 pwgtp70 pwgtp71 pwgtp72 pwgtp73
## 1 215 205 368 399 72 300 246 231 89
## 2 243 260 422 524 83 310 309 285 103
## 3 27 48 50 25 26 26 26 27 3
## 4 152 53 196 277 189 151 238 138 46
## 5 125 44 144 202 147 96 225 138 39
## 6 112 35 121 110 103 197 116 115 33
## pwgtp74 pwgtp75 pwgtp76 pwgtp77 pwgtp78 pwgtp79 pwgtp80
## 1 243 247 187 305 207 174 58
## 2 291 298 258 398 269 209 69
## 3 26 50 4 26 4 26 4
## 4 45 49 184 137 182 167 388
## 5 34 30 110 127 116 116 283
## 6 214 36 33 141 135 203 117
nrow(b)
## [1] 1519123
## Stack the rows of both person files into a single data frame
total <- rbind(a, b)
#nrow(total)
# ST contains state codes (1 is Alabama and so on); store it as a factor so
# each code is treated as a category rather than a number.
total[["ST"]] <- as.factor(total[["ST"]])
class(total[["ST"]])
## [1] "factor"
library(dplyr)
##
## Attaching package: 'dplyr'
##
## The following objects are masked from 'package:stats':
##
## filter, lag
##
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
library(ggplot2)
head(total)
## RT SERIALNO SPORDER PUMA ST ADJINC PWGTP AGEP CIT CITWP COW DDRS DEAR
## 1 P 84 1 2600 1 1007549 65 19 1 NA NA 2 2
## 2 P 154 1 2500 1 1007549 51 55 1 NA 1 2 2
## 3 P 154 2 2500 1 1007549 62 56 1 NA 6 2 2
## 4 P 154 3 2500 1 1007549 232 21 1 NA NA 2 2
## 5 P 154 4 2500 1 1007549 97 21 1 NA NA 1 2
## 6 P 156 1 1700 1 1007549 449 63 1 NA 3 2 2
## DEYE DOUT DPHY DRAT DRATX DREM ENG FER GCL GCM GCR HINS1 HINS2 HINS3
## 1 2 2 2 NA NA 2 NA 2 NA NA NA 1 2 2
## 2 2 2 2 NA NA 2 NA NA 2 NA NA 1 2 2
## 3 2 2 2 NA NA 2 NA NA 2 NA NA 1 2 2
## 4 2 2 2 NA NA 2 NA NA NA NA NA 1 2 2
## 5 2 1 1 NA NA 2 NA 2 NA NA NA 1 2 2
## 6 2 2 2 NA NA 2 NA NA 2 NA NA 1 2 2
## HINS4 HINS5 HINS6 HINS7 INTP JWMNP JWRIP JWTR LANX MAR MARHD MARHM MARHT
## 1 2 2 2 2 0 NA NA NA 2 5 NA NA NA
## 2 2 2 2 2 0 30 1 1 2 1 2 2 1
## 3 2 2 2 2 0 NA NA 11 2 1 2 2 1
## 4 2 2 2 2 0 NA NA NA 2 5 NA NA NA
## 5 2 2 2 2 0 NA NA NA 2 5 NA NA NA
## 6 2 2 2 2 0 15 1 1 2 3 2 2 1
## MARHW MARHYP MIG MIL MLPA MLPB MLPCD MLPE MLPFG MLPH MLPI MLPJ MLPK NWAB
## 1 NA NA 1 4 NA NA NA NA NA NA NA NA NA 2
## 2 2 1990 1 4 NA NA NA NA NA NA NA NA NA 3
## 3 2 1990 1 4 NA NA NA NA NA NA NA NA NA 3
## 4 NA NA 1 4 NA NA NA NA NA NA NA NA NA 2
## 5 NA NA 1 4 NA NA NA NA NA NA NA NA NA 2
## 6 2 1972 1 4 NA NA NA NA NA NA NA NA NA 3
## NWAV NWLA NWLK NWRE OIP PAP RELP RETP SCH SCHG SCHL SEMP SEX SSIP SSP
## 1 5 2 2 3 0 0 17 0 2 15 19 0 2 0 0
## 2 5 3 3 3 0 0 0 0 1 NA 20 0 2 0 0
## 3 5 3 3 3 0 0 1 0 1 NA 16 99000 1 0 0
## 4 5 2 2 3 0 0 2 0 2 15 19 0 1 0 0
## 5 5 2 2 3 0 0 2 0 2 15 19 0 2 0 0
## 6 5 3 3 3 0 0 0 0 1 NA 21 0 2 0 930
## WAGP WKHP WKL WKW WRK YOEP ANC ANC1P ANC2P DECADE DIS DRIVESP ESP ESR
## 1 0 NA 3 NA 2 NA 4 999 999 NA 2 NA NA 6
## 2 52000 40 1 1 1 NA 1 902 999 NA 2 1 NA 1
## 3 0 40 1 1 1 NA 1 902 999 NA 2 NA NA 1
## 4 0 NA 3 NA 2 NA 1 902 999 NA 2 NA NA 6
## 5 0 NA 3 NA 2 NA 1 902 999 NA 1 NA NA 6
## 6 39000 40 1 1 1 NA 1 902 999 NA 2 1 NA 1
## FOD1P FOD2P HICOV HISP INDP JWAP JWDP LANP MIGPUMA MIGSP MSP NAICSP
## 1 NA NA 1 1 NA NA NA NA NA NA 6
## 2 NA NA 1 1 5380 100 55 NA NA NA 1 45211
## 3 NA NA 1 1 8880 NA NA NA NA NA 1 8114
## 4 NA NA 1 1 NA NA NA NA NA NA 6
## 5 NA NA 1 1 NA NA NA NA NA NA 6
## 6 6107 NA 1 1 7860 109 67 NA NA NA 4 6111
## NATIVITY NOP OC OCCP PAOC PERNP PINCP POBP POVPIP POWPUMA POWSP PRIVCOV
## 1 1 NA 0 NA NA 0 0 28 NA NA NA 1
## 2 1 NA 0 4700 4 52000 52000 1 501 2500 1 1
## 3 1 NA 0 7240 NA 99000 99000 1 501 2500 1 1
## 4 1 NA 0 NA NA 0 0 1 501 NA NA 1
## 5 1 NA 0 NA 4 0 0 1 501 NA NA 1
## 6 1 NA 0 2310 4 39000 39930 1 330 1700 1 1
## PUBCOV QTRBIR RAC1P RAC2P RAC3P RACAIAN RACASN RACBLK RACNH RACNUM RACPI
## 1 2 1 1 1 1 0 0 0 0 1 0
## 2 2 1 2 2 2 0 0 1 0 1 0
## 3 2 4 2 2 2 0 0 1 0 1 0
## 4 2 4 2 2 2 0 0 1 0 1 0
## 5 2 4 2 2 2 0 0 1 0 1 0
## 6 2 3 2 2 2 0 0 1 0 1 0
## RACSOR RACWHT RC SCIENGP SCIENGRLP SFN SFR SOCP VPS WAOB FAGEP FANCP
## 1 0 1 0 NA NA NA NA NA 1 0 0
## 2 0 0 0 NA NA NA NA 411011 NA 1 0 0
## 3 0 0 0 NA NA NA NA 493050 NA 1 0 0
## 4 0 0 0 NA NA NA NA NA 1 0 0
## 5 0 0 0 NA NA NA NA NA 1 0 0
## 6 0 0 0 2 1 NA NA 252020 NA 1 0 0
## FCITP FCITWP FCOWP FDDRSP FDEARP FDEYEP FDISP FDOUTP FDPHYP FDRATP
## 1 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0
## 6 0 0 1 0 0 0 0 0 0 0
## FDRATXP FDREMP FENGP FESRP FFERP FFODP FGCLP FGCMP FGCRP FHINS1P FHINS2P
## 1 0 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0 0
## 6 0 0 0 0 0 0 0 0 0 0 0
## FHINS3C FHINS3P FHINS4C FHINS4P FHINS5C FHINS5P FHINS6P FHINS7P FHISP
## 1 NA 0 NA 0 NA 0 0 0 0
## 2 NA 0 NA 0 NA 0 0 0 0
## 3 NA 0 NA 0 NA 0 0 0 0
## 4 NA 0 NA 0 NA 0 0 0 0
## 5 NA 0 NA 0 NA 0 0 0 0
## 6 NA 0 NA 0 NA 0 0 0 0
## FINDP FINTP FJWDP FJWMNP FJWRIP FJWTRP FLANP FLANXP FMARHDP FMARHMP
## 1 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0
## 6 1 1 1 1 0 0 0 0 1 0
## FMARHTP FMARHWP FMARHYP FMARP FMIGP FMIGSP FMILPP FMILSP FOCCP FOIP FPAP
## 1 0 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0 0
## 6 0 1 1 1 0 0 0 0 1 1 1
## FPERNP FPINCP FPOBP FPOWSP FPRIVCOVP FPUBCOVP FRACP FRELP FRETP FSCHGP
## 1 0 0 0 0 0 0 0 0 0 0
## 2 1 1 0 0 0 0 0 0 0 0
## 3 1 1 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0
## 6 1 1 0 0 0 0 0 0 1 0
## FSCHLP FSCHP FSEMP FSEXP FSSIP FSSP FWAGP FWKHP FWKLP FWKWP FWRKP FYOEP
## 1 0 0 0 0 0 0 0 0 0 0 0 0
## 2 0 0 0 0 0 0 1 0 0 0 0 0
## 3 0 0 1 0 0 0 0 0 0 0 0 0
## 4 0 0 0 0 0 0 0 0 0 0 0 0
## 5 0 0 0 0 0 0 0 0 0 0 0 0
## 6 0 0 1 0 1 1 1 1 1 1 0 0
## pwgtp1 pwgtp2 pwgtp3 pwgtp4 pwgtp5 pwgtp6 pwgtp7 pwgtp8 pwgtp9 pwgtp10
## 1 5 127 65 66 69 5 120 66 63 5
## 2 45 51 53 50 100 79 78 50 19 57
## 3 66 67 60 66 108 106 102 63 21 72
## 4 244 211 224 187 368 324 335 239 63 321
## 5 106 97 87 92 162 146 184 110 30 99
## 6 481 575 807 739 153 173 722 455 158 671
## pwgtp11 pwgtp12 pwgtp13 pwgtp14 pwgtp15 pwgtp16 pwgtp17 pwgtp18 pwgtp19
## 1 67 6 5 137 124 65 66 64 63
## 2 89 46 67 109 50 18 17 18 46
## 3 107 53 74 133 61 19 22 17 54
## 4 299 211 209 412 230 63 93 75 279
## 5 127 90 110 177 113 29 29 26 95
## 6 681 469 402 118 339 436 443 393 161
## pwgtp20 pwgtp21 pwgtp22 pwgtp23 pwgtp24 pwgtp25 pwgtp26 pwgtp27 pwgtp28
## 1 6 131 6 62 63 60 126 6 66
## 2 88 49 50 49 65 13 16 16 54
## 3 102 57 55 54 69 19 18 20 69
## 4 308 206 309 230 281 66 76 128 300
## 5 187 102 110 78 107 29 31 35 109
## 6 411 467 387 127 150 553 514 133 613
## pwgtp29 pwgtp30 pwgtp31 pwgtp32 pwgtp33 pwgtp34 pwgtp35 pwgtp36 pwgtp37
## 1 68 120 66 126 115 5 5 63 66
## 2 85 48 14 49 50 11 56 83 71
## 3 101 66 20 60 58 17 58 107 91
## 4 421 167 68 296 221 71 264 393 294
## 5 145 114 29 99 83 37 101 154 155
## 6 562 151 196 431 576 710 378 481 504
## pwgtp38 pwgtp39 pwgtp40 pwgtp41 pwgtp42 pwgtp43 pwgtp44 pwgtp45 pwgtp46
## 1 66 62 5 118 6 64 66 62 124
## 2 108 54 81 43 52 50 63 17 15
## 3 114 64 104 70 66 58 72 19 16
## 4 305 193 372 274 222 261 236 110 65
## 5 132 109 161 115 114 83 125 32 22
## 6 530 760 409 560 403 638 516 100 150
## pwgtp47 pwgtp48 pwgtp49 pwgtp50 pwgtp51 pwgtp52 pwgtp53 pwgtp54 pwgtp55
## 1 6 63 68 132 62 119 126 6 5
## 2 15 47 88 47 13 51 52 20 53
## 3 21 68 111 58 19 59 57 18 63
## 4 63 235 343 246 77 197 228 73 228
## 5 39 107 133 129 32 98 93 40 93
## 6 660 454 179 793 723 450 528 168 355
## pwgtp56 pwgtp57 pwgtp58 pwgtp59 pwgtp60 pwgtp61 pwgtp62 pwgtp63 pwgtp64
## 1 68 72 65 66 125 5 123 62 64
## 2 84 78 75 53 15 55 55 58 65
## 3 97 87 93 68 19 59 71 65 73
## 4 339 349 359 262 68 193 283 230 230
## 5 145 150 126 129 38 102 106 95 120
## 6 445 465 426 228 575 386 433 166 230
## pwgtp65 pwgtp66 pwgtp67 pwgtp68 pwgtp69 pwgtp70 pwgtp71 pwgtp72 pwgtp73
## 1 65 6 123 65 67 6 68 6 5
## 2 110 82 90 50 12 55 87 52 60
## 3 126 94 102 61 20 60 96 57 70
## 4 313 355 441 278 76 151 346 259 248
## 5 141 131 174 104 31 123 186 84 87
## 6 797 571 155 556 596 170 162 530 602
## pwgtp74 pwgtp75 pwgtp76 pwgtp77 pwgtp78 pwgtp79 pwgtp80
## 1 127 119 63 68 67 64 122
## 2 84 50 15 15 20 50 16
## 3 116 60 17 21 19 58 18
## 4 422 284 91 68 72 195 94
## 5 180 88 25 25 23 101 36
## 6 579 341 378 387 421 621 486
## States by citizenship status
# CIT codes, per the PUMS data dictionary:
#   1 = born in the US
#   2 = born in Puerto Rico, Guam, the US Virgin Islands or the Northern Marianas
#   3 = born abroad of American parent(s)
#   4 = US citizen by naturalization
#   5 = not a US citizen
# NOTE(review): the tallies below count sample records per state; the person
# weight PWGTP is not applied, so they are not population estimates. Confirm
# that this is intended.

# Count, for every state, the records whose CIT equals `cit_code`.
#   data     : data frame with columns ST and CIT
#   cit_code : single CIT code to tally
# Returns one row per ST with the tally in column `citl`. Missing CIT values
# are skipped (na.rm = TRUE), matching the DDRS summaries later in the script.
count_cit_by_state <- function(data, cit_code) {
  data %>%
    group_by(ST) %>%
    summarize(citl = sum(CIT == cit_code, na.rm = TRUE))
}

# Bar chart with one bar per state.
#   counts  : result of count_cit_by_state() (columns ST and citl)
#   y_label : text for the y axis
# Returns the ggplot object; calling it at top level prints the chart.
plot_cit_by_state <- function(counts, y_label) {
  ggplot(data = counts, aes(x = ST, y = citl, fill = ST)) +
    geom_bar(stat = "identity") +
    xlab("States") +
    ylab(y_label)
}

# CIT == 1: born in the US (axis label kept as originally written)
t <- count_cit_by_state(total, 1)
#plot(t$citl~t$ST)
plot_cit_by_state(t, "US Citizens")

# States with people born in Guam, PR and the other US island areas (CIT == 2)
t2 <- count_cit_by_state(total, 2)
plot_cit_by_state(t2, "People born in Guam etc")

# States with people born abroad to American parents (CIT == 3)
t3 <- count_cit_by_state(total, 3)
plot_cit_by_state(t3, "People born abroad to American parents")

# States with naturalized American people (CIT == 4)
t4 <- count_cit_by_state(total, 4)
plot_cit_by_state(t4, "Naturalized American people")
An analysis of the citizenship data above suggests that state #5 (Arkansas) has the largest population of US citizens and of naturalized Americans. The second-highest number of naturalized Americans is found in Delaware.
Next, examine self-care difficulty, recorded in DDRS (1 = yes, 2 = no).
## Self-care difficulty (DDRS) tallied per state
# DDRS == 1 means "yes"; records with a missing DDRS are skipped via na.rm.
d <- total %>%
  group_by(ST) %>%
  summarise(yes = sum(DDRS == 1, na.rm = TRUE))
ggplot(d, aes(x = ST, y = yes, fill = ST)) +
  geom_bar(stat = "identity") +
  labs(x = "States", y = "People with self care difficulties")
# DDRS == 2 means "no"; same tally for people without self-care difficulties.
d2 <- total %>%
  group_by(ST) %>%
  summarise(no = sum(DDRS == 2, na.rm = TRUE))
head(d2)
## Source: local data frame [6 x 2]
##
## ST no
## (fctr) (int)
## 1 1 43184
## 2 2 6083
## 3 4 60626
## 4 5 26750
## 5 6 338819
## 6 8 47870
ggplot(d2, aes(x = ST, y = no, fill = ST)) +
  geom_bar(stat = "identity") +
  labs(x = "States", y = "People with no self care difficulties")