library(readxl)
# Import the veterans employment outcomes workbook from the Desktop folder.
veopu <- read_excel(path = "~/Desktop/data selection/veopu.xlsx")
## New names:
## • `` -> `...2`
## • `` -> `...3`
## • `` -> `...4`
## • `` -> `...5`
## • `` -> `...6`
## • `` -> `...7`
## • `` -> `...8`
## • `` -> `...9`
## • `` -> `...10`
## • `` -> `...11`
## • `` -> `...12`
## • `` -> `...13`
## • `` -> `...14`
## • `` -> `...15`
## • `` -> `...16`
## • `` -> `...17`
## • `` -> `...18`
## • `` -> `...19`
## • `` -> `...20`
## • `` -> `...21`
## • `` -> `...22`
## • `` -> `...23`
## • `` -> `...24`
## • `` -> `...25`
## • `` -> `...26`
## • `` -> `...27`
## • `` -> `...28`
## • `` -> `...29`
## • `` -> `...30`
## • `` -> `...31`
## • `` -> `...32`
## • `` -> `...33`
## • `` -> `...34`
# Exploring the data set ----
# summary() reports length, class, and mode for each column. In the output
# below all 34 columns are character vectors of length 153.
# NOTE(review): the first column is named after what looks like the sheet
# title and the rest are auto-named ...2 to ...34, which suggests the real
# header row sits further down the sheet; read_excel(skip = ) may be
# needed. TODO confirm against the workbook.
summary(veopu)
## Veterans Employment Outcomes By DOD Occupation and Pay Grade
## Length:153
## Class :character
## Mode :character
## ...2 ...3 ...4 ...5
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...6 ...7 ...8 ...9
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...10 ...11 ...12 ...13
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...14 ...15 ...16 ...17
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...18 ...19 ...20 ...21
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...22 ...23 ...24 ...25
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...26 ...27 ...28 ...29
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...30 ...31 ...32 ...33
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...34
## Length:153
## Class :character
## Mode :character
# sheet = "By DOD Occupation-Geography",
# col_types = c("text", "text", "text", "text", "text", "text", "text", "text", "text", "text", "numeric", "numeric", "numeric", "numeric", "numeric", "numeric", "numeric", "numeric", "numeric", "numeric", "text", "text", "text", "text", "text", "text", "text", "text"))
# When I ran the code above without the leading #, R produced a very large number of errors, so I have commented it out so that the submission is not pages of error messages, but I still want the attempt to show.
# Exploring the data set, part 2 ----
# The re-import attempt above is commented out, so `veopu` has not changed
# since it was first read and this call repeats the earlier summary.
summary(veopu)
## Veterans Employment Outcomes By DOD Occupation and Pay Grade
## Length:153
## Class :character
## Mode :character
## ...2 ...3 ...4 ...5
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...6 ...7 ...8 ...9
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...10 ...11 ...12 ...13
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...14 ...15 ...16 ...17
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...18 ...19 ...20 ...21
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...22 ...23 ...24 ...25
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...26 ...27 ...28 ...29
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...30 ...31 ...32 ...33
## Length:153 Length:153 Length:153 Length:153
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
## ...34
## Length:153
## Class :character
## Mode :character
library(readxl)
# Import the district workbook (.xls) from the same Desktop folder.
district <- read_excel(path = "~/Desktop/data selection/district.xls")
# Explore the data set, part 3 ----
# Per-column summary of the district data: quartiles, mean, and NA counts for
# numeric columns; length, class, and mode for character columns.
# NOTE(review): many rate and score columns show a minimum of -1 or -2 in the
# output below. These look like sentinel codes rather than real measurements.
# TODO confirm against the data dictionary before using means or correlations.
summary(district)
## DISTNAME DISTRICT DZCNTYNM REGION
## Length:1207 Length:1207 Length:1207 Length:1207
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
##
##
##
##
## DZRATING DZCAMPUS DPETALLC DPETBLAP
## Length:1207 Min. : 1.000 Min. : 4.0 Min. : 0.000
## Class :character 1st Qu.: 2.000 1st Qu.: 337.5 1st Qu.: 0.700
## Mode :character Median : 3.000 Median : 884.0 Median : 2.900
## Mean : 7.428 Mean : 4476.3 Mean : 8.765
## 3rd Qu.: 5.000 3rd Qu.: 2746.0 3rd Qu.:10.750
## Max. :273.000 Max. :193727.0 Max. :98.100
##
## DPETHISP DPETWHIP DPETINDP DPETASIP
## Min. : 0.00 Min. : 0.00 Min. : 0.0000 Min. : 0.000
## 1st Qu.: 21.00 1st Qu.:18.55 1st Qu.: 0.0000 1st Qu.: 0.000
## Median : 37.90 Median :44.40 Median : 0.2000 Median : 0.400
## Mean : 43.29 Mean :43.15 Mean : 0.3283 Mean : 1.614
## 3rd Qu.: 61.90 3rd Qu.:67.75 3rd Qu.: 0.4000 3rd Qu.: 1.000
## Max. :100.00 Max. :97.10 Max. :19.8000 Max. :54.300
##
## DPETPCIP DPETTWOP DPETECOP DPETLEPP
## Min. : 0.0000 Min. : 0.000 Min. : 0.00 Min. : 0.00
## 1st Qu.: 0.0000 1st Qu.: 1.200 1st Qu.: 47.95 1st Qu.: 2.90
## Median : 0.0000 Median : 2.400 Median : 61.90 Median : 7.50
## Mean : 0.1005 Mean : 2.758 Mean : 60.75 Mean : 12.69
## 3rd Qu.: 0.1000 3rd Qu.: 3.900 3rd Qu.: 77.15 3rd Qu.: 17.00
## Max. :14.5000 Max. :15.000 Max. :100.00 Max. :100.00
##
## DPETSPEP DPETBILP DPETVOCP DPETGIFP
## Min. : 0.00 Min. : 0.00 Min. : 0.00 Min. : 0.000
## 1st Qu.: 9.90 1st Qu.: 2.90 1st Qu.:23.00 1st Qu.: 3.100
## Median :12.10 Median : 7.30 Median :27.80 Median : 5.400
## Mean :12.27 Mean : 12.58 Mean :26.47 Mean : 5.574
## 3rd Qu.:14.20 3rd Qu.: 16.80 3rd Qu.:32.90 3rd Qu.: 7.500
## Max. :51.70 Max. :100.00 Max. :82.80 Max. :100.000
##
## DA0AT21R DA0912DR21R DAGC4X21R DAGC5X20R
## Min. : -1.00 Min. :-1.000 Min. : -1.00 Min. : -1.00
## 1st Qu.: 94.05 1st Qu.: 0.000 1st Qu.: 93.20 1st Qu.: 95.50
## Median : 95.40 Median : 0.400 Median : 96.90 Median : 98.30
## Mean : 94.76 Mean : 1.243 Mean : 93.91 Mean : 95.76
## 3rd Qu.: 96.40 3rd Qu.: 1.400 3rd Qu.:100.00 3rd Qu.:100.00
## Max. :100.00 Max. :50.500 Max. :100.00 Max. :100.00
## NA's :4 NA's :112 NA's :133 NA's :141
## DAGC6X19R DA0GR21N DA0GS21N DDA00A001S22R
## Min. : -1.00 Min. : 1.0 Min. : 0.0 Min. : 4.00
## 1st Qu.: 95.20 1st Qu.: 29.0 1st Qu.: 26.0 1st Qu.: 68.00
## Median : 98.20 Median : 69.0 Median : 61.0 Median : 76.00
## Mean : 95.72 Mean : 331.6 Mean : 278.9 Mean : 74.77
## 3rd Qu.:100.00 3rd Qu.: 208.0 3rd Qu.: 167.0 3rd Qu.: 83.00
## Max. :100.00 Max. :11588.0 Max. :9607.0 Max. :100.00
## NA's :149 NA's :126 NA's :126 NA's :5
## DDA00A001222R DDA00A001322R DDA00AR01S22R DDA00AR01222R
## Min. : 0.00 Min. : 0.00 Min. : -1.00 Min. : -1.00
## 1st Qu.:37.00 1st Qu.:15.00 1st Qu.: 70.00 1st Qu.: 43.00
## Median :46.00 Median :20.00 Median : 77.00 Median : 52.00
## Mean :46.48 Mean :21.05 Mean : 76.22 Mean : 52.12
## 3rd Qu.:55.00 3rd Qu.:26.00 3rd Qu.: 84.00 3rd Qu.: 61.00
## Max. :88.00 Max. :64.00 Max. :100.00 Max. :100.00
## NA's :5 NA's :5 NA's :5 NA's :5
## DDA00AR01322R DDA00AM01S22R DDA00AM01222R DDA00AM01322R
## Min. :-1.00 Min. : -1.00 Min. :-1.00 Min. :-1.00
## 1st Qu.:17.00 1st Qu.: 66.00 1st Qu.:30.00 1st Qu.:11.00
## Median :22.00 Median : 74.00 Median :40.00 Median :17.00
## Mean :23.64 Mean : 72.78 Mean :40.51 Mean :18.21
## 3rd Qu.:29.00 3rd Qu.: 82.00 3rd Qu.:50.00 3rd Qu.:23.00
## Max. :66.00 Max. :100.00 Max. :91.00 Max. :65.00
## NA's :5 NA's :5 NA's :5 NA's :5
## DDA00AC01S22R DDA00AC01222R DDA00AC01322R DDA00AS01S22R
## Min. : -1.00 Min. : -1.00 Min. :-1.00 Min. : -1.00
## 1st Qu.: 68.00 1st Qu.: 34.00 1st Qu.:10.00 1st Qu.: 66.00
## Median : 77.00 Median : 44.00 Median :16.00 Median : 75.00
## Mean : 75.04 Mean : 44.29 Mean :17.39 Mean : 73.09
## 3rd Qu.: 85.00 3rd Qu.: 55.00 3rd Qu.:23.00 3rd Qu.: 83.00
## Max. :100.00 Max. :100.00 Max. :56.00 Max. :100.00
## NA's :11 NA's :11 NA's :11 NA's :43
## DDA00AS01222R DDA00AS01322R DDB00A001S22R DDB00A001222R
## Min. : -1.0 Min. :-1.00 Min. : -1.00 Min. : -1.0
## 1st Qu.: 37.0 1st Qu.:17.00 1st Qu.: 50.00 1st Qu.: 21.0
## Median : 46.0 Median :24.00 Median : 63.00 Median : 31.0
## Mean : 45.7 Mean :25.29 Mean : 57.65 Mean : 31.5
## 3rd Qu.: 55.0 3rd Qu.:32.00 3rd Qu.: 74.50 3rd Qu.: 43.0
## Max. :100.0 Max. :77.00 Max. :100.00 Max. :100.0
## NA's :43 NA's :43 NA's :192 NA's :192
## DDB00A001322R DDH00A001S22R DDH00A001222R DDH00A001322R
## Min. :-1.00 Min. : -1.0 Min. : -1.00 Min. :-1.00
## 1st Qu.: 5.00 1st Qu.: 66.0 1st Qu.: 34.00 1st Qu.:12.00
## Median :11.00 Median : 73.0 Median : 41.00 Median :16.00
## Mean :12.45 Mean : 71.7 Mean : 41.63 Mean :16.86
## 3rd Qu.:17.00 3rd Qu.: 80.0 3rd Qu.: 49.00 3rd Qu.:21.00
## Max. :90.00 Max. :100.0 Max. :100.00 Max. :59.00
## NA's :192 NA's :6 NA's :6 NA's :6
## DDW00A001S22R DDW00A001222R DDW00A001322R DDI00A001S22R
## Min. : -1.00 Min. : -1.00 Min. :-1.00 Min. : -1.0
## 1st Qu.: 75.00 1st Qu.: 45.00 1st Qu.:19.00 1st Qu.: -1.0
## Median : 82.00 Median : 54.00 Median :26.00 Median : 66.0
## Mean : 78.69 Mean : 53.24 Mean :26.15 Mean : 50.8
## 3rd Qu.: 88.00 3rd Qu.: 63.00 3rd Qu.:33.00 3rd Qu.: 83.0
## Max. :100.00 Max. :100.00 Max. :79.00 Max. :100.0
## NA's :26 NA's :26 NA's :26 NA's :472
## DDI00A001222R DDI00A001322R DD300A001S22R DD300A001222R
## Min. : -1.00 Min. : -1.00 Min. : -1.0 Min. : -1.00
## 1st Qu.: -1.00 1st Qu.: -1.00 1st Qu.: 50.0 1st Qu.: 17.00
## Median : 35.00 Median : 11.00 Median : 89.0 Median : 67.00
## Mean : 32.08 Mean : 14.35 Mean : 67.8 Mean : 53.76
## 3rd Qu.: 54.00 3rd Qu.: 23.00 3rd Qu.: 96.0 3rd Qu.: 80.00
## Max. :100.00 Max. :100.00 Max. :100.0 Max. :100.00
## NA's :472 NA's :472 NA's :423 NA's :423
## DD300A001322R DD400A001S22R DD400A001222R DD400A001322R
## Min. : -1.00 Min. : -1.00 Min. : -1.00 Min. :-1.00
## 1st Qu.: 0.00 1st Qu.: -1.00 1st Qu.: -1.00 1st Qu.:-1.00
## Median : 37.00 Median : 60.00 Median : 22.50 Median : 0.00
## Mean : 33.08 Mean : 44.08 Mean : 29.23 Mean :14.05
## 3rd Qu.: 52.00 3rd Qu.: 83.00 3rd Qu.: 56.75 3rd Qu.:25.75
## Max. :100.00 Max. :100.00 Max. :100.00 Max. :83.00
## NA's :423 NA's :797 NA's :797 NA's :797
## DD200A001S22R DD200A001222R DD200A001322R DDE00A001S22R
## Min. : -1.00 Min. : -1.00 Min. : -1.00 Min. : -1.00
## 1st Qu.: 64.00 1st Qu.: 33.00 1st Qu.: 10.00 1st Qu.: 63.00
## Median : 76.00 Median : 47.00 Median : 20.00 Median : 70.00
## Mean : 68.18 Mean : 43.98 Mean : 21.06 Mean : 69.68
## 3rd Qu.: 86.00 3rd Qu.: 60.00 3rd Qu.: 30.00 3rd Qu.: 77.00
## Max. :100.00 Max. :100.00 Max. :100.00 Max. :100.00
## NA's :133 NA's :133 NA's :133 NA's :10
## DDE00A001222R DDE00A001322R DA0CT21R DA0CC21R
## Min. : -1.00 Min. :-1.0 Min. : -2.00 Min. :-1.00
## 1st Qu.: 32.00 1st Qu.:12.0 1st Qu.: 40.42 1st Qu.:12.90
## Median : 39.00 Median :15.0 Median : 63.05 Median :23.55
## Mean : 39.23 Mean :15.9 Mean : 60.76 Mean :26.10
## 3rd Qu.: 46.00 3rd Qu.:19.0 3rd Qu.: 85.38 3rd Qu.:37.08
## Max. :100.00 Max. :80.0 Max. :100.00 Max. :97.70
## NA's :10 NA's :10 NA's :125 NA's :147
## DA0CSA21R DA0CAA21R DPSATOFC DPSTTOFC
## Min. : -1.0 Min. :-1.00 Min. : 1.0 Min. : 0.00
## 1st Qu.: 887.0 1st Qu.:16.30 1st Qu.: 58.9 1st Qu.: 30.57
## Median : 973.0 Median :19.00 Median : 144.1 Median : 72.00
## Mean : 823.9 Mean :16.13 Mean : 622.5 Mean : 307.06
## 3rd Qu.:1039.0 3rd Qu.:21.20 3rd Qu.: 405.2 3rd Qu.: 196.50
## Max. :1344.0 Max. :31.40 Max. :23716.2 Max. :10619.50
## NA's :262 NA's :236 NA's :3 NA's :3
## DPSCTOFP DPSSTOFP DPSUTOFP DPSTTOFP
## Min. : 0.000 Min. : 0.00 Min. : 0.000 Min. : 0.00
## 1st Qu.: 1.200 1st Qu.: 2.60 1st Qu.: 4.100 1st Qu.:46.60
## Median : 1.800 Median : 3.10 Median : 6.600 Median :50.80
## Mean : 2.178 Mean : 3.58 Mean : 7.169 Mean :50.98
## 3rd Qu.: 2.600 3rd Qu.: 3.90 3rd Qu.: 9.800 3rd Qu.:54.80
## Max. :14.900 Max. :100.00 Max. :49.700 Max. :88.30
## NA's :3 NA's :3 NA's :3 NA's :3
## DPSETOFP DPSXTOFP DPSCTOSA DPSSTOSA
## Min. : 0.00 Min. : 0.00 Min. : -2 Min. : -2
## 1st Qu.: 9.70 1st Qu.:19.38 1st Qu.: 95459 1st Qu.: 73469
## Median :12.60 Median :23.65 Median :106674 Median : 78723
## Mean :12.95 Mean :23.14 Mean :108039 Mean : 79435
## 3rd Qu.:16.20 3rd Qu.:27.50 3rd Qu.:119540 3rd Qu.: 84944
## Max. :48.80 Max. :55.40 Max. :270000 Max. :192500
## NA's :3 NA's :3 NA's :10 NA's :11
## DPSUTOSA DPSTTOSA DPSAMIFP DPSAKIDR
## Min. : -2 Min. : 36081 Min. : 0.00 Min. : 0.100
## 1st Qu.: 57969 1st Qu.: 50439 1st Qu.: 13.30 1st Qu.: 5.400
## Median : 63015 Median : 53382 Median : 26.60 Median : 6.300
## Mean : 62424 Mean : 53971 Mean : 35.24 Mean : 6.734
## 3rd Qu.: 67941 3rd Qu.: 56919 3rd Qu.: 50.62 3rd Qu.: 7.300
## Max. :228972 Max. :110560 Max. :100.00 Max. :349.100
## NA's :54 NA's :4 NA's :3 NA's :3
## DPSTKIDR DPST05FP DPSTEXPA DPSTADFP
## Min. :-2.00 Min. : 0.00 Min. : 0.00 Min. : 0.00
## 1st Qu.:10.80 1st Qu.: 24.35 1st Qu.:10.07 1st Qu.:14.88
## Median :12.70 Median : 32.40 Median :12.00 Median :20.90
## Mean :12.56 Mean : 34.88 Mean :11.75 Mean :20.86
## 3rd Qu.:14.40 3rd Qu.: 41.65 3rd Qu.:13.90 3rd Qu.:26.12
## Max. :37.30 Max. :100.00 Max. :22.90 Max. :78.70
## NA's :3 NA's :3 NA's :3 NA's :3
## DPSTURNR DPSTBLFP DPSTHIFP DPSTWHFP
## Min. : 0.00 Min. : 0.00 Min. : 0.00 Min. : 0.00
## 1st Qu.: 14.80 1st Qu.: 0.00 1st Qu.: 4.20 1st Qu.: 58.67
## Median : 19.50 Median : 1.60 Median : 10.10 Median : 82.40
## Mean : 21.51 Mean : 6.99 Mean : 19.05 Mean : 71.57
## 3rd Qu.: 25.90 3rd Qu.: 6.20 3rd Qu.: 22.50 3rd Qu.: 92.60
## Max. :100.00 Max. :100.00 Max. :100.00 Max. :100.00
## NA's :7 NA's :3 NA's :3 NA's :3
## DPSTINFP DPSTASFP DPSTPIFP DPSTTWFP
## Min. : 0.0000 Min. : 0.000 Min. :0.00000 Min. : 0.0000
## 1st Qu.: 0.0000 1st Qu.: 0.000 1st Qu.:0.00000 1st Qu.: 0.0000
## Median : 0.0000 Median : 0.000 Median :0.00000 Median : 0.0000
## Mean : 0.3566 Mean : 1.118 Mean :0.08206 Mean : 0.7566
## 3rd Qu.: 0.3000 3rd Qu.: 0.900 3rd Qu.:0.00000 3rd Qu.: 1.2000
## Max. :16.7000 Max. :94.800 Max. :7.80000 Max. :11.7000
## NA's :3 NA's :3 NA's :3 NA's :3
## DPSTREFP DPSTSPFP DPSTCOFP DPSTBIFP
## Min. : 0.00 Min. : 0.000 Min. : 0.000 Min. : 0.000
## 1st Qu.: 71.00 1st Qu.: 4.500 1st Qu.: 0.000 1st Qu.: 0.000
## Median : 76.90 Median : 7.000 Median : 3.350 Median : 0.000
## Mean : 76.87 Mean : 7.145 Mean : 4.131 Mean : 2.311
## 3rd Qu.: 82.42 3rd Qu.: 9.600 3rd Qu.: 6.125 3rd Qu.: 2.100
## Max. :100.00 Max. :22.800 Max. :32.500 Max. :94.300
## NA's :3 NA's :3 NA's :3 NA's :3
## DPSTVOFP DPSTGOFP DPFVTOTK DPFTADPR
## Min. : 0.000 Min. : 0.000 Min. : 0 Min. :0.0000
## 1st Qu.: 4.800 1st Qu.: 0.000 1st Qu.: 238299 1st Qu.:0.9892
## Median : 7.000 Median : 1.200 Median : 419144 Median :1.1670
## Mean : 7.154 Mean : 2.308 Mean : 665067 Mean :1.0212
## 3rd Qu.: 9.425 3rd Qu.: 3.700 3rd Qu.: 670248 3rd Qu.:1.3017
## Max. :71.900 Max. :30.800 Max. :26416597 Max. :1.7480
## NA's :3 NA's :3 NA's :5 NA's :5
## DPFRAALLT DPFRAALLK DPFRAOPRT DPFRASTAP
## Min. :6.428e+05 Min. : 8923 Min. :6.428e+05 Min. : 1.70
## 1st Qu.:5.828e+06 1st Qu.: 12953 1st Qu.:5.524e+06 1st Qu.: 33.85
## Median :1.381e+07 Median : 14653 Median :1.241e+07 Median : 51.00
## Mean :5.995e+07 Mean : 16365 Mean :5.129e+07 Mean : 49.05
## 3rd Qu.:3.805e+07 3rd Qu.: 17081 3rd Qu.:3.241e+07 3rd Qu.: 64.80
## Max. :2.619e+09 Max. :214078 Max. :2.213e+09 Max. :103.40
## NA's :5 NA's :5 NA's :5 NA's :5
## DZRVLOCP DPFRAFEDP DPFRAORVT DPFUNAB1T
## Min. :-6.20 Min. : 0.00 Min. : -655726 Min. : -746998
## 1st Qu.:21.10 1st Qu.: 8.70 1st Qu.: 98311 1st Qu.: 1226730
## Median :35.30 Median :12.30 Median : 1093332 Median : 3589384
## Mean :37.92 Mean :13.04 Mean : 8659622 Mean : 13498263
## 3rd Qu.:53.70 3rd Qu.:16.20 3rd Qu.: 4471240 3rd Qu.: 9357248
## Max. :97.60 Max. :49.00 Max. :405596099 Max. :662450197
## NA's :5 NA's :5 NA's :5 NA's :5
## DPFUNA4T DPFEAALLT DPFEAOPFT DPFEAOPFK
## Min. : -7033092 Min. :6.229e+05 Min. :6.120e+05 Min. : 6755
## 1st Qu.: 0 1st Qu.:5.475e+06 1st Qu.:4.754e+06 1st Qu.: 10916
## Median : 0 Median :1.328e+07 Median :1.102e+07 Median : 12228
## Mean : 510514 Mean :6.597e+07 Mean :4.951e+07 Mean : 13121
## 3rd Qu.: 0 3rd Qu.:3.787e+07 3rd Qu.:3.038e+07 3rd Qu.: 14012
## Max. :126144201 Max. :2.656e+09 Max. :2.068e+09 Max. :178467
## NA's :5 NA's :5 NA's :5 NA's :5
## DPFEAINSP DZEXADMP DZEXADSP DZEXPLAP
## Min. :18.50 Min. : 2.700 Min. : 0.000 Min. : 0.20
## 1st Qu.:52.00 1st Qu.: 7.125 1st Qu.: 4.900 1st Qu.:10.40
## Median :55.10 Median : 8.800 Median : 5.700 Median :11.80
## Mean :54.73 Mean : 9.606 Mean : 6.015 Mean :12.46
## 3rd Qu.:57.80 3rd Qu.:11.200 3rd Qu.: 6.400 3rd Qu.:13.50
## Max. :84.40 Max. :35.800 Max. :22.700 Max. :43.10
## NA's :5 NA's :5 NA's :5 NA's :5
## DZEXOTHP DPFEAINST DPFEAINSK DPFPAREGP
## Min. : 0.30 Min. :2.439e+05 Min. : 3122 Min. : 0.00
## 1st Qu.:15.30 1st Qu.:2.563e+06 1st Qu.: 6056 1st Qu.:35.12
## Median :18.00 Median :6.013e+06 Median : 6702 Median :39.70
## Mean :17.15 Mean :2.835e+07 Mean : 7074 Mean :39.80
## 3rd Qu.:20.00 3rd Qu.:1.683e+07 3rd Qu.: 7577 3rd Qu.:43.90
## Max. :69.30 Max. :1.177e+09 Max. :54954 Max. :79.10
## NA's :5 NA's :5 NA's :5 NA's :5
## DPFPASPEP DPFPACOMP DPFPABILP DPFPAVOCP
## Min. : 0.000 Min. : 0.000 Min. : 0.0000 Min. : 0.00
## 1st Qu.: 5.800 1st Qu.: 6.500 1st Qu.: 0.1000 1st Qu.: 2.90
## Median : 8.900 Median : 9.200 Median : 0.4000 Median : 4.10
## Mean : 9.711 Mean : 9.883 Mean : 0.7496 Mean : 3.96
## 3rd Qu.:12.500 3rd Qu.:12.100 3rd Qu.: 1.0000 3rd Qu.: 5.20
## Max. :49.000 Max. :90.600 Max. :26.0000 Max. :19.80
## NA's :5 NA's :5 NA's :5 NA's :5
## DPFPAGIFP DPFPAATHP DPFPAHSAP DPFPREKP
## Min. :0.0000 Min. :0.000 Min. :0.0000 Min. : 0.0000
## 1st Qu.:0.0000 1st Qu.:1.600 1st Qu.:0.0000 1st Qu.: 0.0000
## Median :0.2000 Median :2.900 Median :0.0000 Median : 0.6000
## Mean :0.3823 Mean :2.809 Mean :0.1578 Mean : 0.8909
## 3rd Qu.:0.4000 3rd Qu.:4.000 3rd Qu.:0.1000 3rd Qu.: 1.3000
## Max. :6.9000 Max. :9.000 Max. :3.4000 Max. :31.7000
## NA's :5 NA's :5 NA's :5 NA's :5
## DPFPAOTHP DISTSIZE COMMTYPE PROPWLTH
## Min. : 3.50 Length:1207 Length:1207 Length:1207
## 1st Qu.:25.40 Class :character Class :character Class :character
## Median :28.70 Mode :character Mode :character Mode :character
## Mean :29.22
## 3rd Qu.:32.40
## Max. :76.30
## NA's :5
## TAXRATE
## Length:1207
## Class :character
## Mode :character
##
##
##
##
# Narrow the analysis to a handful of key columns:
#   DA0CSA21R - SAT scores
#   DA0CAA21R - ACT scores
#   DPSTKIDR  - number of students per teacher
#   DPFEAINSP - expenditure: % instructional
#   DPFPAREGP - expenditure: % basic education services
summary(district[["DA0CSA21R"]])
## Min. 1st Qu. Median Mean 3rd Qu. Max. NA's
## -1.0 887.0 973.0 823.9 1039.0 1344.0 262
summary(district[["DA0CAA21R"]])
## Min. 1st Qu. Median Mean 3rd Qu. Max. NA's
## -1.00 16.30 19.00 16.13 21.20 31.40 236
summary(district[["DPSTKIDR"]])
## Min. 1st Qu. Median Mean 3rd Qu. Max. NA's
## -2.00 10.80 12.70 12.56 14.40 37.30 3
summary(district[["DPFEAINSP"]])
## Min. 1st Qu. Median Mean 3rd Qu. Max. NA's
## 18.50 52.00 55.10 54.73 57.80 84.40 5
summary(district[["DPFPAREGP"]])
## Min. 1st Qu. Median Mean 3rd Qu. Max. NA's
## 0.00 35.12 39.70 39.80 43.90 79.10 5
# More exploring with graphs ----
# Distribution of the instructional share of expenditure.
hist(district$DPFEAINSP)
# SAT score against the basic-education expenditure share, and against the
# number of students per teacher.
plot(district$DA0CSA21R, district$DPFPAREGP)
plot(district$DA0CSA21R, district$DPSTKIDR)

# Some correlation data ----
# Both columns contain missing values (262 and 3 NAs respectively), and cor()
# returns NA as soon as any input value is missing. `use = "complete.obs"`
# restricts the calculation to districts where both values are present.
cor(district$DA0CSA21R, district$DPSTKIDR, use = "complete.obs")
# Cleaning the data ----
# Calling na.omit() on the whole table drops a district if ANY of its
# columns is missing. Some columns have 797 NAs out of 1207 rows, so that
# approach keeps at most 410 districts, even though the columns analysed here
# are far more complete. Only the columns of interest are checked instead.
key_cols <- c("DA0CSA21R", "DA0CAA21R", "DPSTKIDR", "DPFEAINSP", "DPFPAREGP")

clean_district <- district

# The summaries show minima of -1 / -2 for SAT, ACT, and students-per-teacher,
# which cannot be real measurements. They are treated as missing here.
# NOTE(review): presumably these are masking / not-available codes; confirm
# against the data dictionary.
clean_district[key_cols] <- lapply(
  clean_district[key_cols],
  function(x) replace(x, !is.na(x) & x < 0, NA)
)

# Keep every column, but only the rows that are complete for the key columns.
clean_district <- clean_district[complete.cases(clean_district[key_cols]), ]

hist(clean_district$DPFEAINSP)
plot(clean_district$DA0CSA21R, clean_district$DPFPAREGP)
plot(clean_district$DA0CSA21R, clean_district$DPSTKIDR)
# No `use =` argument is needed: the key columns no longer contain NAs.
cor(clean_district$DA0CSA21R, clean_district$DPSTKIDR)