Attempt to regress the LCN data
Setup: set the working directory and load the required packages
# Make the datasets folder the working directory so the relative file name
# passed to read.csv() further down resolves.
# NOTE(review): this is a machine-specific absolute path; the script will stop
# here on any computer that does not have this folder.
setwd(dir = "C:/Users/Jerome/Documents/Data_Science_110/Datasets")
library(tidyverse)
## -- Attaching packages ----------------------------------------------------------------------------------------------- tidyverse 1.3.0 --
## v ggplot2 3.3.2 v purrr 0.3.4
## v tibble 3.0.1 v dplyr 1.0.0
## v tidyr 1.1.0 v stringr 1.4.0
## v readr 1.3.1 v forcats 0.5.0
## -- Conflicts -------------------------------------------------------------------------------------------------- tidyverse_conflicts() --
## x dplyr::filter() masks stats::filter()
## x dplyr::lag() masks stats::lag()
library(ggplot2)
Load the data set
# Read the CSV from the current working directory into a data frame.
lcn_fpf_co_names_sample <- read.csv(file = "lcn_fpf_co_names_sample.csv")
Select a random sample of 175 cases
# Fix the RNG seed (the value itself is arbitrary) so the same 175 rows are
# drawn on every run.
set.seed(110)
# Draw 175 rows without replacement and keep them in `lcn_sample`, so the drawn
# rows can be reused afterwards instead of being printed once and discarded.
lcn_sample <- sample_n(lcn_fpf_co_names_sample, 175, replace = FALSE)
# Print the sample for inspection.
lcn_sample
## ENTRY MEASURE SCORE Svy_Year Birth_Year Gender County Co_Name Region
## 1 3403 56.96 5 2007 1998 2 6 Grand Gedeh 4
## 2 6036 48.02 3 2007 2003 2 9 Margibi 3
## 3 7526 53.07 4 2007 2005 1 7 Grand Kru 5
## 4 3220 53.07 4 2007 1997 2 12 Nimba 6
## 5 16482 53.07 4 2013 2010 2 10 Maryland 4
## 6 16692 40.34 2 2013 2011 1 1 Bomi 1
## 7 6620 56.96 5 2007 2004 1 6 Grand Gedeh 4
## 8 6209 48.02 3 2007 2003 2 11 Montserrado 1
## 9 8996 21.13 1 2007 2006 2 12 Nimba 6
## 10 2036 85.42 15 2007 1994 1 10 Maryland 5
## 11 13306 53.07 4 2013 2005 2 7 Grand Kru 4
## 12 10549 60.25 6 2013 1998 2 1 Bomi 1
## 13 8725 40.34 2 2007 2006 2 11 Montserrado 1
## 14 16005 60.25 6 2013 2009 1 12 Nimba 5
## 15 5738 56.96 5 2007 2002 1 14 River Gee 5
## 16 15352 0.01 0 2013 2008 1 11 Montserrado 2
## 17 9345 21.13 1 2013 1986 1 12 Nimba 5
## 18 12343 0.01 0 2013 2003 2 8 Lofa 5
## 19 5494 60.25 6 2007 2002 1 9 Margibi 3
## 20 8580 40.34 2 2007 2006 2 9 Margibi 3
## 21 2635 56.96 5 2007 1996 1 10 Maryland 5
## 22 2753 53.07 4 2007 1996 1 12 Nimba 6
## 23 2250 0.01 0 2007 1995 1 6 Grand Gedeh 4
## 24 7985 21.13 1 2007 2005 2 12 Nimba 6
## 25 7092 65.85 8 2007 2004 2 12 Nimba 6
## 26 9628 21.13 1 2013 1992 1 7 Grand Kru 4
## 27 15108 56.96 5 2013 2008 1 5 Grand Cape Mt 1
## 28 9436 56.96 5 2013 1989 1 12 Nimba 5
## 29 1193 65.85 8 2007 1991 1 9 Margibi 3
## 30 10022 48.02 3 2013 1995 2 6 Grand Gedeh 3
## 31 3162 68.40 9 2007 1997 1 11 Montserrado 1
## 32 202 21.13 1 2007 1984 2 3 Gbarpolu 2
## 33 2350 91.13 16 2007 1995 1 11 Montserrado 1
## 34 17956 56.96 5 2013 2012 2 4 Grand Bassa 2
## 35 15433 0.01 0 2013 2008 2 13 River Cess 3
## 36 1747 63.17 7 2007 1993 1 11 Montserrado 1
## 37 10095 0.01 0 2013 1995 2 12 Nimba 5
## 38 17140 56.96 5 2013 2011 2 9 Margibi 2
## 39 4719 53.07 4 2007 2000 1 12 Nimba 6
## 40 3828 53.07 4 2007 1999 1 4 Grand Bassa 3
## 41 15668 56.96 5 2013 2009 2 4 Grand Bassa 2
## 42 15018 48.02 3 2013 2008 2 2 Bong 5
## 43 7447 56.96 5 2007 2005 2 6 Grand Gedeh 4
## 44 11695 40.34 2 2013 2001 2 14 River Gee 4
## 45 901 48.02 3 2007 1990 1 3 Gbarpolu 2
## 46 16878 60.25 6 2013 2011 2 4 Grand Bassa 2
## 47 5910 48.02 3 2007 2003 1 4 Grand Bassa 3
## 48 704 53.07 4 2007 1988 2 12 Nimba 6
## 49 7841 63.17 7 2007 2005 2 11 Montserrado 1
## 50 7617 53.07 4 2007 2005 1 9 Margibi 3
## 51 7357 21.13 1 2007 2005 1 3 Gbarpolu 2
## 52 10725 60.25 6 2013 1998 2 12 Nimba 5
## 53 13024 0.01 0 2013 2004 1 14 River Gee 4
## 54 1311 21.13 1 2007 1992 2 2 Bong 6
## 55 10404 40.34 2 2013 1997 2 7 Grand Kru 4
## 56 17732 0.01 0 2013 2012 1 2 Bong 5
## 57 4934 56.96 5 2007 2001 2 6 Grand Gedeh 4
## 58 11919 53.07 4 2013 2002 2 8 Lofa 5
## 59 15931 21.13 1 2013 2009 1 10 Maryland 4
## 60 12981 53.07 4 2013 2004 1 12 Nimba 5
## 61 43 73.32 11 2007 1980 2 10 Maryland 5
## 62 1160 53.07 4 2007 1991 2 6 Grand Gedeh 4
## 63 11077 40.34 2 2013 1999 1 15 Sinoe 3
## 64 3244 0.01 0 2007 1997 2 14 River Gee 5
## 65 17502 0.01 0 2013 2011 1 14 River Gee 4
## 66 15242 0.01 0 2013 2008 1 8 Lofa 5
## 67 13406 53.07 4 2013 2005 2 10 Maryland 4
## 68 12019 21.13 1 2013 2002 2 12 Nimba 5
## 69 13320 21.13 1 2013 2005 2 7 Grand Kru 4
## 70 10291 60.25 6 2013 1996 1 13 River Cess 3
## 71 11613 53.07 4 2013 2001 2 11 Montserrado 2
## 72 220 56.96 5 2007 1984 1 6 Grand Gedeh 4
## 73 14403 21.13 1 2013 2007 2 3 Gbarpolu 1
## 74 2340 68.40 9 2007 1995 2 11 Montserrado 1
## 75 2562 56.96 5 2007 1996 2 7 Grand Kru 5
## 76 14786 48.02 3 2013 2007 1 12 Nimba 5
## 77 11091 0.01 0 2013 2000 2 1 Bomi 1
## 78 2108 63.17 7 2007 1994 2 12 Nimba 6
## 79 10866 0.01 0 2013 1999 1 4 Grand Bassa 2
## 80 5794 21.13 1 2007 2003 2 1 Bomi 2
## 81 7537 60.25 6 2007 2005 1 8 Lofa 6
## 82 12980 0.01 0 2013 2004 2 12 Nimba 5
## 83 8053 85.42 15 2007 2005 1 14 River Gee 5
## 84 14421 63.17 7 2013 2007 2 3 Gbarpolu 1
## 85 13468 63.17 7 2013 2005 2 11 Montserrado 2
## 86 5382 53.07 4 2007 2002 1 6 Grand Gedeh 4
## 87 15027 56.96 5 2013 2008 2 2 Bong 5
## 88 12513 21.13 1 2013 2003 1 13 River Cess 3
## 89 15459 56.96 5 2013 2008 2 13 River Cess 3
## 90 12124 0.01 0 2013 2002 2 15 Sinoe 3
## 91 2529 0.01 0 2007 1996 1 5 Grand Cape Mt 2
## 92 8507 40.34 2 2007 2006 2 8 Lofa 6
## 93 10358 48.02 3 2013 1997 2 4 Grand Bassa 2
## 94 11834 21.13 1 2013 2002 1 5 Grand Cape Mt 1
## 95 5177 60.25 6 2007 2001 1 12 Nimba 6
## 96 1391 70.86 10 2007 1992 2 8 Lofa 6
## 97 4425 63.17 7 2007 2000 2 8 Lofa 6
## 98 1263 53.07 4 2007 1991 1 12 Nimba 6
## 99 10294 60.25 6 2013 1996 1 14 River Gee 4
## 100 16499 0.01 0 2013 2010 2 11 Montserrado 2
## 101 3214 65.85 8 2007 1997 1 12 Nimba 6
## 102 5735 21.13 1 2007 2002 1 14 River Gee 5
## 103 8769 63.17 7 2007 2006 2 11 Montserrado 1
## 104 8474 48.02 3 2007 2006 2 8 Lofa 6
## 105 6837 68.40 9 2007 2004 1 10 Maryland 5
## 106 11003 21.13 1 2013 1999 1 12 Nimba 5
## 107 6172 56.96 5 2007 2003 2 11 Montserrado 1
## 108 14357 0.01 0 2013 2007 1 2 Bong 5
## 109 17797 56.96 5 2013 2012 2 3 Gbarpolu 1
## 110 17185 53.07 4 2013 2011 1 10 Maryland 4
## 111 6559 21.13 1 2007 2004 1 5 Grand Cape Mt 2
## 112 14338 0.01 0 2013 2007 1 2 Bong 5
## 113 19583 21.13 1 2013 2013 2 11 Montserrado 2
## 114 18598 56.96 5 2013 2012 1 11 Montserrado 2
## 115 5437 56.96 5 2007 2002 1 7 Grand Kru 5
## 116 9400 65.85 8 2013 1989 1 1 Bomi 1
## 117 15974 60.25 6 2013 2009 2 11 Montserrado 2
## 118 6309 21.13 1 2007 2003 2 14 River Gee 5
## 119 748 56.96 5 2007 1989 1 4 Grand Bassa 3
## 120 175 56.96 5 2007 1983 2 11 Montserrado 1
## 121 7311 68.40 9 2007 2005 2 3 Gbarpolu 2
## 122 5012 56.96 5 2007 2001 1 9 Margibi 3
## 123 130 21.13 1 2007 1982 2 12 Nimba 6
## 124 6801 73.32 11 2007 2004 1 10 Maryland 5
## 125 15842 21.13 1 2013 2009 1 7 Grand Kru 4
## 126 671 48.02 3 2007 1988 2 10 Maryland 5
## 127 9168 21.13 1 2007 2006 1 15 Sinoe 4
## 128 1892 60.25 6 2007 1994 2 3 Gbarpolu 2
## 129 6380 40.34 2 2007 2004 2 2 Bong 6
## 130 5547 68.40 9 2007 2002 1 10 Maryland 5
## 131 17379 53.07 4 2013 2011 2 12 Nimba 5
## 132 10123 0.01 0 2013 1995 1 14 River Gee 4
## 133 19253 21.13 1 2013 2013 2 2 Bong 5
## 134 12039 21.13 1 2013 2002 2 12 Nimba 5
## 135 4994 60.25 6 2007 2001 2 9 Margibi 3
## 136 14673 0.01 0 2013 2007 2 9 Margibi 2
## 137 837 48.02 3 2007 1989 2 12 Nimba 6
## 138 10989 53.07 4 2013 1999 1 11 Montserrado 2
## 139 8029 53.07 4 2007 2005 1 13 River Cess 4
## 140 13752 60.25 6 2013 2006 1 3 Gbarpolu 1
## 141 15420 60.25 6 2013 2008 2 13 River Cess 3
## 142 16022 0.01 0 2013 2009 2 12 Nimba 5
## 143 12839 0.01 0 2013 2004 2 8 Lofa 5
## 144 9923 56.96 5 2013 1994 1 10 Maryland 4
## 145 12097 21.13 1 2013 2002 1 14 River Gee 4
## 146 5074 70.86 10 2007 2001 1 11 Montserrado 1
## 147 7778 60.25 6 2007 2005 1 11 Montserrado 1
## 148 3406 0.01 0 2007 1998 2 6 Grand Gedeh 4
## 149 8781 56.96 5 2007 2006 1 11 Montserrado 1
## 150 2041 21.13 1 2007 1994 1 10 Maryland 5
## 151 2721 70.86 10 2007 1996 1 11 Montserrado 1
## 152 2388 21.13 1 2007 1995 1 12 Nimba 6
## 153 11809 21.13 1 2013 2002 1 4 Grand Bassa 2
## 154 16740 56.96 5 2013 2011 1 2 Bong 5
## 155 11772 53.07 4 2013 2002 2 2 Bong 5
## 156 12386 0.01 0 2013 2003 1 9 Margibi 2
## 157 12251 21.13 1 2013 2003 1 5 Grand Cape Mt 1
## 158 18194 21.13 1 2013 2012 2 7 Grand Kru 4
## 159 3277 85.42 15 2007 1997 2 15 Sinoe 4
## 160 10177 21.13 1 2013 1996 2 4 Grand Bassa 2
## 161 5400 60.25 6 2007 2002 2 6 Grand Gedeh 4
## 162 3001 56.96 5 2007 1997 1 7 Grand Kru 5
## 163 6018 0.01 0 2007 2003 2 8 Lofa 6
## 164 2474 56.96 5 2007 1996 2 2 Bong 6
## 165 1566 60.25 6 2007 1993 2 2 Bong 6
## 166 5873 60.25 6 2007 2003 1 3 Gbarpolu 2
## 167 9966 60.25 6 2013 1994 2 14 River Gee 4
## 168 18109 21.13 1 2013 2012 1 6 Grand Gedeh 3
## 169 4888 81.61 14 2007 2001 2 4 Grand Bassa 3
## 170 568 60.25 6 2007 1987 2 12 Nimba 6
## 171 16178 48.02 3 2013 2009 2 15 Sinoe 3
## 172 7996 56.96 5 2007 2005 1 12 Nimba 6
## 173 7531 73.32 11 2007 2005 2 8 Lofa 6
## 174 12530 56.96 5 2013 2003 1 13 River Cess 3
## 175 10477 56.96 5 2013 1997 1 12 Nimba 5
## UrbRur Educ Wealth
## 1 2 0 1
## 2 2 0 2
## 3 2 1 3
## 4 2 0 3
## 5 2 0 3
## 6 1 3 4
## 7 1 1 3
## 8 1 2 5
## 9 2 1 1
## 10 1 1 3
## 11 2 0 1
## 12 2 0 3
## 13 1 3 4
## 14 1 1 2
## 15 2 0 2
## 16 2 0 2
## 17 2 1 2
## 18 2 0 1
## 19 2 0 2
## 20 2 0 5
## 21 2 0 2
## 22 2 0 3
## 23 2 0 2
## 24 2 0 3
## 25 1 0 4
## 26 2 0 3
## 27 2 1 3
## 28 2 1 3
## 29 2 0 3
## 30 2 3 2
## 31 1 0 4
## 32 2 4 2
## 33 1 0 3
## 34 2 1 1
## 35 2 1 1
## 36 1 0 4
## 37 2 0 3
## 38 1 3 3
## 39 2 1 1
## 40 2 0 3
## 41 2 1 1
## 42 2 1 3
## 43 2 0 1
## 44 1 3 4
## 45 1 0 2
## 46 2 0 2
## 47 2 0 1
## 48 2 3 3
## 49 1 0 5
## 50 2 1 3
## 51 2 0 1
## 52 1 0 2
## 53 2 2 1
## 54 2 0 2
## 55 2 0 2
## 56 1 0 1
## 57 2 1 3
## 58 2 0 1
## 59 1 1 3
## 60 2 1 4
## 61 1 4 4
## 62 2 0 4
## 63 1 0 5
## 64 2 1 2
## 65 2 3 1
## 66 2 0 1
## 67 2 1 1
## 68 2 0 2
## 69 2 3 1
## 70 2 0 2
## 71 1 3 5
## 72 2 0 2
## 73 1 4 3
## 74 1 0 5
## 75 2 4 4
## 76 1 1 2
## 77 2 0 1
## 78 1 5 5
## 79 2 0 1
## 80 1 0 2
## 81 2 0 2
## 82 1 1 2
## 83 2 1 2
## 84 2 0 1
## 85 1 0 4
## 86 2 2 1
## 87 1 1 3
## 88 2 0 2
## 89 2 1 1
## 90 2 0 1
## 91 2 0 4
## 92 2 0 2
## 93 2 0 1
## 94 2 0 5
## 95 2 0 4
## 96 1 0 4
## 97 2 0 2
## 98 2 0 1
## 99 2 1 1
## 100 1 1 4
## 101 2 2 3
## 102 2 3 2
## 103 1 1 4
## 104 2 0 3
## 105 2 1 4
## 106 2 1 1
## 107 1 3 3
## 108 2 0 2
## 109 2 1 2
## 110 2 0 1
## 111 2 0 2
## 112 2 0 2
## 113 1 2 4
## 114 1 0 5
## 115 2 0 1
## 116 1 0 3
## 117 1 2 4
## 118 2 0 1
## 119 2 0 2
## 120 1 3 3
## 121 2 0 2
## 122 2 0 2
## 123 2 0 3
## 124 1 3 4
## 125 2 0 1
## 126 2 1 2
## 127 2 1 2
## 128 2 0 3
## 129 2 0 1
## 130 2 0 1
## 131 2 3 3
## 132 2 1 1
## 133 2 0 2
## 134 2 1 1
## 135 2 0 4
## 136 2 3 4
## 137 2 3 3
## 138 1 3 5
## 139 2 2 1
## 140 2 0 2
## 141 2 0 1
## 142 2 1 2
## 143 2 4 2
## 144 1 0 5
## 145 1 0 4
## 146 1 0 4
## 147 1 5 5
## 148 1 0 2
## 149 1 3 4
## 150 1 0 3
## 151 1 1 4
## 152 2 0 1
## 153 2 0 1
## 154 1 0 1
## 155 2 0 1
## 156 2 1 3
## 157 1 0 2
## 158 2 0 3
## 159 2 3 2
## 160 2 0 1
## 161 2 1 2
## 162 2 3 4
## 163 2 0 2
## 164 2 1 4
## 165 2 0 1
## 166 2 0 1
## 167 2 1 1
## 168 2 0 1
## 169 1 1 4
## 170 2 0 2
## 171 1 0 1
## 172 2 0 3
## 173 2 3 2
## 174 2 0 1
## 175 2 3 1
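Try again, this time storing the sample as lcn_sample and writing it to lcn_sample.csv (code currently commented out)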
##lcn_sample <- sample_n(lcn_fpf_co_names_sample, 175, replace = FALSE)
##write.csv(lcn_sample, file = "lcn_sample.csv")
Try the regression on the sample
##fit2 <-lm( MEASURE~ as.factor(UrbRur) + as.factor(Educ) + as.factor(Wealth), data = lcn_sample)
##lm( MEASURE~ as.factor(UrbRur) + as.factor(Educ) + as.factor(Wealth), data = lcn_sample)
Try regression without saving it
##lm( MEASURE~ as.factor(UrbRur) + as.factor(Educ) + as.factor(Wealth), data = lcn_sample)