library(readxl)
# Load the Boston Housing data from a CSV file in the working directory.
housing.df <- read.csv("BostonHousing.csv")

# View() opens a GUI data viewer, so only call it in an interactive session;
# this keeps the script usable when run non-interactively (Rscript, knitting).
if (interactive()) {
  View(housing.df)
}

# Number of rows and columns.
dim(housing.df)
## [1] 506  15
# Per-column summary: min, 1st quartile, median, mean, 3rd quartile, max.
summary(housing.df)
##       CRIM                ZN             INDUS            CHAS        
##  Min.   : 0.00632   Min.   :  0.00   Min.   : 0.46   Min.   :0.00000  
##  1st Qu.: 0.08205   1st Qu.:  0.00   1st Qu.: 5.19   1st Qu.:0.00000  
##  Median : 0.25651   Median :  0.00   Median : 9.69   Median :0.00000  
##  Mean   : 3.61352   Mean   : 11.36   Mean   :11.14   Mean   :0.06917  
##  3rd Qu.: 3.67708   3rd Qu.: 12.50   3rd Qu.:18.10   3rd Qu.:0.00000  
##  Max.   :88.97620   Max.   :100.00   Max.   :27.74   Max.   :1.00000  
##       NOX               RM             AGE              DIS        
##  Min.   :0.3850   Min.   :3.561   Min.   :  2.90   Min.   : 1.130  
##  1st Qu.:0.4490   1st Qu.:5.886   1st Qu.: 45.02   1st Qu.: 2.100  
##  Median :0.5380   Median :6.208   Median : 77.50   Median : 3.207  
##  Mean   :0.5547   Mean   :6.285   Mean   : 68.57   Mean   : 3.795  
##  3rd Qu.:0.6240   3rd Qu.:6.623   3rd Qu.: 94.08   3rd Qu.: 5.188  
##  Max.   :0.8710   Max.   :8.780   Max.   :100.00   Max.   :12.127  
##       RAD              TAX           PTRATIO            B         
##  Min.   : 1.000   Min.   :187.0   Min.   :12.60   Min.   :  0.32  
##  1st Qu.: 4.000   1st Qu.:279.0   1st Qu.:17.40   1st Qu.:375.38  
##  Median : 5.000   Median :330.0   Median :19.05   Median :391.44  
##  Mean   : 9.549   Mean   :408.2   Mean   :18.46   Mean   :356.67  
##  3rd Qu.:24.000   3rd Qu.:666.0   3rd Qu.:20.20   3rd Qu.:396.23  
##  Max.   :24.000   Max.   :711.0   Max.   :22.00   Max.   :396.90  
##      LSTAT            MEDV         CAT..MEDV    
##  Min.   : 1.73   Min.   : 5.00   Min.   :0.000  
##  1st Qu.: 6.95   1st Qu.:17.02   1st Qu.:0.000  
##  Median :11.36   Median :21.20   Median :0.000  
##  Mean   :12.65   Mean   :22.53   Mean   :0.166  
##  3rd Qu.:16.95   3rd Qu.:25.00   3rd Qu.:0.000  
##  Max.   :37.97   Max.   :50.00   Max.   :1.000
library(psych)
## Warning: package 'psych' was built under R version 4.0.5
# Extended per-column descriptive statistics via describe() (psych is loaded
# just above): n, mean, sd, median, trimmed, mad, min, max, range, skew,
# kurtosis and se.
describe(housing.df)
##           vars   n   mean     sd median trimmed    mad    min    max  range
## CRIM         1 506   3.61   8.60   0.26    1.68   0.33   0.01  88.98  88.97
## ZN           2 506  11.36  23.32   0.00    5.08   0.00   0.00 100.00 100.00
## INDUS        3 506  11.14   6.86   9.69   10.93   9.37   0.46  27.74  27.28
## CHAS         4 506   0.07   0.25   0.00    0.00   0.00   0.00   1.00   1.00
## NOX          5 506   0.55   0.12   0.54    0.55   0.13   0.38   0.87   0.49
## RM           6 506   6.28   0.70   6.21    6.25   0.51   3.56   8.78   5.22
## AGE          7 506  68.57  28.15  77.50   71.20  28.98   2.90 100.00  97.10
## DIS          8 506   3.80   2.11   3.21    3.54   1.91   1.13  12.13  11.00
## RAD          9 506   9.55   8.71   5.00    8.73   2.97   1.00  24.00  23.00
## TAX         10 506 408.24 168.54 330.00  400.04 108.23 187.00 711.00 524.00
## PTRATIO     11 506  18.46   2.16  19.05   18.66   1.70  12.60  22.00   9.40
## B           12 506 356.67  91.29 391.44  383.17   8.09   0.32 396.90 396.58
## LSTAT       13 506  12.65   7.14  11.36   11.90   7.11   1.73  37.97  36.24
## MEDV        14 506  22.53   9.20  21.20   21.56   5.93   5.00  50.00  45.00
## CAT..MEDV   15 506   0.17   0.37   0.00    0.08   0.00   0.00   1.00   1.00
##            skew kurtosis   se
## CRIM       5.19    36.60 0.38
## ZN         2.21     3.95 1.04
## INDUS      0.29    -1.24 0.30
## CHAS       3.39     9.48 0.01
## NOX        0.72    -0.09 0.01
## RM         0.40     1.84 0.03
## AGE       -0.60    -0.98 1.25
## DIS        1.01     0.46 0.09
## RAD        1.00    -0.88 0.39
## TAX        0.67    -1.15 7.49
## PTRATIO   -0.80    -0.30 0.10
## B         -2.87     7.10 4.06
## LSTAT      0.90     0.46 0.32
## MEDV       1.10     1.45 0.41
## CAT..MEDV  1.79     1.21 0.02
# Flat contingency table of counts: RAD values as rows, CHAS (0/1) as columns.
ftable(CHAS ~ RAD, data=housing.df)
##     CHAS   0   1
## RAD             
## 1         19   1
## 2         24   0
## 3         36   2
## 4        102   8
## 5        104  11
## 6         26   0
## 7         17   0
## 8         19   5
## 24       124   8
# Scatterplot matrix of every pair of columns in the data frame.
plot(housing.df)

# Scatterplot matrix restricted to a subset of variables. Columns are selected
# by name rather than by position (previously 3, 5, 6, 11, 13, 14) so the
# selection is self-describing and survives column reordering.
# pch = 3 draws each point as a "+".
plot(
  housing.df[, c("INDUS", "NOX", "RM", "PTRATIO", "LSTAT", "MEDV")],
  pch = 3
)

# Pairwise correlation matrix of all columns (cor() defaults to Pearson).
# The previous call passed housing.df$MV as `y`, but the data frame has no
# column named (or starting with) "MV", so that argument evaluated to NULL and
# cor() silently returned the full matrix. Calling cor() on the data frame
# alone states that explicitly and produces the same result.
# For correlations against MEDV only, use: cor(housing.df, housing.df$MEDV)
cor(housing.df)
##                  CRIM          ZN       INDUS         CHAS         NOX
## CRIM       1.00000000 -0.20046922  0.40658341 -0.055891582  0.42097171
## ZN        -0.20046922  1.00000000 -0.53382819 -0.042696719 -0.51660371
## INDUS      0.40658341 -0.53382819  1.00000000  0.062938027  0.76365145
## CHAS      -0.05589158 -0.04269672  0.06293803  1.000000000  0.09120281
## NOX        0.42097171 -0.51660371  0.76365145  0.091202807  1.00000000
## RM        -0.21924670  0.31199059 -0.39167585  0.091251225 -0.30218819
## AGE        0.35273425 -0.56953734  0.64477851  0.086517774  0.73147010
## DIS       -0.37967009  0.66440822 -0.70802699 -0.099175780 -0.76923011
## RAD        0.62550515 -0.31194783  0.59512927 -0.007368241  0.61144056
## TAX        0.58276431 -0.31456332  0.72076018 -0.035586518  0.66802320
## PTRATIO    0.28994558 -0.39167855  0.38324756 -0.121515174  0.18893268
## B         -0.38506394  0.17552032 -0.35697654  0.048788485 -0.38005064
## LSTAT      0.45562148 -0.41299457  0.60379972 -0.053929298  0.59087892
## MEDV      -0.38830461  0.36044534 -0.48372516  0.175260177 -0.42732077
## CAT..MEDV -0.15198696  0.36529623 -0.36627559  0.108631150 -0.23250184
##                    RM         AGE         DIS          RAD         TAX
## CRIM      -0.21924670  0.35273425 -0.37967009  0.625505145  0.58276431
## ZN         0.31199059 -0.56953734  0.66440822 -0.311947826 -0.31456332
## INDUS     -0.39167585  0.64477851 -0.70802699  0.595129275  0.72076018
## CHAS       0.09125123  0.08651777 -0.09917578 -0.007368241 -0.03558652
## NOX       -0.30218819  0.73147010 -0.76923011  0.611440563  0.66802320
## RM         1.00000000 -0.24026493  0.20524621 -0.209846668 -0.29204783
## AGE       -0.24026493  1.00000000 -0.74788054  0.456022452  0.50645559
## DIS        0.20524621 -0.74788054  1.00000000 -0.494587930 -0.53443158
## RAD       -0.20984667  0.45602245 -0.49458793  1.000000000  0.91022819
## TAX       -0.29204783  0.50645559 -0.53443158  0.910228189  1.00000000
## PTRATIO   -0.35550149  0.26151501 -0.23247054  0.464741179  0.46085304
## B          0.12806864 -0.27353398  0.29151167 -0.444412816 -0.44180801
## LSTAT     -0.61380827  0.60233853 -0.49699583  0.488676335  0.54399341
## MEDV       0.69535995 -0.37695457  0.24992873 -0.381626231 -0.46853593
## CAT..MEDV  0.64126541 -0.19119589  0.11888651 -0.197924023 -0.27368672
##              PTRATIO           B      LSTAT       MEDV  CAT..MEDV
## CRIM       0.2899456 -0.38506394  0.4556215 -0.3883046 -0.1519870
## ZN        -0.3916785  0.17552032 -0.4129946  0.3604453  0.3652962
## INDUS      0.3832476 -0.35697654  0.6037997 -0.4837252 -0.3662756
## CHAS      -0.1215152  0.04878848 -0.0539293  0.1752602  0.1086312
## NOX        0.1889327 -0.38005064  0.5908789 -0.4273208 -0.2325018
## RM        -0.3555015  0.12806864 -0.6138083  0.6953599  0.6412654
## AGE        0.2615150 -0.27353398  0.6023385 -0.3769546 -0.1911959
## DIS       -0.2324705  0.29151167 -0.4969958  0.2499287  0.1188865
## RAD        0.4647412 -0.44441282  0.4886763 -0.3816262 -0.1979240
## TAX        0.4608530 -0.44180801  0.5439934 -0.4685359 -0.2736867
## PTRATIO    1.0000000 -0.17738330  0.3740443 -0.5077867 -0.4434247
## B         -0.1773833  1.00000000 -0.3660869  0.3334608  0.1551370
## LSTAT      0.3740443 -0.36608690  1.0000000 -0.7376627 -0.4699108
## MEDV      -0.5077867  0.33346082 -0.7376627  1.0000000  0.7897888
## CAT..MEDV -0.4434247  0.15513696 -0.4699108  0.7897888  1.0000000