##Prerequisites:
library(vip)
Attaching package: ‘vip’
The following object is masked from ‘package:utils’:
vi
##Data
boston <- read_csv("boston.csv")
Rows: 506 Columns: 16── Column specification ────────────────────
Delimiter: ","
dbl (16): lon, lat, cmedv, crim, zn, ind...
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
##Split the data into a test and training set(70-30 split)
test <- testing(spl)
Error: object 'spl' not found
##Check predictor variables correlation
cmedv_cor <- corr_train[ , c("cmedv")] boston_correlation <- cor(boston)
Error: unexpected symbol in "cmedv_cor <- corr_train[ , c("cmedv")] boston_correlation"
##rm has the strongest positive correlation
##Plot the relationship between cmedv and rm

##Train a simple linear regression model with the predictor
variables
##Compute the generalization RMSE for the above model
#Part 2: Multiple Linear Regression
##Compute the generalization RMSE for the model with all predictor
variables.
##Using the full model with all predictor variables, identify the top
5 most influential predictor variables in our model.

LS0tDQp0aXRsZTogIlIgTm90ZWJvb2siDQpvdXRwdXQ6IGh0bWxfbm90ZWJvb2sNCi0tLQ0KDQojI1ByZXJlcXVpc2l0ZXM6DQoNCmBgYHtyfQ0KbGlicmFyeSh0aWR5dmVyc2UpDQpsaWJyYXJ5KHRpZHltb2RlbHMpDQpsaWJyYXJ5KHJlYWRyKQ0KbGlicmFyeSh2aXApDQpgYGANCg0KIyNEYXRhDQoNCmBgYHtyfQ0KYm9zdG9uIDwtIHJlYWRfY3N2KCJib3N0b24uY3N2IikNCmBgYA0KDQojI1NwbGl0IHRoZSBkYXRhIGludG8gYSB0ZXN0IGFuZCB0cmFpbmluZyBzZXQoNzAtMzAgc3BsaXQpDQpgYGB7cn0NCnNldC5zZWVkKDEyMykNCnNwbGl0IDwtIGluaXRpYWxfc3BsaXQoYm9zdG9uLCBwcm9wID0gMC43LCBzdHJhdGEgPSBjbWVkdikNCnRyYWluIDwtIHRyYWluaW5nKHNwbGl0KQ0KdGVzdCA8LSB0ZXN0aW5nKHNwbGl0KQ0KYGBgDQoNCiMjQ2hlY2sgcHJlZGljdG9yIHZhcmlhYmxlcyBjb3JyZWxhdGlvbg0KDQpgYGB7cn0NCg0KY29ycl90cmFpbiA8LSBjb3IodHJhaW4pDQoNCmNtZWR2X2NvciA8LSBjb3JyX3RyYWluWyAsIGMoImNtZWR2IildIGJvc3Rvbl9jb3JyZWxhdGlvbiA8LSBjb3IoYm9zdG9uKQ0KYm9zdG9uX2NvcnJlbGF0aW9uDQpgYGANCmBgYHtyfQ0KYm9zdG9uICU+JQ0KICBzZWxlY3RfaWYoaXMubnVtZXJpYykgJT4lDQogIGNvcigpICU+JQ0KICBhcy5kYXRhLmZyYW1lKCkgJT4lDQogIHNlbGVjdChjbWVkdikNCmBgYA0KDQoNCiMjcm0gaGFzIHRoZSBzdHJvbmdlc3QgcG9zaXRpdmUgY29ycmVsYXRpb24NCg0KIyNQbG90IHRoZSByZWxhdGlvbnNoaXAgYmV0d2VlbiBjbWVkdiBhbmQgcm0NCg0KYGBge3J9DQp0cmFpbiAlPiUNCiAgZ2dwbG90KGFlcyhjbWVkdiwgcm0pKSArDQogIGdlb21fcG9pbnQoYWxwaGEgPSAwLjIpICsNCiAgZ2VvbV9zbW9vdGgobWV0aG9kID0gImxtIiwgc2UgPSBGQUxTRSkNCmBgYA0KDQojI1RyYWluIGEgc2ltcGxlIGxpbmVhciByZWdyZXNzaW9uIG1vZGVsIHdpdGggdGhlIHByZWRpY3RvciB2YXJpYWJsZXMNCg0KYGBge3J9DQpib3N0b25fbW9kZWwgPC0gbGluZWFyX3JlZygpICU+JQ0KICBmaXQoY21lZHYgfiBybSwgZGF0YSA9IHRyYWluKQ0KdGlkeShib3N0b25fbW9kZWwpDQpgYGANCg0KIyNDb21wdXRlIHRoZSBnZW5lcmFsaXphdGlvbiBSTVNFIGZvciB0aGUgYWJvdmUgbW9kZWwNCg0KYGBge3J9DQpib3N0b25fbW9kZWwgJT4lDQogIHByZWRpY3QodGVzdCkgJT4lDQogIGJpbmRfY29scyh0ZXN0KSAlPiUNCiAgcm1zZSh0cnV0aCA9IGNtZWR2LCBlc3RpbWF0ZSA9IC5wcmVkKQ0KYGBgDQojUGFydCAyOiBNdWx0aXBsZSBMaW5lYXIgUmVncmVzc2lvbg0KDQpgYGB7cn0NCmJvc19tb2RlIDwtIGxpbmVhcl9yZWcoKSAlPiUNCiAgZml0KGNtZWR2IH4gLiwgZGF0YSA9IHRyYWluKQ0KdGlkeShib3NfbW9kZSkNCg0KY29uZmludChib3NfbW9kZSRmaXQpDQpgYGANCiMjQ29tcHV0ZSB0aGUgZ2VuZXJhbGl6YXRpb24gUk1TRSBmb3IgdGhlIG1vZGVsIHdpdGggYWxsIHByZWRpY3RvciB2YXJpYWJsZXMuIA0KDQpgYGB7cn0NCmJvc19tb2RlICU+JQ0KICBwcmVkaWN0KHRlc3QpICU+JQ0KICBiaW5kX2NvbHModGVzdCkgJT4lDQogIHJtc2UodHJ1dGggPSBjbWVkdiwgZXN0aW1hdGUgPSAucHJlZCkNCg0KYGBgDQoNCiMjVXNpbmcgdGhlIGZ1bGwgbW9kZWwgd2l0aCBhbGwgcHJlZGljdG9yIHZhcmlhYmxlcywgaWRlbnRpZnkgdGhlIHRvcCA1IG1vc3QgaW5mbHVlbnRpYWwgcHJlZGljdG9yIHZhcmlhYmxlcyBpbiBvdXIgbW9kZWwuDQoNCmBgYHtyfQ0KYm9zX21vZGUgJT4lDQogIHZpcDo6dmlwKDUpDQpgYGA=