Teoría

Una Red Neuronal Artificial (ANN, por sus siglas en inglés) modela la relación entre un conjunto de entradas y una salida, aprendiendo dicha relación a partir de datos de ejemplo para resolver un problema de aprendizaje.

Instalar paquetes y llamar librerías

#install.packages("neuralnet") # Redes Neuronales
library(neuralnet)
#install.packages("caret") # Entrenamiento de ML
library(caret)
#install.packages("ggplot2")
library(ggplot2)

Importar la base de datos

# Read the raw Boston Housing CSV, then standardize every column with scale()
# (its defaults, spelled out here: subtract the column mean, divide by the
# column standard deviation). scale() returns a matrix, so the result is
# converted back to a data frame.
# NOTE(review): the path is absolute and machine-specific; the script only
# runs where this exact file exists.
# NOTE(review): all rows are standardized together before the train/test
# split, so test rows contribute to the centering/scaling statistics.
boston_borrador <- read.csv(
  file = "/Users/osvaldotello/Desktop/BostonHousing.csv"
)
boston <- as.data.frame(
  scale(x = boston_borrador, center = TRUE, scale = TRUE)
)

Entender la base de datos

# Per-column summary statistics of the standardized data frame.
summary(boston)
##       crim                 zn               indus              chas        
##  Min.   :-0.419367   Min.   :-0.48724   Min.   :-1.5563   Min.   :-0.2723  
##  1st Qu.:-0.410563   1st Qu.:-0.48724   1st Qu.:-0.8668   1st Qu.:-0.2723  
##  Median :-0.390280   Median :-0.48724   Median :-0.2109   Median :-0.2723  
##  Mean   : 0.000000   Mean   : 0.00000   Mean   : 0.0000   Mean   : 0.0000  
##  3rd Qu.: 0.007389   3rd Qu.: 0.04872   3rd Qu.: 1.0150   3rd Qu.:-0.2723  
##  Max.   : 9.924110   Max.   : 3.80047   Max.   : 2.4202   Max.   : 3.6648  
##       nox                rm               age               dis         
##  Min.   :-1.4644   Min.   :-3.8764   Min.   :-2.3331   Min.   :-1.2658  
##  1st Qu.:-0.9121   1st Qu.:-0.5681   1st Qu.:-0.8366   1st Qu.:-0.8049  
##  Median :-0.1441   Median :-0.1084   Median : 0.3171   Median :-0.2790  
##  Mean   : 0.0000   Mean   : 0.0000   Mean   : 0.0000   Mean   : 0.0000  
##  3rd Qu.: 0.5981   3rd Qu.: 0.4823   3rd Qu.: 0.9059   3rd Qu.: 0.6617  
##  Max.   : 2.7296   Max.   : 3.5515   Max.   : 1.1164   Max.   : 3.9566  
##       rad               tax             ptratio              b          
##  Min.   :-0.9819   Min.   :-1.3127   Min.   :-2.7047   Min.   :-3.9033  
##  1st Qu.:-0.6373   1st Qu.:-0.7668   1st Qu.:-0.4876   1st Qu.: 0.2049  
##  Median :-0.5225   Median :-0.4642   Median : 0.2746   Median : 0.3808  
##  Mean   : 0.0000   Mean   : 0.0000   Mean   : 0.0000   Mean   : 0.0000  
##  3rd Qu.: 1.6596   3rd Qu.: 1.5294   3rd Qu.: 0.8058   3rd Qu.: 0.4332  
##  Max.   : 1.6596   Max.   : 1.7964   Max.   : 1.6372   Max.   : 0.4406  
##      lstat              medv        
##  Min.   :-1.5296   Min.   :-1.9063  
##  1st Qu.:-0.7986   1st Qu.:-0.5989  
##  Median :-0.1811   Median :-0.1449  
##  Mean   : 0.0000   Mean   : 0.0000  
##  3rd Qu.: 0.6024   3rd Qu.: 0.2683  
##  Max.   : 3.5453   Max.   : 2.9865
# Compact structure listing: dimensions and the type of each column.
str(boston)
## 'data.frame':    506 obs. of  14 variables:
##  $ crim   : num  -0.419 -0.417 -0.417 -0.416 -0.412 ...
##  $ zn     : num  0.285 -0.487 -0.487 -0.487 -0.487 ...
##  $ indus  : num  -1.287 -0.593 -0.593 -1.306 -1.306 ...
##  $ chas   : num  -0.272 -0.272 -0.272 -0.272 -0.272 ...
##  $ nox    : num  -0.144 -0.74 -0.74 -0.834 -0.834 ...
##  $ rm     : num  0.413 0.194 1.281 1.015 1.227 ...
##  $ age    : num  -0.12 0.367 -0.266 -0.809 -0.511 ...
##  $ dis    : num  0.14 0.557 0.557 1.077 1.077 ...
##  $ rad    : num  -0.982 -0.867 -0.867 -0.752 -0.752 ...
##  $ tax    : num  -0.666 -0.986 -0.986 -1.105 -1.105 ...
##  $ ptratio: num  -1.458 -0.303 -0.303 0.113 0.113 ...
##  $ b      : num  0.441 0.441 0.396 0.416 0.441 ...
##  $ lstat  : num  -1.074 -0.492 -1.208 -1.36 -1.025 ...
##  $ medv   : num  0.16 -0.101 1.323 1.182 1.486 ...
# Print the first rows of the standardized data frame.
head(boston)
##         crim         zn      indus       chas        nox        rm        age
## 1 -0.4193669  0.2845483 -1.2866362 -0.2723291 -0.1440749 0.4132629 -0.1198948
## 2 -0.4169267 -0.4872402 -0.5927944 -0.2723291 -0.7395304 0.1940824  0.3668034
## 3 -0.4169290 -0.4872402 -0.5927944 -0.2723291 -0.7395304 1.2814456 -0.2655490
## 4 -0.4163384 -0.4872402 -1.3055857 -0.2723291 -0.8344581 1.0152978 -0.8090878
## 5 -0.4120741 -0.4872402 -1.3055857 -0.2723291 -0.8344581 1.2273620 -0.5106743
## 6 -0.4166314 -0.4872402 -1.3055857 -0.2723291 -0.8344581 0.2068916 -0.3508100
##        dis        rad        tax    ptratio         b      lstat       medv
## 1 0.140075 -0.9818712 -0.6659492 -1.4575580 0.4406159 -1.0744990  0.1595278
## 2 0.556609 -0.8670245 -0.9863534 -0.3027945 0.4406159 -0.4919525 -0.1014239
## 3 0.556609 -0.8670245 -0.9863534 -0.3027945 0.3960351 -1.2075324  1.3229375
## 4 1.076671 -0.7521778 -1.1050216  0.1129203 0.4157514 -1.3601708  1.1815886
## 5 1.076671 -0.7521778 -1.1050216  0.1129203 0.4406159 -1.0254866  1.4860323
## 6 1.076671 -0.7521778 -1.1050216  0.1129203 0.4101651 -1.0422909  0.6705582

Partir la base de datos

# Fix the RNG seed so the train/test partition is reproducible.
set.seed(123)

# Ask caret for the training row indices (p = 0.8 of the data), computed from
# the unscaled medv column. list = FALSE returns the indices as a matrix
# instead of a list.
renglones_entrenamiento_boston <- createDataPartition(
  y = boston_borrador$medv,
  p = 0.8,
  list = FALSE
)

# Training rows come from the standardized data; the test set is every
# remaining row (negative indexing drops the training rows).
entrenamiento_boston <- boston[renglones_entrenamiento_boston, ]
prueba_boston <- boston[-renglones_entrenamiento_boston, ]

Generar el Modelo

# Fit a neural network that predicts medv from every other column of the
# training set. The hidden-layer layout is left at the neuralnet default.
# linear.output = TRUE is set for this regression target, and stepmax is
# raised to 1e6 to give training more steps to converge.
modelo_boston <- neuralnet(
  medv ~ .,
  data = entrenamiento_boston,
  linear.output = TRUE,
  stepmax = 1e6
)

# rep = "best" makes plot.nn draw the lowest-error repetition on the current
# graphics device. Without `rep`, each repetition is plotted in a separate
# new window, which knitted R Markdown output does not capture. Only one
# repetition is trained here, so the plotted network is the same.
plot(modelo_boston, rep = "best")

Predecir con la Red Neuronal

# Predict medv for the held-out rows.
# predict() replaces the deprecated neuralnet::compute(); it returns the
# network output directly as a one-column matrix (the former $net.result).
# The input columns are selected by name with setdiff(), so a missing "medv"
# column cannot silently produce an empty selection the way
# `-which(names(...) == "medv")` does. drop = FALSE keeps a data frame.
columnas_entrada <- setdiff(names(prueba_boston), "medv")
prediccion <- predict(
  modelo_boston,
  newdata = prueba_boston[, columnas_entrada, drop = FALSE]
)
real <- prueba_boston$medv

# Pair observed and predicted values. Both are in standardized units because
# the model was trained on the scaled data frame.
boston_resultados <- data.frame(Real = real, Predicción = prediccion)

# Scatter plot of predicted vs. observed values; the red identity line
# (slope 1, intercept 0) marks where a perfect prediction would fall.
ggplot(boston_resultados, aes(x = Real, y = Predicción)) +
  geom_point(color = "blue") +
  geom_abline(slope = 1, intercept = 0, color = "red") +
  theme_minimal() +
  ggtitle("Predicción vs. Valores Reales")

LS0tCnRpdGxlOiAiQm9zdG9uIgphdXRob3I6ICJPc3ZhbGRvIFRlbGxvIC0gQTAxMjg1NjQyIgpkYXRlOiAiMjAyNS0wMy0wMiIKb3V0cHV0OiAKICBodG1sX2RvY3VtZW50OgogICAgdG9jOiBUUlVFCiAgICB0b2NfZmxvYXQ6IFRSVUUKICAgIGNvZGVfZG93bmxvYWQ6IFRSVUUKICAgIHRoZW1lOiAic3BhY2VsYWIiCiAgICBoaWdobGlnaHQ6ICJrYXRlIgotLS0KCiFbXSgvVXNlcnMvb3N2YWxkb3RlbGxvL0Rlc2t0b3AvYm9zdG9uLW1hc3NhY2h1c2V0dHMtQk9TVE9OVEcwMjIxLTcxOWFlZjJlZWIxYzQ5MjliNmM4Mzk3MTVlMzRhNjllLmpwZykKCiMgPHNwYW4gc3R5bGU9ImNvbG9yOiByZWQ7Ij5UZW9yw61hPC9zcGFuPgpVbmEgKipSZWQgTmV1cm9uYWwgQXJ0aWZpY2lhbCAoQU5OKSoqIG1vZGVsYSBsYSByZWxhY2nDs24gZW50cmUgdW4gY29uanVudG8gZGUgZW50cmFkYXMgeSB1bmEgc2FsaWRhLCByZXNvbHZpZW5kbyB1biBwcm9ibGVtYSBkZSBhcHJlbmRpemFqZS4gIAoKIyA8c3BhbiBzdHlsZT0iY29sb3I6IHJlZDsiPkluc3RhbGFyIHBhcXVldGVzIHkgbGxhbWFyIGxpYnJlcsOtYXM8L3NwYW4+CmBgYHtyIG1lc3NhZ2U9RkFMU0UsIHdhcm5pbmc9RkFMU0V9CiNpbnN0YWxsLnBhY2thZ2VzKCJuZXVyYWxuZXQiKSAjIFJlZGVzIE5ldXJvbmFsZXMKbGlicmFyeShuZXVyYWxuZXQpCiNpbnN0YWxsLnBhY2thZ2VzKCJjYXJldCIpICMgRW50cmVuYW1pZW50byBkZSBNTApsaWJyYXJ5KGNhcmV0KQojaW5zdGFsbC5wYWNrYWdlcygiZ2dwbG90MiIpCmxpYnJhcnkoZ2dwbG90MikKYGBgCgojIDxzcGFuIHN0eWxlPSJjb2xvcjogcmVkOyI+SW1wb3J0YXIgbGEgYmFzZSBkZSBkYXRvczwvc3Bhbj4KYGBge3J9CmJvc3Rvbl9ib3JyYWRvciA8LSByZWFkLmNzdigiL1VzZXJzL29zdmFsZG90ZWxsby9EZXNrdG9wL0Jvc3RvbkhvdXNpbmcuY3N2IikKYm9zdG9uIDwtIGFzLmRhdGEuZnJhbWUoc2NhbGUoYm9zdG9uX2JvcnJhZG9yKSkKYGBgCgojIDxzcGFuIHN0eWxlPSJjb2xvcjogcmVkOyI+RW50ZW5kZXIgbGEgYmFzZSBkZSBkYXRvczwvc3Bhbj4KYGBge3J9CnN1bW1hcnkoYm9zdG9uKQpzdHIoYm9zdG9uKQpoZWFkKGJvc3RvbikKYGBgCgojIDxzcGFuIHN0eWxlPSJjb2xvcjogcmVkOyI+UGFydGlyIGxhIGJhc2UgZGUgZGF0b3M8L3NwYW4+CmBgYHtyfQpzZXQuc2VlZCgxMjMpCnJlbmdsb25lc19lbnRyZW5hbWllbnRvX2Jvc3RvbiA8LSBjcmVhdGVEYXRhUGFydGl0aW9uKGJvc3Rvbl9ib3JyYWRvciRtZWR2LCBwPTAuOCwgbGlzdD1GQUxTRSkKZW50cmVuYW1pZW50b19ib3N0b24gPC0gYm9zdG9uW3Jlbmdsb25lc19lbnRyZW5hbWllbnRvX2Jvc3RvbiwgXQpwcnVlYmFfYm9zdG9uIDwtIGJvc3RvblstcmVuZ2xvbmVzX2VudHJlbmFtaWVudG9fYm9zdG9uLCBdCmBgYAoKIyA8c3BhbiBzdHlsZT0iY29sb3I6IHJlZDsiPkdlbmVyYXIgZWwgTW9kZWxvPC9zcGFuPgpgYGB7cn0KbW9kZWxvX2Jvc3RvbiA8LW5ldXJhbG5ldChtZWR2
IH4gLiwgZGF0YT1lbnRyZW5hbWllbnRvX2Jvc3RvbiwgbGluZWFyLm91dHB1dD1UUlVFLCBzdGVwbWF4PTFlNikKcGxvdChtb2RlbG9fYm9zdG9uKQpgYGAKCiMgPHNwYW4gc3R5bGU9ImNvbG9yOiByZWQ7Ij5QcmVkZWNpciBjb24gbGEgUmVkIE5ldXJvbmFsPC9zcGFuPgpgYGB7cn0KcHJlZGljY2lvbiA8LSBjb21wdXRlKG1vZGVsb19ib3N0b24sIHBydWViYV9ib3N0b25bLCAtd2hpY2gobmFtZXMocHJ1ZWJhX2Jvc3RvbikgPT0gIm1lZHYiKV0pJG5ldC5yZXN1bHQKcmVhbCA8LSBwcnVlYmFfYm9zdG9uJG1lZHYKICAKYm9zdG9uX3Jlc3VsdGFkb3MgPC0gZGF0YS5mcmFtZShSZWFsID0gcmVhbCwgUHJlZGljY2nDs24gPSBwcmVkaWNjaW9uKQoKZ2dwbG90KGJvc3Rvbl9yZXN1bHRhZG9zLCBhZXMoeD1SZWFsLCB5PVByZWRpY2Npw7NuKSkgKwogIGdlb21fcG9pbnQoY29sb3I9ImJsdWUiKSArCiAgZ2VvbV9hYmxpbmUoc2xvcGU9MSwgaW50ZXJjZXB0PTAsIGNvbG9yPSJyZWQiKSArCiAgdGhlbWVfbWluaW1hbCgpICsKICBnZ3RpdGxlKCJQcmVkaWNjacOzbiB2cy4gVmFsb3JlcyBSZWFsZXMiKQpgYGAKCg==