# 2. Análisis exploratorio en R

# 1. LOAD DATA

# Load the built-in USArrests dataset into the workspace.
data("USArrests")
# The help page is only useful to a person at the console, so open it only
# in interactive sessions.
if (interactive()) {
  ?USArrests
}
## starting httpd help server ... done
# Working copy of the dataset; the statements below operate on `data`.
# NOTE: this name is shared with the `data()` function called above.
data <- USArrests

# View() opens a spreadsheet-style viewer that needs a GUI; guard it so a
# batch run (e.g. Rscript) is not interrupted when no viewer is available.
if (interactive()) {
  View(data)
}

# 2. DATA EXPLORATION (EDA)

# Type of the object
class(data)
## [1] "data.frame"
# Number of rows
nrow(data)
## [1] 50
# Number of columns
ncol(data)
## [1] 4
# Dimensions of the data (row and column counts in one call), i.e. its size
dim(data)
## [1] 50  4

# Variable names
names(data)
## [1] "Murder"   "Assault"  "UrbanPop" "Rape"
# Alternative way to get the variable names
colnames(data)
## [1] "Murder"   "Assault"  "UrbanPop" "Rape"
# First 6 cases of the data
head(data, n = 6L)
##            Murder Assault UrbanPop Rape
## Alabama      13.2     236       58 21.2
## Alaska       10.0     263       48 44.5
## Arizona       8.1     294       80 31.0
## Arkansas      8.8     190       50 19.5
## California    9.0     276       91 40.6
## Colorado      7.9     204       78 38.7
# Last 6 cases of the data
tail(data, n = 6L)
##               Murder Assault UrbanPop Rape
## Vermont          2.2      48       32 11.2
## Virginia         8.5     156       63 20.7
## Washington       4.0     145       73 26.2
## West Virginia    5.7      81       39  9.3
## Wisconsin        2.6      53       66 10.8
## Wyoming          6.8     161       60 15.6
# Attributes of the data
attributes(data)
## $names
## [1] "Murder"   "Assault"  "UrbanPop" "Rape"    
## 
## $class
## [1] "data.frame"
## 
## $row.names
##  [1] "Alabama"        "Alaska"         "Arizona"        "Arkansas"      
##  [5] "California"     "Colorado"       "Connecticut"    "Delaware"      
##  [9] "Florida"        "Georgia"        "Hawaii"         "Idaho"         
## [13] "Illinois"       "Indiana"        "Iowa"           "Kansas"        
## [17] "Kentucky"       "Louisiana"      "Maine"          "Maryland"      
## [21] "Massachusetts"  "Michigan"       "Minnesota"      "Mississippi"   
## [25] "Missouri"       "Montana"        "Nebraska"       "Nevada"        
## [29] "New Hampshire"  "New Jersey"     "New Mexico"     "New York"      
## [33] "North Carolina" "North Dakota"   "Ohio"           "Oklahoma"      
## [37] "Oregon"         "Pennsylvania"   "Rhode Island"   "South Carolina"
## [41] "South Dakota"   "Tennessee"      "Texas"          "Utah"          
## [45] "Vermont"        "Virginia"       "Washington"     "West Virginia" 
## [49] "Wisconsin"      "Wyoming"

# 3. INSPECTING AND EXPLORING ROWS AND COLUMNS

# ROWS

# Look at case 15
data[15, ]
##      Murder Assault UrbanPop Rape
## Iowa    2.2      56       57 11.3
# A contiguous range of cases
data[26:30, ]
##               Murder Assault UrbanPop Rape
## Montana          6.0     109       53 16.4
## Nebraska         4.3     102       62 16.5
## Nevada          12.2     252       81 46.0
## New Hampshire    2.1      57       56  9.5
## New Jersey       7.4     159       89 18.8
# Store a single case as its own data frame
fila15 <- data[15, ]
fila15
##      Murder Assault UrbanPop Rape
## Iowa    2.2      56       57 11.3
# Store a subset of cases
fila26_27_28_29_30 <- data[26:30, ]
fila26_27_28_29_30
##               Murder Assault UrbanPop Rape
## Montana          6.0     109       53 16.4
## Nebraska         4.3     102       62 16.5
## Nevada          12.2     252       81 46.0
## New Hampshire    2.1      57       56  9.5
## New Jersey       7.4     159       89 18.8
# Store non-contiguous cases picked by position
fila1_2_5 <- data[c(1, 2, 5), ]
fila1_2_5
##            Murder Assault UrbanPop Rape
## Alabama      13.2     236       58 21.2
## Alaska       10.0     263       48 44.5
## California    9.0     276       91 40.6
# Select a case by its row name
fila_Alabama <- data["Alabama", ]
fila_Alabama
##         Murder Assault UrbanPop Rape
## Alabama   13.2     236       58 21.2
# Several cases by row name
data[c("Alabama", "Montana"), ]
##         Murder Assault UrbanPop Rape
## Alabama   13.2     236       58 21.2
## Montana    6.0     109       53 16.4
# The same two cases, this time by position
data[c(1, 26), ]
##         Murder Assault UrbanPop Rape
## Alabama   13.2     236       58 21.2
## Montana    6.0     109       53 16.4
# Drop cases 3 and 6 using negative indices
data[-c(3, 6), ]
##                Murder Assault UrbanPop Rape
## Alabama          13.2     236       58 21.2
## Alaska           10.0     263       48 44.5
## Arkansas          8.8     190       50 19.5
## California        9.0     276       91 40.6
## Connecticut       3.3     110       77 11.1
## Delaware          5.9     238       72 15.8
## Florida          15.4     335       80 31.9
## Georgia          17.4     211       60 25.8
## Hawaii            5.3      46       83 20.2
## Idaho             2.6     120       54 14.2
## Illinois         10.4     249       83 24.0
## Indiana           7.2     113       65 21.0
## Iowa              2.2      56       57 11.3
## Kansas            6.0     115       66 18.0
## Kentucky          9.7     109       52 16.3
## Louisiana        15.4     249       66 22.2
## Maine             2.1      83       51  7.8
## Maryland         11.3     300       67 27.8
## Massachusetts     4.4     149       85 16.3
## Michigan         12.1     255       74 35.1
## Minnesota         2.7      72       66 14.9
## Mississippi      16.1     259       44 17.1
## Missouri          9.0     178       70 28.2
## Montana           6.0     109       53 16.4
## Nebraska          4.3     102       62 16.5
## Nevada           12.2     252       81 46.0
## New Hampshire     2.1      57       56  9.5
## New Jersey        7.4     159       89 18.8
## New Mexico       11.4     285       70 32.1
## New York         11.1     254       86 26.1
## North Carolina   13.0     337       45 16.1
## North Dakota      0.8      45       44  7.3
## Ohio              7.3     120       75 21.4
## Oklahoma          6.6     151       68 20.0
## Oregon            4.9     159       67 29.3
## Pennsylvania      6.3     106       72 14.9
## Rhode Island      3.4     174       87  8.3
## South Carolina   14.4     279       48 22.5
## South Dakota      3.8      86       45 12.8
## Tennessee        13.2     188       59 26.9
## Texas            12.7     201       80 25.5
## Utah              3.2     120       80 22.9
## Vermont           2.2      48       32 11.2
## Virginia          8.5     156       63 20.7
## Washington        4.0     145       73 26.2
## West Virginia     5.7      81       39  9.3
## Wisconsin         2.6      53       66 10.8
## Wyoming           6.8     161       60 15.6
# Keep every case except 3 and 6 in a new data frame, then print it
fila_menos_3_6 <- data[-c(3, 6), ]
fila_menos_3_6
##                Murder Assault UrbanPop Rape
## Alabama          13.2     236       58 21.2
## Alaska           10.0     263       48 44.5
## Arkansas          8.8     190       50 19.5
## California        9.0     276       91 40.6
## Connecticut       3.3     110       77 11.1
## Delaware          5.9     238       72 15.8
## Florida          15.4     335       80 31.9
## Georgia          17.4     211       60 25.8
## Hawaii            5.3      46       83 20.2
## Idaho             2.6     120       54 14.2
## Illinois         10.4     249       83 24.0
## Indiana           7.2     113       65 21.0
## Iowa              2.2      56       57 11.3
## Kansas            6.0     115       66 18.0
## Kentucky          9.7     109       52 16.3
## Louisiana        15.4     249       66 22.2
## Maine             2.1      83       51  7.8
## Maryland         11.3     300       67 27.8
## Massachusetts     4.4     149       85 16.3
## Michigan         12.1     255       74 35.1
## Minnesota         2.7      72       66 14.9
## Mississippi      16.1     259       44 17.1
## Missouri          9.0     178       70 28.2
## Montana           6.0     109       53 16.4
## Nebraska          4.3     102       62 16.5
## Nevada           12.2     252       81 46.0
## New Hampshire     2.1      57       56  9.5
## New Jersey        7.4     159       89 18.8
## New Mexico       11.4     285       70 32.1
## New York         11.1     254       86 26.1
## North Carolina   13.0     337       45 16.1
## North Dakota      0.8      45       44  7.3
## Ohio              7.3     120       75 21.4
## Oklahoma          6.6     151       68 20.0
## Oregon            4.9     159       67 29.3
## Pennsylvania      6.3     106       72 14.9
## Rhode Island      3.4     174       87  8.3
## South Carolina   14.4     279       48 22.5
## South Dakota      3.8      86       45 12.8
## Tennessee        13.2     188       59 26.9
## Texas            12.7     201       80 25.5
## Utah              3.2     120       80 22.9
## Vermont           2.2      48       32 11.2
## Virginia          8.5     156       63 20.7
## Washington        4.0     145       73 26.2
## West Virginia     5.7      81       39  9.3
## Wisconsin         2.6      53       66 10.8
## Wyoming           6.8     161       60 15.6
# First 6 cases of the reduced data frame
head(fila_menos_3_6, n = 6L)
##             Murder Assault UrbanPop Rape
## Alabama       13.2     236       58 21.2
## Alaska        10.0     263       48 44.5
## Arkansas       8.8     190       50 19.5
## California     9.0     276       91 40.6
## Connecticut    3.3     110       77 11.1
## Delaware       5.9     238       72 15.8
# Last 6 cases of the reduced data frame
tail(fila_menos_3_6, n = 6L)
##               Murder Assault UrbanPop Rape
## Vermont          2.2      48       32 11.2
## Virginia         8.5     156       63 20.7
## Washington       4.0     145       73 26.2
## West Virginia    5.7      81       39  9.3
## Wisconsin        2.6      53       66 10.8
## Wyoming          6.8     161       60 15.6

# COLUMNS

# Values of the 4th variable
data[, 4]
##  [1] 21.2 44.5 31.0 19.5 40.6 38.7 11.1 15.8 31.9 25.8 20.2 14.2 24.0 21.0 11.3
## [16] 18.0 16.3 22.2  7.8 27.8 16.3 35.1 14.9 17.1 28.2 16.4 16.5 46.0  9.5 18.8
## [31] 32.1 26.1 16.1  7.3 21.4 20.0 29.3 14.9  8.3 22.5 12.8 26.9 25.5 22.9 11.2
## [46] 20.7 26.2  9.3 10.8 15.6
# Values of the 1st variable
data[, 1]
##  [1] 13.2 10.0  8.1  8.8  9.0  7.9  3.3  5.9 15.4 17.4  5.3  2.6 10.4  7.2  2.2
## [16]  6.0  9.7 15.4  2.1 11.3  4.4 12.1  2.7 16.1  9.0  6.0  4.3 12.2  2.1  7.4
## [31] 11.4 11.1 13.0  0.8  7.3  6.6  4.9  6.3  3.4 14.4  3.8 13.2 12.7  3.2  2.2
## [46]  8.5  4.0  5.7  2.6  6.8
# A contiguous range of variables (columns 2 to 4)
data[, 2:4]
##                Assault UrbanPop Rape
## Alabama            236       58 21.2
## Alaska             263       48 44.5
## Arizona            294       80 31.0
## Arkansas           190       50 19.5
## California         276       91 40.6
## Colorado           204       78 38.7
## Connecticut        110       77 11.1
## Delaware           238       72 15.8
## Florida            335       80 31.9
## Georgia            211       60 25.8
## Hawaii              46       83 20.2
## Idaho              120       54 14.2
## Illinois           249       83 24.0
## Indiana            113       65 21.0
## Iowa                56       57 11.3
## Kansas             115       66 18.0
## Kentucky           109       52 16.3
## Louisiana          249       66 22.2
## Maine               83       51  7.8
## Maryland           300       67 27.8
## Massachusetts      149       85 16.3
## Michigan           255       74 35.1
## Minnesota           72       66 14.9
## Mississippi        259       44 17.1
## Missouri           178       70 28.2
## Montana            109       53 16.4
## Nebraska           102       62 16.5
## Nevada             252       81 46.0
## New Hampshire       57       56  9.5
## New Jersey         159       89 18.8
## New Mexico         285       70 32.1
## New York           254       86 26.1
## North Carolina     337       45 16.1
## North Dakota        45       44  7.3
## Ohio               120       75 21.4
## Oklahoma           151       68 20.0
## Oregon             159       67 29.3
## Pennsylvania       106       72 14.9
## Rhode Island       174       87  8.3
## South Carolina     279       48 22.5
## South Dakota        86       45 12.8
## Tennessee          188       59 26.9
## Texas              201       80 25.5
## Utah               120       80 22.9
## Vermont             48       32 11.2
## Virginia           156       63 20.7
## Washington         145       73 26.2
## West Virginia       81       39  9.3
## Wisconsin           53       66 10.8
## Wyoming            161       60 15.6
# Select the Rape variable by name
data$Rape
##  [1] 21.2 44.5 31.0 19.5 40.6 38.7 11.1 15.8 31.9 25.8 20.2 14.2 24.0 21.0 11.3
## [16] 18.0 16.3 22.2  7.8 27.8 16.3 35.1 14.9 17.1 28.2 16.4 16.5 46.0  9.5 18.8
## [31] 32.1 26.1 16.1  7.3 21.4 20.0 29.3 14.9  8.3 22.5 12.8 26.9 25.5 22.9 11.2
## [46] 20.7 26.2  9.3 10.8 15.6
# Cases 1, 2, 3, 4, 5 and 8 of the Rape variable
data$Rape[c(1:5, 8)]
## [1] 21.2 44.5 31.0 19.5 40.6 15.8
# Same selection with every position spelled out
data$Rape[c(1, 2, 3, 4, 5, 8)]
## [1] 21.2 44.5 31.0 19.5 40.6 15.8
# Single cells: row 12 of column 4, then row 12 of column 3
data[12, 4]
## [1] 14.2
data[12, 3]
## [1] 54