PRACTICA NUMERO 4

Accidentes por mes

library (readr) # Libreria

bicis2017 <- read.csv("https://raw.githubusercontent.com/rpizarrog/Curso-Titulacion-Data-Science-/master/2019/Datos/AccidentesBicicletas_2017.csv", encoding = "UTF-8")

class(bicis2017)  # Devuelve el tipo de datos. Queremos un data.frame
## [1] "data.frame"
# VAMOS A TRABAJAR CON bicis2017

names(bicis2017) # El nombre de aributo de FECHA está extraño
##  [1] "X.U.FEFF.FECHA"     "RANGO.HORARIO"      "DIA.SEMANA"        
##  [4] "DISTRITO"           "LUGAR.ACCIDENTE"    "Nº"                
##  [7] "Nº.PARTE"           "CPFA.Granizo"       "CPFA.Hielo"        
## [10] "CPFA.Lluvia"        "CPFA.Niebla"        "CPFA.Seco"         
## [13] "CPFA.Nieve"         "CPSV.Mojada"        "CPSV.Aceite"       
## [16] "CPSV.Barro"         "CPSV.Grava.Suelta"  "CPSV.Hielo"        
## [19] "CPSV.Seca.Y.Limpia" "Nº.VICTIMAS.."      "TIPO.ACCIDENTE"    
## [22] "Tipo.Vehiculo"      "TIPO.PERSONA"       "SEXO"              
## [25] "LESIVIDAD"          "Tramo.Edad"
# Cambiamos el nombre de es atributo de bicis2017 y al 6, 7 y 20
columnas <- colnames(bicis2017)
columnas[1] <- "FECHA" # Cambia el nombre de columna
columnas[6] <- "NO" # Cambia el nombre de columna
columnas[7] <- "NO.PARTE" # Cambia el nombre de columna
columnas[20] <- "NO.VICTIMAS" # Cambia el nombre de columna
colnames(bicis2017) <- columnas
names(bicis2017) # Ahora como se ven los nombres de columnas
##  [1] "FECHA"              "RANGO.HORARIO"      "DIA.SEMANA"        
##  [4] "DISTRITO"           "LUGAR.ACCIDENTE"    "NO"                
##  [7] "NO.PARTE"           "CPFA.Granizo"       "CPFA.Hielo"        
## [10] "CPFA.Lluvia"        "CPFA.Niebla"        "CPFA.Seco"         
## [13] "CPFA.Nieve"         "CPSV.Mojada"        "CPSV.Aceite"       
## [16] "CPSV.Barro"         "CPSV.Grava.Suelta"  "CPSV.Hielo"        
## [19] "CPSV.Seca.Y.Limpia" "NO.VICTIMAS"        "TIPO.ACCIDENTE"    
## [22] "Tipo.Vehiculo"      "TIPO.PERSONA"       "SEXO"              
## [25] "LESIVIDAD"          "Tramo.Edad"

Cambiando el comando de la columna FECHA como date y agregando

una nueva columna llamda MES de tipo numerico, que define el numero de mes de la fecha

# Limpiar y depurar el campo FECHA
bicis2017$FECHA <- as.Date(bicis2017$FECHA, "%d/%m/%Y")
bicis2017$MES <- as.numeric(format(bicis2017$FECHA,format="%m"))

#Así quedaron los datos

#bicis2017

#Vamos a encontrar los accidentes por mes

enero <- subset(bicis2017, MES == 1)  # LOS DE ENERO
febrero <- subset(bicis2017, MES == 2)  # LOS DE FEBRERO
marzo <- subset(bicis2017, MES == 3)  # LOS DE MARZO
abril <- subset(bicis2017, MES == 4)  # LOS DE ABRIL
mayo <- subset(bicis2017, MES == 5)  # LOS DE MAYO
junio <- subset(bicis2017, MES == 6)  # LOS DE JUNIO
julio <- subset(bicis2017, MES == 7)  # LOS DE JULIO
agosto <- subset(bicis2017, MES == 8)  # LOS DE AGOSTO
septiembre <- subset(bicis2017, MES == 9)  # LOS DE SEPTIEMBRE
octubre <- subset(bicis2017, MES == 10)  # LOS DE OCTUBRE
noviembre <- subset(bicis2017, MES == 11)  # LOS DE NOVIEMBRE
diciembre <- subset(bicis2017, MES == 12)  # LOS DE DICIEMBRE

###Mostramos algunos meses, sólo el campo FECHA

# ENERO
enero$FECHA
##  [1] "2017-01-01" "2017-01-02" "2017-01-03" "2017-01-04" "2017-01-05"
##  [6] "2017-01-05" "2017-01-05" "2017-01-05" "2017-01-06" "2017-01-06"
## [11] "2017-01-07" "2017-01-07" "2017-01-07" "2017-01-08" "2017-01-08"
## [16] "2017-01-09" "2017-01-09" "2017-01-09" "2017-01-10" "2017-01-10"
## [21] "2017-01-10" "2017-01-12" "2017-01-12" "2017-01-12" "2017-01-12"
## [26] "2017-01-13" "2017-01-13" "2017-01-15" "2017-01-19" "2017-01-19"
## [31] "2017-01-20" "2017-01-20" "2017-01-21" "2017-01-21" "2017-01-22"
## [36] "2017-01-24" "2017-01-24" "2017-01-25" "2017-01-25" "2017-01-26"
## [41] "2017-01-26" "2017-01-27" "2017-01-29" "2017-01-31" "2017-01-31"
# FEBFRERO
febrero$FECHA
##  [1] "2017-02-01" "2017-02-02" "2017-02-02" "2017-02-02" "2017-02-03"
##  [6] "2017-02-03" "2017-02-03" "2017-02-04" "2017-02-04" "2017-02-05"
## [11] "2017-02-06" "2017-02-07" "2017-02-07" "2017-02-07" "2017-02-08"
## [16] "2017-02-09" "2017-02-10" "2017-02-10" "2017-02-10" "2017-02-12"
## [21] "2017-02-13" "2017-02-14" "2017-02-14" "2017-02-14" "2017-02-14"
## [26] "2017-02-15" "2017-02-15" "2017-02-16" "2017-02-16" "2017-02-17"
## [31] "2017-02-18" "2017-02-18" "2017-02-19" "2017-02-19" "2017-02-19"
## [36] "2017-02-20" "2017-02-22" "2017-02-24" "2017-02-25" "2017-02-25"
## [41] "2017-02-25" "2017-02-25" "2017-02-27" "2017-02-28" "2017-02-28"
## [46] "2017-02-28" "2017-02-28" "2017-02-28" "2017-02-28"
# MARZO
marzo$FECHA
##  [1] "2017-03-01" "2017-03-02" "2017-03-03" "2017-03-03" "2017-03-03"
##  [6] "2017-03-05" "2017-03-06" "2017-03-07" "2017-03-07" "2017-03-07"
## [11] "2017-03-07" "2017-03-08" "2017-03-08" "2017-03-08" "2017-03-09"
## [16] "2017-03-09" "2017-03-09" "2017-03-09" "2017-03-10" "2017-03-10"
## [21] "2017-03-10" "2017-03-10" "2017-03-10" "2017-03-10" "2017-03-10"
## [26] "2017-03-12" "2017-03-13" "2017-03-14" "2017-03-14" "2017-03-15"
## [31] "2017-03-15" "2017-03-16" "2017-03-16" "2017-03-17" "2017-03-17"
## [36] "2017-03-17" "2017-03-18" "2017-03-19" "2017-03-19" "2017-03-20"
## [41] "2017-03-20" "2017-03-20" "2017-03-21" "2017-03-21" "2017-03-21"
## [46] "2017-03-21" "2017-03-21" "2017-03-22" "2017-03-23" "2017-03-23"
## [51] "2017-03-24" "2017-03-25" "2017-03-26" "2017-03-27" "2017-03-28"
## [56] "2017-03-29" "2017-03-30" "2017-03-31" "2017-03-31" "2017-03-31"
# ABRIL
abril$FECHA
##  [1] "2017-04-01" "2017-04-02" "2017-04-02" "2017-04-02" "2017-04-03"
##  [6] "2017-04-03" "2017-04-04" "2017-04-05" "2017-04-05" "2017-04-06"
## [11] "2017-04-06" "2017-04-07" "2017-04-07" "2017-04-07" "2017-04-07"
## [16] "2017-04-07" "2017-04-07" "2017-04-08" "2017-04-09" "2017-04-09"
## [21] "2017-04-09" "2017-04-10" "2017-04-10" "2017-04-10" "2017-04-11"
## [26] "2017-04-12" "2017-04-12" "2017-04-12" "2017-04-13" "2017-04-13"
## [31] "2017-04-13" "2017-04-14" "2017-04-15" "2017-04-15" "2017-04-15"
## [36] "2017-04-15" "2017-04-16" "2017-04-17" "2017-04-20" "2017-04-21"
## [41] "2017-04-21" "2017-04-22" "2017-04-22" "2017-04-22" "2017-04-23"
## [46] "2017-04-23" "2017-04-23" "2017-04-23" "2017-04-24" "2017-04-24"
## [51] "2017-04-25" "2017-04-26" "2017-04-27" "2017-04-28"
# MAYO
mayo$FECHA
##  [1] "2017-05-01" "2017-05-01" "2017-05-01" "2017-05-02" "2017-05-02"
##  [6] "2017-05-03" "2017-05-03" "2017-05-04" "2017-05-04" "2017-05-04"
## [11] "2017-05-05" "2017-05-06" "2017-05-06" "2017-05-06" "2017-05-06"
## [16] "2017-05-07" "2017-05-07" "2017-05-07" "2017-05-07" "2017-05-07"
## [21] "2017-05-07" "2017-05-08" "2017-05-08" "2017-05-08" "2017-05-08"
## [26] "2017-05-09" "2017-05-09" "2017-05-09" "2017-05-09" "2017-05-10"
## [31] "2017-05-10" "2017-05-10" "2017-05-10" "2017-05-10" "2017-05-10"
## [36] "2017-05-11" "2017-05-12" "2017-05-12" "2017-05-12" "2017-05-12"
## [41] "2017-05-12" "2017-05-13" "2017-05-14" "2017-05-14" "2017-05-14"
## [46] "2017-05-17" "2017-05-17" "2017-05-18" "2017-05-18" "2017-05-19"
## [51] "2017-05-19" "2017-05-20" "2017-05-21" "2017-05-23" "2017-05-24"
## [56] "2017-05-24" "2017-05-24" "2017-05-25" "2017-05-25" "2017-05-25"
## [61] "2017-05-25" "2017-05-25" "2017-05-25" "2017-05-26" "2017-05-27"
## [66] "2017-05-27" "2017-05-28" "2017-05-28" "2017-05-29" "2017-05-29"
## [71] "2017-05-29" "2017-05-29" "2017-05-29" "2017-05-29" "2017-05-29"
## [76] "2017-05-29" "2017-05-30" "2017-05-30" "2017-05-30" "2017-05-31"
## [81] "2017-05-31" "2017-05-31"
# JUNIO
junio$FECHA
##  [1] "2017-06-01" "2017-06-01" "2017-06-01" "2017-06-02" "2017-06-02"
##  [6] "2017-06-03" "2017-06-03" "2017-06-03" "2017-06-03" "2017-06-03"
## [11] "2017-06-03" "2017-06-04" "2017-06-04" "2017-06-05" "2017-06-05"
## [16] "2017-06-06" "2017-06-06" "2017-06-06" "2017-06-06" "2017-06-06"
## [21] "2017-06-07" "2017-06-07" "2017-06-08" "2017-06-08" "2017-06-08"
## [26] "2017-06-09" "2017-06-10" "2017-06-10" "2017-06-11" "2017-06-12"
## [31] "2017-06-12" "2017-06-13" "2017-06-13" "2017-06-13" "2017-06-13"
## [36] "2017-06-14" "2017-06-14" "2017-06-14" "2017-06-14" "2017-06-14"
## [41] "2017-06-15" "2017-06-15" "2017-06-15" "2017-06-15" "2017-06-16"
## [46] "2017-06-16" "2017-06-16" "2017-06-16" "2017-06-16" "2017-06-17"
## [51] "2017-06-17" "2017-06-17" "2017-06-18" "2017-06-18" "2017-06-19"
## [56] "2017-06-19" "2017-06-19" "2017-06-19" "2017-06-20" "2017-06-20"
## [61] "2017-06-21" "2017-06-21" "2017-06-21" "2017-06-21" "2017-06-22"
## [66] "2017-06-22" "2017-06-22" "2017-06-23" "2017-06-24" "2017-06-25"
## [71] "2017-06-26" "2017-06-26" "2017-06-26" "2017-06-26" "2017-06-26"
## [76] "2017-06-26" "2017-06-27" "2017-06-28" "2017-06-28" "2017-06-28"
## [81] "2017-06-29" "2017-06-30"
# JULIO
julio$FECHA
##  [1] "2017-07-02" "2017-07-02" "2017-07-02" "2017-07-03" "2017-07-03"
##  [6] "2017-07-04" "2017-07-04" "2017-07-04" "2017-07-04" "2017-07-05"
## [11] "2017-07-05" "2017-07-05" "2017-07-05" "2017-07-05" "2017-07-07"
## [16] "2017-07-08" "2017-07-08" "2017-07-08" "2017-07-09" "2017-07-10"
## [21] "2017-07-10" "2017-07-10" "2017-07-11" "2017-07-11" "2017-07-11"
## [26] "2017-07-11" "2017-07-12" "2017-07-12" "2017-07-13" "2017-07-13"
## [31] "2017-07-13" "2017-07-13" "2017-07-14" "2017-07-14" "2017-07-14"
## [36] "2017-07-14" "2017-07-16" "2017-07-16" "2017-07-16" "2017-07-17"
## [41] "2017-07-17" "2017-07-18" "2017-07-19" "2017-07-20" "2017-07-21"
## [46] "2017-07-21" "2017-07-22" "2017-07-22" "2017-07-22" "2017-07-22"
## [51] "2017-07-23" "2017-07-23" "2017-07-24" "2017-07-24" "2017-07-24"
## [56] "2017-07-24" "2017-07-26" "2017-07-26" "2017-07-26" "2017-07-26"
## [61] "2017-07-27" "2017-07-27" "2017-07-27" "2017-07-28" "2017-07-29"
## [66] "2017-07-29" "2017-07-31" "2017-07-31" "2017-07-31" "2017-07-31"
# AGOSTO
agosto$FECHA
##  [1] "2017-08-01" "2017-08-01" "2017-08-01" "2017-08-01" "2017-08-01"
##  [6] "2017-08-01" "2017-08-01" "2017-08-01" "2017-08-02" "2017-08-02"
## [11] "2017-08-02" "2017-08-04" "2017-08-05" "2017-08-05" "2017-08-08"
## [16] "2017-08-08" "2017-08-10" "2017-08-10" "2017-08-12" "2017-08-12"
## [21] "2017-08-14" "2017-08-14" "2017-08-15" "2017-08-17" "2017-08-18"
## [26] "2017-08-18" "2017-08-20" "2017-08-20" "2017-08-20" "2017-08-21"
## [31] "2017-08-21" "2017-08-22" "2017-08-22" "2017-08-22" "2017-08-22"
## [36] "2017-08-23" "2017-08-24" "2017-08-24" "2017-08-24" "2017-08-26"
## [41] "2017-08-27" "2017-08-28" "2017-08-29" "2017-08-30" "2017-08-31"
## [46] "2017-08-31" "2017-08-31"
# SEPTIEMBRE
septiembre$FECHA
##  [1] "2017-09-01" "2017-09-01" "2017-09-02" "2017-09-02" "2017-09-03"
##  [6] "2017-09-04" "2017-09-04" "2017-09-04" "2017-09-04" "2017-09-05"
## [11] "2017-09-05" "2017-09-05" "2017-09-05" "2017-09-05" "2017-09-05"
## [16] "2017-09-07" "2017-09-07" "2017-09-07" "2017-09-08" "2017-09-09"
## [21] "2017-09-09" "2017-09-10" "2017-09-11" "2017-09-12" "2017-09-12"
## [26] "2017-09-12" "2017-09-13" "2017-09-13" "2017-09-15" "2017-09-15"
## [31] "2017-09-16" "2017-09-16" "2017-09-17" "2017-09-17" "2017-09-17"
## [36] "2017-09-17" "2017-09-17" "2017-09-17" "2017-09-18" "2017-09-18"
## [41] "2017-09-18" "2017-09-18" "2017-09-19" "2017-09-20" "2017-09-20"
## [46] "2017-09-20" "2017-09-21" "2017-09-21" "2017-09-21" "2017-09-21"
## [51] "2017-09-21" "2017-09-22" "2017-09-22" "2017-09-22" "2017-09-22"
## [56] "2017-09-23" "2017-09-23" "2017-09-23" "2017-09-23" "2017-09-23"
## [61] "2017-09-23" "2017-09-23" "2017-09-24" "2017-09-24" "2017-09-24"
## [66] "2017-09-24" "2017-09-24" "2017-09-24" "2017-09-26" "2017-09-26"
## [71] "2017-09-27" "2017-09-27" "2017-09-27" "2017-09-28" "2017-09-28"
## [76] "2017-09-28" "2017-09-29" "2017-09-29" "2017-09-29" "2017-09-29"
## [81] "2017-09-29" "2017-09-29" "2017-09-29" "2017-09-30" "2017-09-30"
# OCTUBRE
octubre$FECHA
##  [1] "2017-10-01" "2017-10-01" "2017-10-01" "2017-10-01" "2017-10-01"
##  [6] "2017-10-02" "2017-10-02" "2017-10-02" "2017-10-02" "2017-10-03"
## [11] "2017-10-03" "2017-10-03" "2017-10-04" "2017-10-05" "2017-10-05"
## [16] "2017-10-05" "2017-10-06" "2017-10-06" "2017-10-07" "2017-10-07"
## [21] "2017-10-07" "2017-10-08" "2017-10-08" "2017-10-09" "2017-10-10"
## [26] "2017-10-10" "2017-10-10" "2017-10-11" "2017-10-11" "2017-10-11"
## [31] "2017-10-12" "2017-10-12" "2017-10-12" "2017-10-12" "2017-10-14"
## [36] "2017-10-14" "2017-10-15" "2017-10-15" "2017-10-15" "2017-10-16"
## [41] "2017-10-16" "2017-10-16" "2017-10-17" "2017-10-17" "2017-10-19"
## [46] "2017-10-19" "2017-10-19" "2017-10-20" "2017-10-20" "2017-10-21"
## [51] "2017-10-21" "2017-10-21" "2017-10-21" "2017-10-22" "2017-10-23"
## [56] "2017-10-23" "2017-10-23" "2017-10-23" "2017-10-24" "2017-10-24"
## [61] "2017-10-24" "2017-10-25" "2017-10-25" "2017-10-25" "2017-10-25"
## [66] "2017-10-25" "2017-10-25" "2017-10-26" "2017-10-26" "2017-10-27"
## [71] "2017-10-27" "2017-10-27" "2017-10-27" "2017-10-27" "2017-10-28"
## [76] "2017-10-28" "2017-10-28" "2017-10-29" "2017-10-29" "2017-10-29"
## [81] "2017-10-29" "2017-10-29" "2017-10-29" "2017-10-29" "2017-10-30"
## [86] "2017-10-30" "2017-10-31" "2017-10-31"
# NOVIEMBRE
noviembre$FECHA
##  [1] "2017-11-01" "2017-11-01" "2017-11-01" "2017-11-02" "2017-11-02"
##  [6] "2017-11-02" "2017-11-04" "2017-11-04" "2017-11-06" "2017-11-06"
## [11] "2017-11-06" "2017-11-07" "2017-11-07" "2017-11-08" "2017-11-08"
## [16] "2017-11-08" "2017-11-08" "2017-11-08" "2017-11-08" "2017-11-09"
## [21] "2017-11-10" "2017-11-10" "2017-11-10" "2017-11-10" "2017-11-11"
## [26] "2017-11-12" "2017-11-12" "2017-11-13" "2017-11-14" "2017-11-16"
## [31] "2017-11-17" "2017-11-17" "2017-11-18" "2017-11-18" "2017-11-18"
## [36] "2017-11-18" "2017-11-19" "2017-11-19" "2017-11-21" "2017-11-21"
## [41] "2017-11-21" "2017-11-22" "2017-11-23" "2017-11-23" "2017-11-23"
## [46] "2017-11-24" "2017-11-24" "2017-11-26" "2017-11-26" "2017-11-27"
## [51] "2017-11-28" "2017-11-29" "2017-11-29" "2017-11-29" "2017-11-29"
## [56] "2017-11-29" "2017-11-29" "2017-11-29" "2017-11-30"
# DICIEMBRE
diciembre$FECHA
##  [1] "2017-12-01" "2017-12-01" "2017-12-02" "2017-12-03" "2017-12-05"
##  [6] "2017-12-07" "2017-12-08" "2017-12-10" "2017-12-10" "2017-12-12"
## [11] "2017-12-13" "2017-12-14" "2017-12-14" "2017-12-14" "2017-12-14"
## [16] "2017-12-14" "2017-12-15" "2017-12-17" "2017-12-18" "2017-12-19"
## [21] "2017-12-19" "2017-12-20" "2017-12-20" "2017-12-20" "2017-12-21"
## [26] "2017-12-21" "2017-12-21" "2017-12-23" "2017-12-23" "2017-12-23"
## [31] "2017-12-26" "2017-12-27" "2017-12-29" "2017-12-30" "2017-12-31"
#LO QUE QUEREMOS ES CUANTOS DE CADlength(enero$FECHA)A MES
#Utilizamos la función length() para ver cuantos registros

length(enero$FECHA)
## [1] 45
length(febrero$FECHA)
## [1] 49
length(marzo$FECHA)
## [1] 60
length(abril$FECHA)
## [1] 54
length(mayo$FECHA)
## [1] 82
length(junio$FECHA)
## [1] 82
length(julio$FECHA)
## [1] 70
length(agosto$FECHA)
## [1] 47
length(septiembre$FECHA)
## [1] 85
length(octubre$FECHA)
## [1] 88
length(noviembre$FECHA)
## [1] 59
length(diciembre$FECHA)
## [1] 35

#Construyendo un data.frame mas elegante

mesesNombres <- c("Enero", "Febrero", "Marzo", "Abril",
                 "Mayo", "Junio", "Julio", "Agosto",
                 "Septiembre", "Octubre", "Noviembre", "Diciembre")
resumen <- data.frame(mesesNombres, c(length(enero$FECHA),
                  length(febrero$FECHA), length(marzo$FECHA),
                    length(abril$FECHA), length(mayo$FECHA),length(junio$FECHA),
length(julio$FECHA),
length(agosto$FECHA),
length(septiembre$FECHA),
length(octubre$FECHA),
length(noviembre$FECHA),
length(diciembre$FECHA)))

resumen
##    mesesNombres
## 1         Enero
## 2       Febrero
## 3         Marzo
## 4         Abril
## 5          Mayo
## 6         Junio
## 7         Julio
## 8        Agosto
## 9    Septiembre
## 10      Octubre
## 11    Noviembre
## 12    Diciembre
##    c.length.enero.FECHA...length.febrero.FECHA...length.marzo.FECHA...
## 1                                                                   45
## 2                                                                   49
## 3                                                                   60
## 4                                                                   54
## 5                                                                   82
## 6                                                                   82
## 7                                                                   70
## 8                                                                   47
## 9                                                                   85
## 10                                                                  88
## 11                                                                  59
## 12                                                                  35

#Poniendo nombres de columnas a resumen y mostrar

colnames(resumen) <- c("Mes", "No.Accidentes")
resumen
##           Mes No.Accidentes
## 1       Enero            45
## 2     Febrero            49
## 3       Marzo            60
## 4       Abril            54
## 5        Mayo            82
## 6       Junio            82
## 7       Julio            70
## 8      Agosto            47
## 9  Septiembre            85
## 10    Octubre            88
## 11  Noviembre            59
## 12  Diciembre            35

Vamos a visualizar graficamente los datos

Utilizamos plot

plot(resumen, type="b")

Grafica a barras

#barplot(resumen$No.Accidentes, main = "Accidentes por mes", xlab = "Meses", ylab = "Accidentes", legend.text = mesesNombres, ) 
barplot(resumen$No.Accidentes, 
        main = "Accidentes por mes", 
        xlab = "Meses", 
        ylab = "Accidentes", 
        legend.text = mesesNombres, 
       col = c(1:12), 
        names.arg = mesesNombres,

)

Los datos de Accidentes 2017 nos muestran que los meses que tienen un indice mayor a 80 accidentes por mes son Mayo, Junio, Septiembre y Octubre:

Mayo 82

Junio 82

Septiembre 85

Octubre 88

Y el mes con menor número de accidentes es:

Diciembre