#VARIABLES CUALITATIVAS

VARIABLES CATEGORICAS Y SE DIVIDEN EN DOS: ORDINALES (tienen orden) Y NOMINALES (no tienen orden)

##variables cuantitativas

expresar numericamente y se dividen en dos: discretas y continuas

library(dplyr)
## 
## Adjuntando el paquete: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(dslabs)
library(viridisLite)

#dataset

data("muders")
## Warning in data("muders"): data set 'muders' not found

#Graficos

#Diagramas de barras

levels(murders$region)
## [1] "Northeast"     "South"         "North Central" "West"
tabla <- table(murders$region)
tabla
## 
##     Northeast         South North Central          West 
##             9            17            12            13
miGraficoBarras <-barplot(tabla, main="Grafico de barras",
                          ylab = "Frecuencia",
                          xlab = "Region",
                          ylim = c(0,20),
                          col = "red"
                          )
#Usamos la funcion text para agregar las etiquetas de datos de cada barra
text(x = miGraficoBarras, y = tabla, labels = tabla, pos = 3, cex = 1.0, col = "black")

#Calculamos los porcentajes
porcentajes <- round(tabla/sum(tabla)*100,2)
#Creamos las etiquetas con el porcentaje
etiquetas <- paste(porcentajes, "%")
#Creo mi grafico
pie(tabla,
    labels = etiquetas,
    col = rainbow(4),
    main="Diagrama de torta"
)
legend("topleft",
       legend = names(tabla),fill = rainbow(4))

#Histograma

#Creamos nuestro dataset con la base de datos murders agregando el campo rate (tasa de asesinatos)
dsMurders <- murders %>%
              mutate(murders,rate = total/population*100000)
#Verifico mi dataset para ver si se agrego la columna rate
dsMurders
##                   state abb        region population total       rate
## 1               Alabama  AL         South    4779736   135  2.8244238
## 2                Alaska  AK          West     710231    19  2.6751860
## 3               Arizona  AZ          West    6392017   232  3.6295273
## 4              Arkansas  AR         South    2915918    93  3.1893901
## 5            California  CA          West   37253956  1257  3.3741383
## 6              Colorado  CO          West    5029196    65  1.2924531
## 7           Connecticut  CT     Northeast    3574097    97  2.7139722
## 8              Delaware  DE         South     897934    38  4.2319369
## 9  District of Columbia  DC         South     601723    99 16.4527532
## 10              Florida  FL         South   19687653   669  3.3980688
## 11              Georgia  GA         South    9920000   376  3.7903226
## 12               Hawaii  HI          West    1360301     7  0.5145920
## 13                Idaho  ID          West    1567582    12  0.7655102
## 14             Illinois  IL North Central   12830632   364  2.8369608
## 15              Indiana  IN North Central    6483802   142  2.1900730
## 16                 Iowa  IA North Central    3046355    21  0.6893484
## 17               Kansas  KS North Central    2853118    63  2.2081106
## 18             Kentucky  KY         South    4339367   116  2.6732010
## 19            Louisiana  LA         South    4533372   351  7.7425810
## 20                Maine  ME     Northeast    1328361    11  0.8280881
## 21             Maryland  MD         South    5773552   293  5.0748655
## 22        Massachusetts  MA     Northeast    6547629   118  1.8021791
## 23             Michigan  MI North Central    9883640   413  4.1786225
## 24            Minnesota  MN North Central    5303925    53  0.9992600
## 25          Mississippi  MS         South    2967297   120  4.0440846
## 26             Missouri  MO North Central    5988927   321  5.3598917
## 27              Montana  MT          West     989415    12  1.2128379
## 28             Nebraska  NE North Central    1826341    32  1.7521372
## 29               Nevada  NV          West    2700551    84  3.1104763
## 30        New Hampshire  NH     Northeast    1316470     5  0.3798036
## 31           New Jersey  NJ     Northeast    8791894   246  2.7980319
## 32           New Mexico  NM          West    2059179    67  3.2537239
## 33             New York  NY     Northeast   19378102   517  2.6679599
## 34       North Carolina  NC         South    9535483   286  2.9993237
## 35         North Dakota  ND North Central     672591     4  0.5947151
## 36                 Ohio  OH North Central   11536504   310  2.6871225
## 37             Oklahoma  OK         South    3751351   111  2.9589340
## 38               Oregon  OR          West    3831074    36  0.9396843
## 39         Pennsylvania  PA     Northeast   12702379   457  3.5977513
## 40         Rhode Island  RI     Northeast    1052567    16  1.5200933
## 41       South Carolina  SC         South    4625364   207  4.4753235
## 42         South Dakota  SD North Central     814180     8  0.9825837
## 43            Tennessee  TN         South    6346105   219  3.4509357
## 44                Texas  TX         South   25145561   805  3.2013603
## 45                 Utah  UT          West    2763885    22  0.7959810
## 46              Vermont  VT     Northeast     625741     2  0.3196211
## 47             Virginia  VA         South    8001024   250  3.1246001
## 48           Washington  WA          West    6724540    93  1.3829942
## 49        West Virginia  WV         South    1852994    27  1.4571013
## 50            Wisconsin  WI North Central    5686986    97  1.7056487
## 51              Wyoming  WY          West     563626     5  0.8871131
#Creamos el grafico de tipo histograma usando la funcion hist y definimos cada una de sus caracteristicas
miHistograma <- hist(dsMurders$rate,
                     main="Histograma de asesinatos por arma de fuego",
                     labels = TRUE,
                     xlab = "Tasa",
                     ylim = c(0,30),
                     xlim = c(0,20),
                     col = "green"
                     )
#Usamos la funcion axis para modificar el tamaño de los intervalos que se muestran en el eje x
axis(1,at=seq(0,20,by=1))

#Boxplot

boxplot(dsMurders$rate, col="Gray",ylab="Tasa de asesinatos",outline=FALSE,main="Boxplot",ylim=c(0,6))
#Adicionar la media
points(mean(dsMurders$rate),col="black",pch=20)
text(paste(" ", round(min(dsMurders$rate), 2)," min"),x=1.3,y=0.3)
text(paste(" ", round(quantile(dsMurders$rate,0.25),2)," Q1"),x=1.3,y=1.3)
text(paste(" ", round(median(dsMurders$rate), 2)," mediana"),x=1.3,y=2.3) 
text(paste(" ", round(mean(dsMurders$rate), 2)," media"),x=1.3,y=2.6)
text(paste(" ", round(quantile(dsMurders$rate,0.75),2)," Q2"),x=1.3,y=3.3)
text(paste(" ", round(max(dsMurders$rate), 2)," max"),x=1.3,y=5.3)

summary(dsMurders$rate)
##    Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
##  0.3196  1.2526  2.6871  2.7791  3.3861 16.4528
#haga el grafico
#Use la paleta de colores