#Variable cuantitativa y cualitativa

## Variables cualitativas: categoricas; se dividen en dos: ordinales y nominales

# Variables cuantitativas: se expresan numericamente; se dividen en discretas y continuas

library(dplyr)
## 
## Adjuntando el paquete: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(dslabs)
library(viridisLite)

#Dataset

data("murders")

#Graficos

##Diagrama de barras

# Bar chart of the number of states per region.

# Inspect the region categories.
# Expected output: "Northeast" "South" "North Central" "West"
levels(murders$region)

# Frequency table: number of rows (states) per region.
tabla <- table(murders$region)

# barplot() returns the x coordinate of each bar's midpoint; keep it so the
# count labels can be placed explicitly instead of piping the plot into text().
bar_midpoints <- barplot(
  tabla,
  main = "Grafico de barras",
  ylab = "Frecuencia",
  xlab = "Regiones",
  ylim = c(0, 20),
  col = "red"
)

# Write each count just above its bar (pos = 3 places the text above the point).
text(
  x = bar_midpoints,
  y = tabla,
  labels = tabla,
  pos = 3,
  cex = 0.8,
  col = "blue"
)

# Only open the help page when running interactively, so that sourcing or
# knitting the script does not start the help server.
if (interactive()) {
  help("barplot")
}

#Diagrama de torta

# Pie chart of the number of states per region, labelled with percentages.

# Share of each region in percent, rounded to two decimals.
porcentajes <- round(tabla * 100 / sum(tabla), 2)

# One label per slice: region name followed by its percentage. The names come
# from the frequency table (one per region), not from murders$region (one per
# state), so labels and percentages line up one-to-one.
etiquetas <- paste0(names(tabla), " (", porcentajes, ")")

# `col` takes the palette function and the number of colours wanted; use one
# colour per slice.
slice_colors <- viridis(length(tabla))

pie(
  tabla,
  labels = etiquetas,
  col = slice_colors,
  main = "Diagrama circular",
  border = slice_colors
)
legend("topright", legend = names(tabla), cex = 0.75, fill = slice_colors)

#crear tabla de porcentajes y graficar mostrando el dato

# A specific bar order is required: rebuild the factor with explicit levels so
# that table() and barplot() follow that order.
region <- factor(
  murders$region,
  levels = c("South", "West", "North Central", "Northeast")
)
tabla1 <- table(region)
barplot(tabla1)

#Histograma

# Add the murder rate per 100,000 inhabitants as a new column. The data frame
# is supplied once, through the pipe.
murders <- murders %>%
  mutate(rate = total / population * 100000)

# Histogram of the murder rate with fixed axis limits.
hist(
  murders$rate,
  main = "Histograma tasa de asesinatos",
  ylab = "Frecuencia",
  xlab = "Tasa de asesinatos",
  xlim = c(0, 20),
  ylim = c(0, 25),
  col = rocket(4)
)

#Grafico de cajas

# Box plot of the murder rate; outliers are hidden and the y axis is limited
# to 0-6.
mean_rate <- mean(murders$rate)

boxplot(
  murders$rate,
  col = "Blue",
  ylab = "Tasa de asesinatos",
  outline = FALSE,
  main = "Boxplot",
  ylim = c(0, 6)
)

# Mark the mean on the box (a single box is drawn at x = 1) and print its
# rounded value next to it.
points(x = 1, y = mean_rate, col = "black", pch = 20)
text(x = 1.1, y = 2.3, labels = paste(" ", round(mean_rate, 2)))

#comparacion variables cuantitativas y cualitativas

#diagrama de dispersion total vs poblacion

# Scatter plot of total murders against population, coloured by region.

# Population in millions (x) and total number of murders (y).
x <- murders$population / 10^6
y <- murders$total

# One palette index per region level. The same vector drives the point colours
# and the legend, so each legend entry shows the colour actually used for that
# region. unique(murders$region) would list regions in order of appearance,
# which differs from the order returned by levels().
region_levels <- levels(murders$region)
region_colors <- seq_along(region_levels)

plot(
  x,
  y,
  main = "Total vs Population",
  col = region_colors[murders$region],
  pch = 20,
  xlab = "Population/10^6",
  ylab = "Total"
)
legend("bottomright", legend = region_levels, fill = region_colors)

#boxplot rate vs region
# Box plot of the murder rate for each region, with the overall mean rate
# drawn as a horizontal reference line and printed as text.
mean_rate <- mean(murders$rate)

boxplot(
  rate ~ region,
  data = murders,
  col = rocket(4),
  outline = FALSE,
  ylim = c(0, 6)
)
abline(h = mean_rate, col = "red", lwd = 2)
text(x = 0.5, y = 3, labels = paste("", round(mean_rate, 2)), col = "green")

#varios graficos

# Two plots side by side: scatter plot (left) and box plot by region (right).
# `x` and `y` are the population (in millions) and total-murder vectors
# created earlier in the script.

# Switch to a 1 x 2 layout and keep the previous settings so they can be
# restored once both panels are drawn.
old_par <- par(mfrow = c(1, 2))

# Left panel: one palette index per region level, shared by the points and the
# legend so each legend entry shows the colour actually used for that region.
region_levels <- levels(murders$region)
region_colors <- seq_along(region_levels)

plot(
  x,
  y,
  main = "Total vs Population",
  col = region_colors[murders$region],
  pch = 20,
  xlab = "Population/10^6",
  ylab = "Total"
)
legend("bottomright", legend = region_levels, fill = region_colors)

# Right panel: murder rate by region with the overall mean as a reference line.
mean_rate <- mean(murders$rate)

boxplot(
  rate ~ region,
  data = murders,
  col = rocket(4),
  outline = FALSE,
  ylim = c(0, 6)
)
abline(h = mean_rate, col = "red", lwd = 2)
text(x = 0.7, y = 3, labels = paste("", round(mean_rate, 2)), col = "green")

# Restore the layout that was active before this figure.
par(old_par)