## Leer datasets
##Archivos .csv txt tsv 

library(readr)

#read.csv()  #Archivos.csv "separados por comas"
#read.table() #Archivos. txt "separado por espacios"
#read.csv2()  #Archivos que estan separados por ;
#read_tsv()   # cuando los archivos estan dilimitados por el TAB

# Archivo excel
#install.packages("readxl")
library(readxl)
#read_excel()
#read_xls()
#read_xlsx()

url <- "https://raw.githubusercontent.com/rafalab/dslabs/master/inst/extdata/murders.csv"
murders <- read.csv(url)
download.file(url,"murders.csv")

# resumen 
library(dplyr)
## 
## Adjuntando el paquete: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(dslabs)
## 
## Adjuntando el paquete: 'dslabs'
## The following object is masked _by_ '.GlobalEnv':
## 
##     murders
data("heights")

# Calcular el promedio y la desviacion estandar por genero 

sm<-heights %>% filter(sex=="Male") %>%
  summarise(mean=mean(height), sd=sd(height))

## Interpretar los resultados
sm$mean
## [1] 69.31475
sm$sd
## [1] 3.611024
sf<-heights %>% filter(sex=="Female") %>%
  summarise(mean=mean(height), sd=sd(height))

data("murders")

head(murders)
##        state abb region population total
## 1    Alabama  AL  South    4779736   135
## 2     Alaska  AK   West     710231    19
## 3    Arizona  AZ   West    6392017   232
## 4   Arkansas  AR  South    2915918    93
## 5 California  CA   West   37253956  1257
## 6   Colorado  CO   West    5029196    65
max_total<- murders$state[which.max(murders$total)]

max_total2<- murders$state[which.max(murders$population)]

murders<- murders %>% mutate(rate=total*100000/population)

head(murders) 
##        state abb region population total     rate
## 1    Alabama  AL  South    4779736   135 2.824424
## 2     Alaska  AK   West     710231    19 2.675186
## 3    Arizona  AZ   West    6392017   232 3.629527
## 4   Arkansas  AR  South    2915918    93 3.189390
## 5 California  CA   West   37253956  1257 3.374138
## 6   Colorado  CO   West    5029196    65 1.292453
meanrate<- murders %>% select(rate) %>% summarise(mean(rate))
meanrate
##   mean(rate)
## 1   2.779125
murders<- murders%>%mutate(dif=meanrate$`mean(rate)`-rate)
head(murders)
##        state abb region population total     rate         dif
## 1    Alabama  AL  South    4779736   135 2.824424 -0.04529833
## 2     Alaska  AK   West     710231    19 2.675186  0.10393949
## 3    Arizona  AZ   West    6392017   232 3.629527 -0.85040182
## 4   Arkansas  AR  South    2915918    93 3.189390 -0.41026465
## 5 California  CA   West   37253956  1257 3.374138 -0.59501286
## 6   Colorado  CO   West    5029196    65 1.292453  1.48667234
quantile(murders$rate,c(0.5,0,1))
##        50%         0%       100% 
##  2.6871225  0.3196211 16.4527532