library(dplyr)
##
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
##
## filter, lag
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
library(nycflights13)
library(tidyr)
# Flights whose arrival delay is at least 120 (two hours if arr_delay is in
# minutes, as the nycflights13 docs state).
vuelos <- flights %>%
  filter(arr_delay >= 120)
vuelos
# Flights whose destination airport code is IAH or HOU.
viajeHou <- flights %>%
  filter(dest %in% c("IAH", "HOU"))
viajeHou
# Flights operated by one of the carriers AA, UA or DL.
operadospor <- flights %>%
  filter(carrier %in% c("AA", "UA", "DL"))
operadospor
# Flights that departed in months 7, 8 or 9 (the "summer" of the variable name).
vuelos_en_verano <- flights %>%
  filter(month %in% 7:9)
vuelos_en_verano
# Flights that did not leave late (dep_delay <= 0) but still arrived with an
# arrival delay of at least 120.
vuelos_llego_tarde <- flights %>%
  filter(dep_delay <= 0 & arr_delay >= 120)
vuelos_llego_tarde
# Flights that left at least 60 late and recovered more than 30 of that delay
# in the air (departure delay minus arrival delay exceeds 30).
vuelos_retrasados <- flights %>%
  filter(dep_delay >= 60, dep_delay - arr_delay > 30)
vuelos_retrasados
# Flights whose dep_time is at most 600 or exactly 2400 (the value this
# script treats as midnight).
salida_vuelos <- flights %>%
  filter(dep_time <= 600 | dep_time == 2400)
salida_vuelos
# Sort flights so that rows with a missing dep_delay come first.
# arrange() always places NA at the end, even inside desc(), so the primary
# sort key is is.na(dep_delay) in descending order (TRUE before FALSE).
# The remaining rows keep the descending dep_delay order.
valores_faltantes <- arrange(
  flights,
  desc(is.na(dep_delay)),
  desc(dep_delay)
)
valores_faltantes
# Sort flights from fastest to slowest.
# Speed is distance / air_time * 60; desc() is required because arrange()
# sorts ascending by default, which would list the slowest flights first.
# Rows with a missing air_time still end up last.
vuelos_mas_rapidos <- arrange(flights, desc(distance / air_time * 60))
vuelos_mas_rapidos
# Keep only the departure/arrival time and delay columns, renaming each one
# to a Spanish label in the same select() call.
seleccion <- flights %>%
  select(
    salida = dep_time,
    llegada = arr_time,
    retrasos_salida = dep_delay,
    retraso_llegada = arr_delay
  )
seleccion
# Answer: select() shows a variable's contents only once, even when its name
# is repeated in the call.
prueba <- select(flights, dest, dest, dest)
prueba
# Convert the clock-style departure times into minutes since midnight.
# The times are treated as HHMM integers: %/% 100 yields the hours and
# %% 100 the minutes. A day has 1440 minutes, so %% 1440 maps 2400 to 0.
cant_minutos <- mutate(
  flights,
  salida = (dep_time %/% 100 * 60 + dep_time %% 100) %% 1440,
  sal_programada =
    (sched_dep_time %/% 100 * 60 + sched_dep_time %% 100) %% 1440
)
# Show each original column next to its converted counterpart.
select(cant_minutos, sched_dep_time, sal_programada, dep_time, salida)
# Find the aircraft (tailnum) with the highest mean arrival delay.
# peor_record itself stays a copy of flights; the ranking below is only
# printed, not stored.
peor_record <- flights
peor_record %>%
  group_by(tailnum) %>%
  # na.rm = TRUE: without it a single missing arr_delay makes the whole mean
  # NA, and filter() then silently drops that plane from the ranking.
  summarise(peor_tiempo = mean(arr_delay, na.rm = TRUE)) %>%
  # Keep the row(s) ranked first when sorted by descending mean delay.
  filter(min_rank(desc(peor_tiempo)) <= 1)