# data.table cheat sheet: https://www.datacamp.com/community/tutorials/data-table-cheat-sheet
# The two CSV files used in this training can be found here: https://github.com/rlkirkham/data-table-training
library(data.table)
# Load the movie data set; header = TRUE treats the first row as column names.
moviedata <- fread("H:/MOVIEDATA.csv", header = TRUE)
# Inspect the column names and types that fread() detected.
str(moviedata)

### I operation ###
# General form is DT[i, j, by]; `i` selects rows.
# Rows whose GENRE is either "Action" or "Drama".
moviedata[GENRE == "Action" | GENRE == "Drama"]
# Same idea for a set of values: %in% against a character vector.
moviedata[GENRE %in% c("Action", "Adventure", "Romance")]

### J operation ###
# `j` computes on (or selects) columns.
# Sum of OVERALL over the Action rows only.
moviedata[GENRE == "Action", sum(OVERALL)]
# .() is an alias for list(): select the two columns as a data.table.
moviedata[, .(GENRE, OVERALL)]

### By operation - need to have either an I or J operation with a by operation ###
# Sum of OVERALL within each GENRE.
moviedata[, sum(OVERALL), by = GENRE]
# Group by more than one column by wrapping them in .().
moviedata[, sum(OVERALL), by = .(GENRE, GENRE2)]

# i, j and by combined: filter to Action, then sum OVERALL (ignoring NAs)
# within each DECADE.
moviedata[GENRE == "Action", sum(OVERALL, na.rm = TRUE), by = DECADE]

# .SD is the subset of data for each group; this applies mean() to every
# non-grouping column.
# NOTE(review): any non-numeric column (GENRE2 presumably is one) makes mean()
# return NA with a warning -- confirm this is intended for the demo.
moviedata[, lapply(.SD, mean), by = GENRE]

# Sort the table by GENRE and mark it as the key (done by reference).
setkey(moviedata, GENRE)

# .SDcols restricts .SD to the named columns before applying mean().
moviedata[
  ,
  lapply(.SD, mean),
  by = GENRE,
  .SDcols = c("PLOT", "CHARACTER", "SOUND")
]

# Chaining: the first [] keeps PLOT and CHARACTER (plus GENRE) for rows with
# SCORE > 40; the second [] takes the maximum PLOT of that result.
moviedata[
  SCORE > 40,
  .SD,
  by = GENRE,
  .SDcols = c("PLOT", "CHARACTER")
][, max(PLOT)]
# Load the flights data set; header = TRUE treats the first row as column names.
flights <- fread("H:/data.table training/flights14.csv", header = TRUE)

# Sort by year, dep_time and tailnum and mark those columns as the key.
setkey(flights, year, dep_time, tailnum)

# Row filter on a non-key column: all rows where carrier is "UA".
flights[carrier == "UA"]

# .N is the number of rows in each group: row count per carrier.
flights[, .N, by = carrier]
# Mean arr_delay per carrier; the unnamed result column is called V1.
flights[, mean(arr_delay), by = carrier]

# Store the per-carrier mean, then rename the default V1 column by reference.
averagedelay <- flights[, mean(arr_delay), by = carrier]
setnames(averagedelay, "V1", "Mean_delay")

# := adds the total_delay column to flights by reference (no copy is made).
flights[, "total_delay" := arr_delay + dep_delay]

# Re-key on carrier so rows can be looked up directly by key value.
setkey(flights, carrier)
# Keyed subset: equivalent to filtering carrier == "UA".
flights["UA"]