This project will showcase how R can perform statistical analysis to gain information from data.
data <- read.csv(file="http://latul.be/mbaa_531/data/tornado.csv",header = TRUE)
index1<- data$st== "WA" | data$st== "MS"
print(paste("Tronadoes recoreded in the WA or MS =",
sum(index1)))
## [1] "Tronadoes recoreded in the WA or MS = 530"
index2<-data$st== "WA"|data$yr>2012
print(paste("Tronadoes recoreded in WA After 2012 =",
sum(index2)))
## [1] "Tronadoes recoreded in WA After 2012 = 3070"
data <- read.csv(file ="http://latul.be/mbaa_531/data/tornado.csv",header = TRUE)
index <- data$st =="WA" & data$yr==2012|data$st =="WA"& data$yr==2013|data$st =="WA"& data$yr==2014
data[index,c("yr","mo","dy","date","time","tz","st","stf","f")]
index1<-data$st =="HI"
data[index1,c("st","mo","yr","f")]
meta <- read.csv(file ="http://latul.be/mbaa_531/data/tornado.csv",header = TRUE)
ordertype<- order(data$date,data$time)
head(meta[ordertype,])
for (x in 1:12) {
month<-data$mo == x
print(paste("month=",x,"Tornadoes=",sum(month)))
}
## [1] "month= 1 Tornadoes= 355"
## [1] "month= 2 Tornadoes= 463"
## [1] "month= 3 Tornadoes= 751"
## [1] "month= 4 Tornadoes= 2171"
## [1] "month= 5 Tornadoes= 2500"
## [1] "month= 6 Tornadoes= 1899"
## [1] "month= 7 Tornadoes= 861"
## [1] "month= 8 Tornadoes= 517"
## [1] "month= 9 Tornadoes= 401"
## [1] "month= 10 Tornadoes= 525"
## [1] "month= 11 Tornadoes= 350"
## [1] "month= 12 Tornadoes= 348"
airlineData <- read.csv(file = "http://latul.be/mbaa_531/data/airline.csv", header = TRUE)
col <- c("UniqueCarrier", "FlightNum", "Origin")
row <- airlineData$DepTime > 2200 & airlineData$Dest == "BNA"
print(airlineData[row,col])
## UniqueCarrier FlightNum Origin
## NA <NA> NA <NA>
## 7021 OH 5421 CVG
## NA.1 <NA> NA <NA>
## 17401 AA 2435 ORD
## 19478 DH 7332 ORD
col2 <- c("UniqueCarrier", "FlightNum", "Origin", "DepTime", "Dest")
#row2 <- (airlineData$DepTime > 2200 & airlineData$Origin == "BNA" ) | (airlineData$DepTime > 2200 & airlineData$Dest == "MEM")
row2 <- (airlineData$DepTime > 2200) & (airlineData$Origin == "BNA" | airlineData$Dest == "MEM")
airlineData[row2,col2]
col3 <- c("UniqueCarrier", "FlightNum", "Origin", "ArrDelay")
row3 <- airlineData$ArrDelay > 2
head(airlineData[row3,col3], n=20)
col4 <- c("UniqueCarrier", "FlightNum", "Origin", "ArrDelay", "DepDelay")
row4 <- airlineData$ArrDelay > 2 & airlineData$DepDelay <= 0
head(airlineData[row4,col4], n=20)
col <- c("UniqueCarrier", "FlightNum", "Origin", "DepDelay")
order <- order(-airlineData$DepDelay)
head(airlineData[order,col], n=5)
col <- c("UniqueCarrier", "FlightNum", "Origin", "DepDelay")
order <- order(airlineData$DepDelay)
head(airlineData[order,col], n=5)
col <- c("UniqueCarrier", "FlightNum", "Origin", "Dest", "ArrDelay")
order <- order(airlineData$Dest,-airlineData$ArrDelay)
head(airlineData[order,col], n=30)