The number of Fatalities
library(sqldf)
# Fatalities summed per event type, restricted to FYEARS 1990 through 2010.
sumOfFatalities <- sqldf(
  x = "select EVTYPE, sum(FATALITIES) as sumF from mainFullDF where FYEARS >= '1990' and FYEARS < '2011' group by EVTYPE"
)
# Grand total over all event types (column 2 holds the per-type sums).
print(
  paste0(
    "The number of Fatalities between 1990 and 2010 was ",
    sum(sumOfFatalities[[2]])
  )
)
## [1] "The number of Fatalities between 1990 and 2010 was 10085"
# Same aggregation, keeping only the ten event types with the largest sums.
sumOfFatalitiesTop10 <- sqldf(
  x = "select EVTYPE, sum(FATALITIES) as sumF from mainFullDF where FYEARS >= '1990' and FYEARS < '2011' group by EVTYPE order by sumF desc limit 10"
)
print(sumOfFatalitiesTop10)
## EVTYPE sumF
## 1 EXCESSIVE HEAT 1867
## 2 TORNADO 1165
## 3 FLASH FLOOD 910
## 4 HEAT 874
## 5 LIGHTNING 790
## 6 FLOOD 412
## 7 RIP CURRENT 339
## 8 TSTM WIND 327
## 9 HIGH WIND 244
## 10 AVALANCHE 215
library(easyGgplot2)
# Bar chart of the top-10 fatalities table: event type on x, sumF on y,
# with EVTYPE also used as the grouping variable.
ggplot2.barplot(
  data = sumOfFatalitiesTop10,
  xName = "EVTYPE",
  yName = "sumF",
  groupName = "EVTYPE"
)

The number of Injuries
library(sqldf)
# Injuries summed per event type, restricted to FYEARS 1990 through 2010.
sumOfInjuries <- sqldf(
  x = "select EVTYPE, sum(INJURIES) as SumI from mainFullDF where FYEARS >= '1990' and FYEARS < '2011' group by EVTYPE"
)
# Grand total over all event types (column 2 holds the per-type sums).
print(
  paste0(
    "The number of Injuries between 1990 and 2010 was ",
    sum(sumOfInjuries[[2]])
  )
)
## [1] "The number of Injuries between 1990 and 2010 was 65907"
# Same aggregation, keeping only the ten event types with the largest sums.
sumOfInjuriesTop10 <- sqldf(
  x = "select EVTYPE, sum(INJURIES) as SumI from mainFullDF where FYEARS >= '1990' and FYEARS < '2011' group by EVTYPE order by SumI desc limit 10"
)
print(sumOfInjuriesTop10)
## EVTYPE SumI
## 1 TORNADO 20511
## 2 FLOOD 6779
## 3 EXCESSIVE HEAT 6387
## 4 LIGHTNING 5036
## 5 TSTM WIND 5022
## 6 ICE STORM 1975
## 7 FLASH FLOOD 1747
## 8 HEAT 1489
## 9 WINTER STORM 1321
## 10 HURRICANE/TYPHOON 1275
library(easyGgplot2)
# Bar chart of the top-10 injuries table: event type on x, SumI on y,
# with EVTYPE also used as the grouping variable.
ggplot2.barplot(
  data = sumOfInjuriesTop10,
  xName = "EVTYPE",
  yName = "SumI",
  groupName = "EVTYPE"
)

Subset Property/Crop Damage Estimate Values
# Adds the numeric column FPROPDMG to the global data frame `mainFullDF`:
# the property damage amount, i.e. PROPDMG scaled by the power of ten that
# PROPDMGEXP encodes (FPROPDMG = PROPDMG * 10^exponent).
#
# Magnitude codes are matched case-insensitively: H -> 2, K -> 3, M -> 6,
# B -> 9. A single digit 0-9 is used as the exponent itself. Missing, empty
# or unrecognised codes fall back to exponent 0, so PROPDMG is kept as is.
#
# Takes no arguments. Side effects: attaches dplyr and overwrites
# `mainFullDF` in the enclosing (global) environment. Returns the updated
# data frame invisibly (value of the `<<-` assignment).
mutatePropDMG <- function(){
  library(dplyr)

  # Translate a vector of magnitude codes into numeric exponents.
  propExponent <- function(expCode) {
    # as.character() makes this safe for factor columns, which would otherwise
    # leak their integer level codes into the result.
    code <- toupper(trimws(as.character(expCode)))
    exponent <- c(H = 2, K = 3, M = 6, B = 9)[code]  # NA for anything else
    isDigit <- !is.na(code) & grepl("^[0-9]$", code)
    exponent[isDigit] <- as.numeric(code[isDigit])
    exponent[is.na(exponent)] <- 0
    unname(exponent)
  }

  mainFullDF <<- mainFullDF %>%
    mutate(FPROPDMG = PROPDMG * 10^propExponent(PROPDMGEXP))
}
# Adds the numeric column FCROPDMG to the global data frame `mainFullDF`:
# the crop damage amount, i.e. CROPDMG scaled by the power of ten that
# CROPDMGEXP encodes (FCROPDMG = CROPDMG * 10^exponent).
#
# Magnitude codes are matched case-insensitively: H -> 2, K -> 3, M -> 6,
# B -> 9. A single digit 0-9 is used as the exponent itself. Missing, empty
# or unrecognised codes fall back to exponent 0, so CROPDMG is kept as is.
#
# Takes no arguments. Side effects: attaches dplyr and overwrites
# `mainFullDF` in the enclosing (global) environment. Returns the updated
# data frame invisibly (value of the `<<-` assignment).
mutateCropDMG <- function(){
  library(dplyr)

  # Translate a vector of magnitude codes into numeric exponents.
  cropExponent <- function(expCode) {
    # as.character() makes this safe for factor columns, which would otherwise
    # leak their integer level codes into the result.
    code <- toupper(trimws(as.character(expCode)))
    exponent <- c(H = 2, K = 3, M = 6, B = 9)[code]  # NA for anything else
    isDigit <- !is.na(code) & grepl("^[0-9]$", code)
    exponent[isDigit] <- as.numeric(code[isDigit])
    exponent[is.na(exponent)] <- 0
    unname(exponent)
  }

  mainFullDF <<- mainFullDF %>%
    mutate(FCROPDMG = CROPDMG * 10^cropExponent(CROPDMGEXP))
}
# Add the derived FPROPDMG column to mainFullDF. This call attaches dplyr
# (library(dplyr) inside the function), which produces the messages echoed
# below.
mutatePropDMG()
##
## Attaching package: 'dplyr'
##
## The following object is masked from 'package:stats':
##
## filter
##
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
# Add the derived FCROPDMG column, then list the column names to confirm that
# both new columns are present.
mutateCropDMG()
names(mainFullDF)
## [1] "STATE__" "BGN_DATE" "BGN_TIME" "TIME_ZONE" "COUNTY"
## [6] "COUNTYNAME" "STATE" "EVTYPE" "BGN_RANGE" "BGN_AZI"
## [11] "BGN_LOCATI" "END_DATE" "END_TIME" "COUNTY_END" "COUNTYENDN"
## [16] "END_RANGE" "END_AZI" "END_LOCATI" "LENGTH" "WIDTH"
## [21] "F" "MAG" "FATALITIES" "INJURIES" "PROPDMG"
## [26] "PROPDMGEXP" "CROPDMG" "CROPDMGEXP" "WFO" "STATEOFFIC"
## [31] "ZONENAMES" "LATITUDE" "LONGITUDE" "LATITUDE_E" "LONGITUDE_"
## [36] "REMARKS" "REFNUM" "FYEARS" "FPROPDMG" "FCROPDMG"
library(sqldf)
# Total FPROPDMG per event type over all rows of mainFullDF, keeping the ten
# event types with the largest totals.
sumOfMostdemagepropsTop10 <- sqldf(
  x = "select EVTYPE, sum(FPROPDMG) as sumProp from mainFullDF group by EVTYPE order by sumProp desc limit 10"
)
print(sumOfMostdemagepropsTop10)
## EVTYPE sumProp
## 1 HAIL 225321
## 2 TSTM WIND 190148
## 3 THUNDERSTORM WIND 181430
## 4 FLASH FLOOD 92426
## 5 TORNADO 62025
## 6 FLOOD 45224
## 7 THUNDERSTORM WINDS 36902
## 8 HIGH WIND 36867
## 9 LIGHTNING 31136
## 10 WINTER STORM 19427
library(easyGgplot2)
# Bar chart of the top-10 property table: event type on x, sumProp on y,
# with EVTYPE also used as the grouping variable.
ggplot2.barplot(
  data = sumOfMostdemagepropsTop10,
  xName = "EVTYPE",
  yName = "sumProp",
  groupName = "EVTYPE"
)

library(sqldf)
# Total FCROPDMG per event type over all rows of mainFullDF, keeping the ten
# event types with the largest totals.
sumOfMostdemageCropsTop10 <- sqldf(
  x = "select EVTYPE, sum(FCROPDMG) as sumCrop from mainFullDF group by EVTYPE order by sumCrop desc limit 10"
)
print(sumOfMostdemageCropsTop10)
## EVTYPE sumCrop
## 1 HAIL 195315
## 2 THUNDERSTORM WIND 179382
## 3 FLASH FLOOD 54879
## 4 FLOOD 30951
## 5 HIGH WIND 28236
## 6 TORNADO 22449
## 7 TSTM WIND 20226
## 8 WINTER STORM 16644
## 9 WINTER WEATHER 16230
## 10 HEAVY SNOW 15282
library(easyGgplot2)
# Bar chart of the top-10 crop table: event type on x, sumCrop on y,
# with EVTYPE also used as the grouping variable.
ggplot2.barplot(
  data = sumOfMostdemageCropsTop10,
  xName = "EVTYPE",
  yName = "sumCrop",
  groupName = "EVTYPE"
)
