library(dplyr)
library(ggplot2)
# Load data ----
# Both inputs are read from the current working directory.
NEI <- readRDS("summarySCC_PM25.rds")
SCC <- readRDS("Source_Classification_Code.rds")

# Join tables ----
# Attach the source-classification columns to every emission record via the
# shared "SCC" key. merge() defaults to an inner join on that key.
# as_tibble() replaces the deprecated tbl_df() wrapper.
FULL <- as_tibble(merge(NEI, SCC, by = "SCC"))
# Total PM2.5 emissions per year ----
# Sum the Emissions column of NEI within each year.
year_sum <- NEI %>%
  group_by(year) %>%
  summarize(totalEmissions = sum(Emissions))

# Bias axis tick labels toward fixed rather than scientific notation.
options(scipen = 5)

# Base-graphics functions draw as a side effect and return NULL, so they cannot
# be chained with `+` the way ggplot layers are (doing so evaluates
# NULL + NULL and prints numeric(0)). The title is passed through `main`.
plot(
  year_sum$year, year_sum$totalEmissions,
  type = "l",
  xlab = "year", ylab = "totalEmissions",
  main = "PM2.5 Emissions"
)
# Total PM2.5 emissions per year, Baltimore only ----
# Keep only records whose fips code is "24510" (the Baltimore, MD code used in
# the plot title below), then sum Emissions within each year.
bmore_yr_sum <- NEI %>%
  filter(fips == "24510") %>%
  group_by(year) %>%
  summarize(totalBaltimoreEmissions = sum(Emissions))

# Bias axis tick labels toward fixed rather than scientific notation.
options(scipen = 5)

# Base-graphics functions draw as a side effect and return NULL, so they cannot
# be chained with `+` the way ggplot layers are (doing so evaluates
# NULL + NULL and prints numeric(0)). The title is passed through `main`.
plot(
  bmore_yr_sum$year, bmore_yr_sum$totalBaltimoreEmissions,
  type = "l",
  xlab = "year", ylab = "totalBaltimoreEmissions",
  main = "PM2.5 Emissions - Baltimore, MD"
)
# Emissions per source type and year ----
# totalEmissions: sum of Emissions for each (year, type) pair.
# difference:     change in totalEmissions relative to the previous recorded
#                 year of the SAME type (NA for the first year of each type).
#
# summarize() only drops the last grouping level, so without the explicit
# regrouping below lag() would run within each year across types instead of
# within each type across years.
type_yr_sum <- NEI %>%
  group_by(year, type) %>%
  summarize(totalEmissions = sum(Emissions)) %>%
  ungroup() %>%
  arrange(type, year) %>%
  group_by(type) %>%
  mutate(difference = totalEmissions - lag(totalEmissions, 1)) %>%
  ungroup()

# par(mfrow = ...) only affects base graphics, and only the last value of a
# braced expression is returned, so each ggplot is printed explicitly. This
# also makes the plots render when the script is run through source().

# Totals are strictly a sum of emissions, shown on a log scale so that types of
# very different magnitude stay readable.
print(
  ggplot(type_yr_sum, aes(x = year, y = totalEmissions, color = type)) +
    geom_line() +
    scale_y_log10()
)

# Differences can be negative, so they are drawn on a linear scale (a log scale
# would turn every decrease into NaN). Rows without a previous year are dropped.
print(
  ggplot(
    filter(type_yr_sum, !is.na(difference)),
    aes(x = year, y = difference, color = type)
  ) +
    geom_line()
)

# Coal-related emissions per year ----
# Keep the joined records whose EI.Sector text contains "Coal" or "coal".
# grep() matches anywhere in the string, so no leading/trailing ".*" is needed.
v <- FULL[grep("[Cc]oal", FULL$EI.Sector), ]

# Sum Emissions of those records within each year.
coal_yr_sum <- v %>%
  group_by(year) %>%
  summarize(totalCoalEmissionsUS = sum(Emissions))

# Built with ggplot() rather than the deprecated qplot(), and printed
# explicitly so the figure is also drawn when the script is run via source().
print(
  ggplot(coal_yr_sum, aes(x = year, y = totalCoalEmissionsUS)) +
    geom_line() +
    ggtitle("Total Emissions from Coal-related Sources")
)

# Vehicle-related emissions per year, Baltimore City ----
# Keep the joined records whose EI.Sector text contains "Vehicle"
# (case-sensitive; grep() matches anywhere in the string).
w <- FULL[grep("Vehicle", FULL$EI.Sector), ]

# Restrict to fips "24510" (labelled Baltimore City in the plot title) and sum
# Emissions within each year.
vehicle_yr_sum <- w %>%
  filter(fips == "24510") %>%
  group_by(year) %>%
  summarize(BaltimoreCityVehicleEmissions = sum(Emissions))

# Built with ggplot() rather than the deprecated qplot(), and printed
# explicitly so the figure is also drawn when the script is run via source().
print(
  ggplot(vehicle_yr_sum, aes(x = year, y = BaltimoreCityVehicleEmissions)) +
    geom_line() +
    ggtitle("Baltimore City Vehicle-related Emissions")
)

# Vehicle-related emissions per year, Baltimore City vs LA County ----
# Keep the joined records whose EI.Sector text contains "Vehicle"
# (case-sensitive; grep() matches anywhere in the string).
w <- FULL[grep("Vehicle", FULL$EI.Sector), ]

# Restrict to the two fips codes of interest, attach a readable county label
# ("06037" -> "LA County", otherwise "Baltimore City"), and sum Emissions for
# each year and county. The fips column is exposed as `County` in the result.
# NOTE(review): despite the "US" suffix, totalVehicleEmissionsUS holds the
# per-county totals; the name is kept for compatibility.
BaltLA_yr_sum <- w %>%
  filter(fips %in% c("06037", "24510")) %>%
  mutate(
    CountyName = ifelse(fips == "06037", "LA County", "Baltimore City")
  ) %>%
  rename(County = fips) %>%
  group_by(year, County, CountyName) %>%
  summarize(totalVehicleEmissionsUS = sum(Emissions)) %>%
  ungroup()

# Log scale keeps both series readable despite their different magnitudes.
# Built with ggplot() rather than the deprecated qplot(), and printed
# explicitly so the figure is also drawn when the script is run via source().
print(
  ggplot(
    BaltLA_yr_sum,
    aes(x = year, y = totalVehicleEmissionsUS, color = CountyName)
  ) +
    geom_line() +
    scale_y_log10() +
    ggtitle("Vehicle-related emissions for Baltimore City vs LA County")
)