# Bring the built-in `airquality` data set into the workspace.
data(airquality)
# Preview the first six observations, then print per-column summary statistics.
head(airquality, n = 6L)
summary(airquality)
##      Ozone           Solar.R           Wind             Temp      
##  Min.   :  1.00   Min.   :  7.0   Min.   : 1.700   Min.   :56.00  
##  1st Qu.: 18.00   1st Qu.:115.8   1st Qu.: 7.400   1st Qu.:72.00  
##  Median : 31.50   Median :205.0   Median : 9.700   Median :79.00  
##  Mean   : 42.13   Mean   :185.9   Mean   : 9.958   Mean   :77.88  
##  3rd Qu.: 63.25   3rd Qu.:258.8   3rd Qu.:11.500   3rd Qu.:85.00  
##  Max.   :168.00   Max.   :334.0   Max.   :20.700   Max.   :97.00  
##  NA's   :37       NA's   :7                                       
##      Month            Day      
##  Min.   :5.000   Min.   : 1.0  
##  1st Qu.:6.000   1st Qu.: 8.0  
##  Median :7.000   Median :16.0  
##  Mean   :6.993   Mean   :15.8  
##  3rd Qu.:8.000   3rd Qu.:23.0  
##  Max.   :9.000   Max.   :31.0  
## 
# Quantify how much the ozone readings vary: variance first, then standard
# deviation. Missing readings are dropped before each statistic is computed.
with(airquality, var(Ozone, na.rm = TRUE))
## [1] 1088.201
with(airquality, sd(Ozone, na.rm = TRUE))
## [1] 32.98788
# Scatterplot of ozone against temperature, to see whether hotter days tend to
# have higher ozone readings.
with(
  airquality,
  plot(
    x = Temp, y = Ozone,
    pch = 19, col = "blue",
    xlab = "Temperature (F)",
    ylab = "Ozone (ppb)",
    main = "Ozone vs Temperature"
  )
)