# Load a built in dataset for airquality
data("airquality")
# Display first few rows
head(airquality)
summary(airquality)
## Ozone Solar.R Wind Temp
## Min. : 1.00 Min. : 7.0 Min. : 1.700 Min. :56.00
## 1st Qu.: 18.00 1st Qu.:115.8 1st Qu.: 7.400 1st Qu.:72.00
## Median : 31.50 Median :205.0 Median : 9.700 Median :79.00
## Mean : 42.13 Mean :185.9 Mean : 9.958 Mean :77.88
## 3rd Qu.: 63.25 3rd Qu.:258.8 3rd Qu.:11.500 3rd Qu.:85.00
## Max. :168.00 Max. :334.0 Max. :20.700 Max. :97.00
## NA's :37 NA's :7
## Month Day
## Min. :5.000 Min. : 1.0
## 1st Qu.:6.000 1st Qu.: 8.0
## Median :7.000 Median :16.0
## Mean :6.993 Mean :15.8
## 3rd Qu.:8.000 3rd Qu.:23.0
## Max. :9.000 Max. :31.0
##
#Now understanding how much the ozone levels vary:
var(airquality$Ozone, na.rm = TRUE)
## [1] 1088.201
sd(airquality$Ozone, na.rm = TRUE)
## [1] 32.98788
#Building a scatterplot of temperature vs ozone in order to see if hotter days have higher ozone
plot(airquality$Temp, airquality$Ozone,
main = "Ozone vs Temperature",
xlab = "Temperature (F)",
ylab = "Ozone (ppb)",
col = "blue", pch = 19)
