# Global knitr chunk option: echo the source code of every chunk in the
# rendered document alongside its output.
knitr::opts_chunk$set(echo = TRUE)
library(tidyr)
library(dplyr)
##
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
##
## filter, lag
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
library(readr)
library(stringr)
library(ggplot2)
# Raw CSV hosted on GitHub (monthly precipitation, San Joaquin, 1913-2014
# according to the file name).
urlfile <- "https://raw.githubusercontent.com/Nhodgkinson/606-project/main/cdec-monthly-precipitation-san-joaquin-1913-2014.csv"

# Read the CSV through a URL connection; readr guesses the column types and
# reports the specification it settled on.
calidata <- read_csv(file = url(urlfile))
## Rows: 102 Columns: 15
## ── Column specification ────────────────────────────────────────────────────────
## Delimiter: ","
## chr (1): Region
## dbl (14): WY, Oct, Nov, Dec, Jan, Feb, Mar, Apr, May, Jun, Jul, Aug, Sep, Total
##
## ℹ Use `spec()` to retrieve the full column specification for this data.
## ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
# Print the imported tibble to check its dimensions and column types.
calidata
## # A tibble: 102 × 15
## Region WY Oct Nov Dec Jan Feb Mar Apr May Jun Jul
## <chr> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl>
## 1 San Joaquin 1913 1.01 2.8 1.26 5.4 1.74 2.96 2.11 2.09 2.77 1.12
## 2 San Joaquin 1914 0.08 4.55 7.91 21.3 5.17 0.94 5.18 1.05 1.07 0.02
## 3 San Joaquin 1915 1.71 0.61 3.92 7.68 9.2 2.73 3.53 6.94 0 0
## 4 San Joaquin 1916 0 1.47 5.87 20 5.87 6.31 0.84 0.67 0 0
## 5 San Joaquin 1917 6.77 1.64 8.19 1.69 12.5 2.78 1.46 1.71 0 0.24
## 6 San Joaquin 1918 0 1.53 1.79 0.97 11.0 11.7 0.42 1.84 0.15 0.2
## 7 San Joaquin 1919 1.69 5.39 2.18 1.45 10.3 5.69 0.53 1.12 0 0
## 8 San Joaquin 1920 0.95 0.78 6.34 1.45 4.29 9.55 4.86 0.15 0.57 0.02
## 9 San Joaquin 1921 5.41 4.36 6.25 9.69 3.33 4.53 0.7 2.25 0.3 0
## 10 San Joaquin 1922 0.58 0.59 13.1 5.52 8.11 6.05 0.85 2.63 0.42 0.53
## # … with 92 more rows, and 3 more variables: Aug <dbl>, Sep <dbl>, Total <dbl>
# Year over Year info
# One row per year with the yearly total. Columns are picked by name instead
# of by position (previously 1, 2 and 15) so that a change in the CSV's column
# order cannot silently select the wrong data; WY is renamed to Year in the
# same step. `Avg Rain` is the mean of Total across all rows, so it holds the
# same value on every row.
cyeardf <- calidata %>%
  select(Region, Year = WY, Total) %>%
  mutate(`Avg Rain` = mean(Total))
# Month Avgs
# Reshape the twelve month columns (Oct through Sep) into long form: one row
# per Region/Year/Month, with the monthly value stored in `n`.
#
# The month columns and the dropped Total column are referenced by name rather
# than by position (previously 3:14 and column 3), so the code keeps working
# if the CSV layout changes.
#
# gather() is superseded by tidyr::pivot_longer(), but it is kept on purpose:
# pivot_longer() would return the rows year-major instead of month-major,
# changing the row order seen by everything downstream.
#
# `Avg Rain` is the mean of `n` within each Month, repeated on every row of
# that month. The result is still grouped by Month, exactly as before; call
# ungroup() first if a later step should operate across all months.
cmdf <- calidata %>%
  gather("Month", "n", Oct:Sep) %>%
  rename(Year = WY) %>%
  select(-Total) %>%
  group_by(Month) %>%
  mutate(`Avg Rain` = mean(n))

# Print the long-format monthly table.
cmdf
## # A tibble: 1,224 × 5
## # Groups: Month [12]
## Region Year Month n `Avg Rain`
## <chr> <dbl> <chr> <dbl> <dbl>
## 1 San Joaquin 1913 Oct 1.01 2.06
## 2 San Joaquin 1914 Oct 0.08 2.06
## 3 San Joaquin 1915 Oct 1.71 2.06
## 4 San Joaquin 1916 Oct 0 2.06
## 5 San Joaquin 1917 Oct 6.77 2.06
## 6 San Joaquin 1918 Oct 0 2.06
## 7 San Joaquin 1919 Oct 1.69 2.06
## 8 San Joaquin 1920 Oct 0.95 2.06
## 9 San Joaquin 1921 Oct 5.41 2.06
## 10 San Joaquin 1922 Oct 0.58 2.06
## # … with 1,214 more rows
# Print the yearly table (Region, Year, Total, Avg Rain).
cyeardf
## # A tibble: 102 × 4
## Region Year Total `Avg Rain`
## <chr> <dbl> <dbl> <dbl>
## 1 San Joaquin 1913 24.6 38.6
## 2 San Joaquin 1914 48.0 38.6
## 3 San Joaquin 1915 36.4 38.6
## 4 San Joaquin 1916 43 38.6
## 5 San Joaquin 1917 37.1 38.6
## 6 San Joaquin 1918 32.4 38.6
## 7 San Joaquin 1919 30.2 38.6
## 8 San Joaquin 1920 30.7 38.6
## 9 San Joaquin 1921 37.4 38.6
## 10 San Joaquin 1922 38.5 38.6
## # … with 92 more rows
# Per-column summary statistics for the long-format monthly table.
summary(cmdf)
## Region Year Month n
## Length:1224 Min. :1913 Length:1224 Min. : 0.000
## Class :character 1st Qu.:1938 Class :character 1st Qu.: 0.280
## Mode :character Median :1964 Mode :character Median : 1.645
## Mean :1964 Mean : 3.213
## 3rd Qu.:1989 3rd Qu.: 4.803
## Max. :2014 Max. :28.710
## Avg Rain
## Min. :0.1641
## 1st Qu.:0.6314
## Median :2.7466
## Mean :3.2132
## 3rd Qu.:5.9208
## Max. :6.8616
# Per-column summary statistics for the yearly table.
summary(cyeardf)
## Region Year Total Avg Rain
## Length:102 Min. :1913 Min. :14.63 Min. :38.56
## Class :character 1st Qu.:1938 1st Qu.:28.40 1st Qu.:38.56
## Mode :character Median :1964 Median :36.86 Median :38.56
## Mean :1964 Mean :38.56 Mean :38.56
## 3rd Qu.:1989 3rd Qu.:44.45 3rd Qu.:38.56
## Max. :2014 Max. :77.41 Max. :38.56