# Show each chunk's source code in the knitted output by default.
knitr::opts_chunk$set(echo = TRUE)
library(tidyr)
library(dplyr)
## 
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(readr)
library(stringr)
library(ggplot2)

# Location of the monthly precipitation CSV (San Joaquin, 1913-2014, per the
# file name) in the project's GitHub repository.
urlfile <- "https://raw.githubusercontent.com/Nhodgkinson/606-project/main/cdec-monthly-precipitation-san-joaquin-1913-2014.csv"

# read_csv() downloads http(s) paths itself, so no explicit url() connection
# is needed.
calidata <- read_csv(urlfile)
## Rows: 102 Columns: 15
## ── Column specification ────────────────────────────────────────────────────────
## Delimiter: ","
## chr  (1): Region
## dbl (14): WY, Oct, Nov, Dec, Jan, Feb, Mar, Apr, May, Jun, Jul, Aug, Sep, Total
## 
## ℹ Use `spec()` to retrieve the full column specification for this data.
## ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
# Display the imported table.
calidata
## # A tibble: 102 × 15
##    Region         WY   Oct   Nov   Dec   Jan   Feb   Mar   Apr   May   Jun   Jul
##    <chr>       <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl>
##  1 San Joaquin  1913  1.01  2.8   1.26  5.4   1.74  2.96  2.11  2.09  2.77  1.12
##  2 San Joaquin  1914  0.08  4.55  7.91 21.3   5.17  0.94  5.18  1.05  1.07  0.02
##  3 San Joaquin  1915  1.71  0.61  3.92  7.68  9.2   2.73  3.53  6.94  0     0   
##  4 San Joaquin  1916  0     1.47  5.87 20     5.87  6.31  0.84  0.67  0     0   
##  5 San Joaquin  1917  6.77  1.64  8.19  1.69 12.5   2.78  1.46  1.71  0     0.24
##  6 San Joaquin  1918  0     1.53  1.79  0.97 11.0  11.7   0.42  1.84  0.15  0.2 
##  7 San Joaquin  1919  1.69  5.39  2.18  1.45 10.3   5.69  0.53  1.12  0     0   
##  8 San Joaquin  1920  0.95  0.78  6.34  1.45  4.29  9.55  4.86  0.15  0.57  0.02
##  9 San Joaquin  1921  5.41  4.36  6.25  9.69  3.33  4.53  0.7   2.25  0.3   0   
## 10 San Joaquin  1922  0.58  0.59 13.1   5.52  8.11  6.05  0.85  2.63  0.42  0.53
## # … with 92 more rows, and 3 more variables: Aug <dbl>, Sep <dbl>, Total <dbl>
# Year-over-year info: keep Region, the year (WY, renamed to Year) and the
# yearly Total, then add the mean of Total over all rows as a constant
# `Avg Rain` column.
# Columns are selected by name rather than position so a change in the CSV
# column layout fails loudly instead of silently picking the wrong columns.
cyeardf <- calidata %>%
  select(Region, Year = WY, Total) %>%
  mutate(`Avg Rain` = mean(Total))

# Month averages: reshape the twelve month columns (Oct through Sep) into
# long form with one row per Region / Year / Month, and attach each month's
# mean value across all rows as `Avg Rain`.
cmdf <- calidata %>%
  pivot_longer(cols = Oct:Sep, names_to = "Month", values_to = "n") %>%
  # pivot_longer() emits rows record by record; reorder them month by month,
  # following the original column order, so all Oct rows come first, then
  # Nov, and so on.
  arrange(match(Month, names(calidata))) %>%
  rename(Year = WY) %>%
  group_by(Month) %>%
  mutate(`Avg Rain` = mean(n)) %>%
  # The yearly Total is not meaningful on per-month rows; drop it by name.
  select(-Total)
# NOTE: cmdf is intentionally left grouped by Month, as before; call
# ungroup() before any whole-table aggregation.


# Display the long-format monthly table.
cmdf
## # A tibble: 1,224 × 5
## # Groups:   Month [12]
##    Region       Year Month     n `Avg Rain`
##    <chr>       <dbl> <chr> <dbl>      <dbl>
##  1 San Joaquin  1913 Oct    1.01       2.06
##  2 San Joaquin  1914 Oct    0.08       2.06
##  3 San Joaquin  1915 Oct    1.71       2.06
##  4 San Joaquin  1916 Oct    0          2.06
##  5 San Joaquin  1917 Oct    6.77       2.06
##  6 San Joaquin  1918 Oct    0          2.06
##  7 San Joaquin  1919 Oct    1.69       2.06
##  8 San Joaquin  1920 Oct    0.95       2.06
##  9 San Joaquin  1921 Oct    5.41       2.06
## 10 San Joaquin  1922 Oct    0.58       2.06
## # … with 1,214 more rows
# Display the yearly totals table.
cyeardf
## # A tibble: 102 × 4
##    Region       Year Total `Avg Rain`
##    <chr>       <dbl> <dbl>      <dbl>
##  1 San Joaquin  1913  24.6       38.6
##  2 San Joaquin  1914  48.0       38.6
##  3 San Joaquin  1915  36.4       38.6
##  4 San Joaquin  1916  43         38.6
##  5 San Joaquin  1917  37.1       38.6
##  6 San Joaquin  1918  32.4       38.6
##  7 San Joaquin  1919  30.2       38.6
##  8 San Joaquin  1920  30.7       38.6
##  9 San Joaquin  1921  37.4       38.6
## 10 San Joaquin  1922  38.5       38.6
## # … with 92 more rows
# Per-column summary statistics for the monthly table.
summary(cmdf)
##     Region               Year         Month                 n         
##  Length:1224        Min.   :1913   Length:1224        Min.   : 0.000  
##  Class :character   1st Qu.:1938   Class :character   1st Qu.: 0.280  
##  Mode  :character   Median :1964   Mode  :character   Median : 1.645  
##                     Mean   :1964                      Mean   : 3.213  
##                     3rd Qu.:1989                      3rd Qu.: 4.803  
##                     Max.   :2014                      Max.   :28.710  
##     Avg Rain     
##  Min.   :0.1641  
##  1st Qu.:0.6314  
##  Median :2.7466  
##  Mean   :3.2132  
##  3rd Qu.:5.9208  
##  Max.   :6.8616
# Per-column summary statistics for the yearly table.
summary(cyeardf)
##     Region               Year          Total          Avg Rain    
##  Length:102         Min.   :1913   Min.   :14.63   Min.   :38.56  
##  Class :character   1st Qu.:1938   1st Qu.:28.40   1st Qu.:38.56  
##  Mode  :character   Median :1964   Median :36.86   Median :38.56  
##                     Mean   :1964   Mean   :38.56   Mean   :38.56  
##                     3rd Qu.:1989   3rd Qu.:44.45   3rd Qu.:38.56  
##                     Max.   :2014   Max.   :77.41   Max.   :38.56