# Load the raw Madrid weather table.
madrid <- read.csv("madrid.csv")

# Count the missing values in every column and print the result.
# The count is taken column by column with vapply() rather than with
# apply(madrid, 2, ...): apply() would first coerce the whole data frame to a
# single character matrix. The result is the same named integer vector.
(cols_withNa <- vapply(madrid, function(column) sum(is.na(column)), integer(1)))
##                        CET           Max.TemperatureC 
##                          0                          2 
##          Mean.TemperatureC           Min.TemperatureC 
##                          3                          2 
##                 Dew.PointC             MeanDew.PointC 
##                          2                          2 
##              Min.DewpointC               Max.Humidity 
##                          2                          2 
##              Mean.Humidity               Min.Humidity 
##                          2                          2 
##  Max.Sea.Level.PressurehPa Mean.Sea.Level.PressurehPa 
##                          0                          0 
##  Min.Sea.Level.PressurehPa           Max.VisibilityKm 
##                          0                        940 
##          Mean.VisibilityKm           Min.VisibilitykM 
##                        940                        940 
##         Max.Wind.SpeedKm.h        Mean.Wind.SpeedKm.h 
##                          0                          0 
##         Max.Gust.SpeedKm.h            Precipitationmm 
##                       3306                          0 
##                 CloudCover                     Events 
##                       1372                          0 
##             WindDirDegrees 
##                          0
# Attach dplyr for %>% and select(). library() is used instead of require()
# so that a missing package stops the script here with a clear error rather
# than at the first use of %>% below.
library(dplyr)
## 
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union

# Drop the sparsely populated columns (between 940 and 3306 missing values
# each in the per-column NA counts printed above).
madrid <- madrid %>%
  select(-c(
    CloudCover, Max.Gust.SpeedKm.h,
    Max.VisibilityKm, Mean.VisibilityKm, Min.VisibilitykM
  ))

# Convert the CET column to Date class, then rename it to "Date". The rename
# targets the column by name instead of by position, so it keeps working if
# the column order of the input ever changes.
madrid$CET <- as.Date(madrid$CET)
names(madrid)[names(madrid) == "CET"] <- "Date"

# Keep only the rows that have a value in every remaining column.
madrid <- madrid[complete.cases(madrid), ]

# read.csv() already returns a data.frame; kept as a defensive normalization.
madrid <- as.data.frame(madrid)

# One line chart per daily series, drawn in the order listed below.
# local() keeps the lookup table and loop variable out of the global
# environment.
local({
  # Column name -> plot title.
  series_titles <- c(
    Mean.TemperatureC = "Mean Temperature (C)",
    MeanDew.PointC = "Mean DewPoint",
    Mean.Humidity = "Mean Humidity",
    Mean.Sea.Level.PressurehPa = "Mean Sea Level Pressure (hPa)",
    Mean.Wind.SpeedKm.h = "Mean Windspeed (km/h)",
    Precipitationmm = "Precipitation (mm)"
  )

  for (series in names(series_titles)) {
    plot(
      madrid[[series]],
      type = "l",
      main = series_titles[[series]],
      # Reproduce the y-axis label that plot() derives from a
      # `madrid$<column>` argument, so the figures keep their labels.
      ylab = paste0("madrid$", series)
    )
  }
})

# Treat the event labels as categories.
madrid[["Events"]] <- as.factor(madrid[["Events"]])

# Bar chart of how many rows carry each event label. This is the chart that
# plot() produces for a factor; las = 2 sets the axis labels perpendicular to
# the axes.
barplot(table(madrid[["Events"]]), main = "Events", las = 2)

# NOTE(review): nothing in this section calls a stringr function (grepl() is
# base R); the attach is kept in case code outside this section relies on it.
require(stringr)
## Loading required package: stringr

#' Plot a slice of daily precipitation and mark the days with rain events
#'
#' Draws `data$Precipitationmm[rows]` as a red line and adds a dotted vertical
#' line at every position whose `data$Events` entry contains "Rain"
#' (case-insensitive).
#'
#' @param data Data frame with `Precipitationmm` and `Events` columns.
#' @param rows Integer row indices of `data` to plot.
#' @param title Main title of the plot.
#' @return Invisibly, the positions within `rows` (not row numbers of `data`)
#'   that were marked as rainy.
plot_precipitation_with_rain <- function(data, rows, title) {
  plot(
    data$Precipitationmm[rows],
    type = "l",
    main = title,
    col = "red",
    xlab = "Index",
    ylab = "Precipitation (mm)"
  )
  rainy <- which(grepl("Rain", data$Events[rows], ignore.case = TRUE))
  # Positions are relative to the slice, which is also what the x axis shows.
  abline(v = rainy, lty = 3, lwd = 0.1)
  invisible(rainy)
}

# The series is shown in two figures, split after row 4000.
split_day <- 4000L
n_days <- nrow(madrid)

early_rows <- seq_len(min(split_day, n_days))
rainydays <- plot_precipitation_with_rain(
  madrid,
  early_rows,
  paste("Precipitation (mm) first", length(early_rows), "days")
)

# The second figure starts at row 4001, so row 4000 is not drawn twice, and
# runs to the actual last row instead of a hard-coded 6809.
# NOTE(review): assumes 6809 was meant to be the last row of `madrid`
# (4000 + 2809, per the original title) -- confirm.
if (n_days > split_day) {
  late_rows <- seq(split_day + 1L, n_days)
  rainydays <- plot_precipitation_with_rain(
    madrid,
    late_rows,
    paste("Precipitation (mm) last", length(late_rows), "days")
  )
}