library(tidyverse)
## -- Attaching packages --------------------------------------------------------------- tidyverse 1.3.0 --
## v ggplot2 3.3.2     v purrr   0.3.4
## v tibble  3.0.1     v dplyr   1.0.0
## v tidyr   1.1.0     v stringr 1.4.0
## v readr   1.3.1     v forcats 0.5.0
## -- Conflicts ------------------------------------------------------------------ tidyverse_conflicts() --
## x dplyr::filter() masks stats::filter()
## x dplyr::lag()    masks stats::lag()
library(forecast)
## Registered S3 method overwritten by 'quantmod':
##   method            from
##   as.zoo.data.frame zoo
library(pastecs)
## 
## Attaching package: 'pastecs'
## The following objects are masked from 'package:dplyr':
## 
##     first, last
## The following object is masked from 'package:tidyr':
## 
##     extract
contract_payments_all <- read.csv('Lambda_cleanpayments.csv')

View(contract_payments_all)
#rename columns
colnames(contract_payments_all) [1] <- "month"

#create separate dataframes for actual and expected
contract_payments_actual <- filter(contract_payments_all, e.or.a == "actual")
contract_payments_expected <- filter(contract_payments_all, e.or.a == "expected")

#create separate dataframes for new and cumulative
contract_payments_new <- filter(contract_payments_all, n.or.c == "new")
contract_payments_cumulative <- filter(contract_payments_all, n.or.c == "cumulative")
#descriptive stats
stat.desc(contract_payments_new)
##          month         year n.or.c e.or.a paying.contracts
## nbr.val     NA 2.400000e+01     NA     NA       17.0000000
## nbr.null    NA 0.000000e+00     NA     NA        0.0000000
## nbr.na      NA 0.000000e+00     NA     NA        7.0000000
## min         NA 2.020000e+03     NA     NA        3.0000000
## max         NA 2.021000e+03     NA     NA       41.0000000
## range       NA 1.000000e+00     NA     NA       38.0000000
## sum         NA 4.848200e+04     NA     NA      337.0000000
## median      NA 2.020000e+03     NA     NA       20.0000000
## mean        NA 2.020083e+03     NA     NA       19.8235294
## SE.mean     NA 5.763034e-02     NA     NA        2.4573349
## CI.mean     NA 1.192174e-01     NA     NA        5.2093173
## var         NA 7.971014e-02     NA     NA      102.6544118
## std.dev     NA 2.823299e-01     NA     NA       10.1318513
## coef.var    NA 1.397615e-04     NA     NA        0.5111023
stat.desc(contract_payments_cumulative)
##          month         year n.or.c e.or.a paying.contracts
## nbr.val     NA 2.400000e+01     NA     NA       17.0000000
## nbr.null    NA 0.000000e+00     NA     NA        0.0000000
## nbr.na      NA 0.000000e+00     NA     NA        7.0000000
## min         NA 2.020000e+03     NA     NA        3.0000000
## max         NA 2.021000e+03     NA     NA      266.0000000
## range       NA 1.000000e+00     NA     NA      263.0000000
## sum         NA 4.848200e+04     NA     NA     1641.0000000
## median      NA 2.020000e+03     NA     NA       71.0000000
## mean        NA 2.020083e+03     NA     NA       96.5294118
## SE.mean     NA 5.763034e-02     NA     NA       20.9230238
## CI.mean     NA 1.192174e-01     NA     NA       44.3548290
## var         NA 7.971014e-02     NA     NA     7442.1397059
## std.dev     NA 2.823299e-01     NA     NA       86.2678370
## coef.var    NA 1.397615e-04     NA     NA        0.8936948
#graph new
ggplot(contract_payments_new, aes(x=month, y=paying.contracts))+
  geom_bar(stat = 'identity', aes(fill = month, colour = month))+
  scale_fill_brewer(palette = "Paired")+
  scale_x_discrete(name = "Month", limits=c("Feb", "Mar", "Apr", "May", "June", "July", "Aug", "Sept", "Oct", "Nov", "Dec", "Jan"))+
  facet_grid(rows = vars(e.or.a))+
  ggtitle("New Lambda Contracts")+
  ylab("# of Paying Contracts")+
  theme_bw()+
  theme(axis.text = element_text(size = 12), axis.title = element_text(size = 14), plot.title = element_text(size = 18), legend.title = element_text(size = 14), plot.title.position = "panel")
## Warning: Removed 7 rows containing missing values (position_stack).

#graph cumulative
ggplot(contract_payments_cumulative, aes(x=month, y=paying.contracts))+
  geom_bar(stat = 'identity', aes(fill = month, colour = month))+
  scale_fill_brewer(palette = "Set3")+
  scale_x_discrete(name = "Month", limits=c("Feb", "Mar", "Apr", "May", "June", "July", "Aug", "Sept", "Oct", "Nov", "Dec", "Jan"))+
  facet_grid(rows = vars(e.or.a))+
  ggtitle("Cumulative Lambda Contracts")+
  ylab("# of Paying Contracts")+
  theme_bw()+
  theme(axis.text = element_text(size = 12), axis.title = element_text(size = 14), plot.title = element_text(size = 18), legend.title = element_text(size = 14), plot.title.position = "panel")
## Warning: Removed 7 rows containing missing values (position_stack).