Part A: Moving Average
#install.packages("dplyr")
#install.packages("zoo")
library(dplyr)
##
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
##
## filter, lag
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
library(zoo)
##
## Attaching package: 'zoo'
## The following objects are masked from 'package:base':
##
## as.Date, as.Date.numeric
Import data
df <- data.frame(month=c(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12),
contracts=c(240,352,230,260,280,322,220,310,240,310,240,230))
Identify descriptive statistics
summary(df)
## month contracts
## Min. : 1.00 Min. :220.0
## 1st Qu.: 3.75 1st Qu.:237.5
## Median : 6.50 Median :250.0
## Mean : 6.50 Mean :269.5
## 3rd Qu.: 9.25 3rd Qu.:310.0
## Max. :12.00 Max. :352.0
Interpretation: The average contract value over a 12 month period is $269.5 million.
Create time series plot
plot(df$month, df$contracts, type = "o", col = "blue", xlab = "Month", ylab = "Contracts",
main = "Alabama Building Contracts Plot")

# The time series plot exhibits a random variation
Manually calculate the three-month moving average
# Calculate the three-month moving average manually
df$avg_contracts3 <- c(NA, NA,
(df$contracts[1] + df$contracts[2] + df$contracts[3]) / 3,
(df$contracts[2] + df$contracts[3] + df$contracts[4]) / 3,
(df$contracts[3] + df$contracts[4] + df$contracts[5]) / 3,
(df$contracts[4] + df$contracts[5] + df$contracts[6]) / 3,
(df$contracts[5] + df$contracts[6] + df$contracts[7]) / 3,
(df$contracts[6] + df$contracts[7] + df$contracts[8]) / 3,
(df$contracts[7] + df$contracts[8] + df$contracts[9]) / 3,
(df$contracts[8] + df$contracts[9] + df$contracts[10]) / 3,
(df$contracts[9] + df$contracts[10] + df$contracts[11]) / 3,
(df$contracts[10] + df$contracts[11] + df$contracts[12]) / 3
)
Calculate squared errors (For months where moving average is
available)
df <- df %>%
mutate(
squared_error= ifelse(is.na(avg_contracts3), NA, (contracts - avg_contracts3)^2)
)
Compute MSE (excluding initial months with NA values)
mse <- mean(df$squared_error, na.rm = TRUE)
mse #MSE is 2040.44
## [1] 996.8
Part B: Exponential smoothing
alpha <- 0.2
exp_smooth <- rep(NA, length(df$contracts))
exp_smooth[1] <- df$contracts[1] #starting point
for (i in 2: length(df$contracts)) {
exp_smooth[i] <- alpha * df$contracts[i-1] + (1 - alpha) * exp_smooth[i-1]
}
mse_exp_smooth <- mean((df$contracts[2:12] - exp_smooth[2:12])^2)
mse_exp_smooth #MSE is 2593.76
## [1] 2593.762
Compare the three-month moving average approach with the exponential
smoothing approach to see which one is more accurate:
better_method <- ifelse(mse < mse_exp_smooth, "3 month moving average", "exponential smoothing")
Conclusion
list(
MSE_Moving_Average = mse,
MSE_Exponential_Smoothing = mse_exp_smooth,
Better_Method = better_method
)
## $MSE_Moving_Average
## [1] 996.8
##
## $MSE_Exponential_Smoothing
## [1] 2593.762
##
## $Better_Method
## [1] "3 month moving average"
The three month moving average provides more accurate forecasts based on MSE.