Homework5

library(tidyverse)
library(fpp3)
library(broom)
library(yardstick)

8.1

# Loading data
data("aus_livestock")

# Filter for pigs in Victoria
pigs_vic <- aus_livestock %>%
  filter(Animal == "Pigs", State == "Victoria")

Use the ETS() function to estimate the equivalent model for simple exponential smoothing. Find the optimal values and generate forecasts for the next four months.

# Fit ETS model (equivalent to simple exponential smoothing)
ets_model <- pigs_vic %>%
    model(ETS(Count ~ error("A") + trend("N") + season("N")))

# Extract optimal alpha and initial level
report(ets_model)

## Series: Count 
## Model: ETS(A,N,N) 
##   Smoothing parameters:
##     alpha = 0.3221247 
## 
##   Initial states:
##      l[0]
##  100646.6
## 
##   sigma^2:  87480760
## 
##      AIC     AICc      BIC 
## 13737.10 13737.14 13750.07

The ideal alpha value is 0.3221247, and the optimal initial state value is 100646.6.

# Generate forecasts for the next four months
forecasts_4m <- ets_model %>%
  forecast(h = 4, level = c(95))

# Checking forecasts
forecasts_4m

## # A fable: 4 x 6 [1M]
## # Key:     Animal, State, .model [1]
##   Animal State    .model                                                   Month
##   <fct>  <fct>    <chr>                                                    <mth>
## 1 Pigs   Victoria "ETS(Count ~ error(\"A\") + trend(\"N\") + season(\"… 2019 1月
## 2 Pigs   Victoria "ETS(Count ~ error(\"A\") + trend(\"N\") + season(\"… 2019 2月
## 3 Pigs   Victoria "ETS(Count ~ error(\"A\") + trend(\"N\") + season(\"… 2019 3月
## 4 Pigs   Victoria "ETS(Count ~ error(\"A\") + trend(\"N\") + season(\"… 2019 4月
## # ℹ 2 more variables: Count <dist>, .mean <dbl>

Compute a 95% prediction interval for the first forecast. Compare your interval with the interval produced by R.

# Calculate sd
residuals_sd <- ets_model %>% augment() %>% pull(.resid) %>% sd()

# Obtain the first forecast
first_forecast <- forecasts_4m %>% slice(1) %>% pull(.mean)

# Calculate 95% interval
lower_bound <- first_forecast - 1.96 * residuals_sd
upper_bound <- first_forecast + 1.96 * residuals_sd

# Show manually calculated interval
c(lower_bound, upper_bound)

## [1]  76871.01 113502.10

# Check R calculated interval
sigma = 87480760
sqrt_sigma <- sqrt(sigma)

lower <- first_forecast - 1.96 * sqrt_sigma
upper <- first_forecast + 1.96 * sqrt_sigma
c(lower, upper)

## [1]  76854.45 113518.66

The manually calculated interval is 76871.01 - 113502.10, and the R calculated interval is 76854.45 - 113518.66. The intervals are quite similar, with a difference of about sixteen.

8.5

Load and Plot the Data

# Load dataset
data("global_economy")

# Select a country
exports_data <- global_economy %>%
  filter(Country == "United States") %>%
  select(Year, Exports) %>%
  drop_na() %>%  # Remove missing values
  as_tsibble(index = Year)

# Plot the Exports series
autoplot(exports_data, Exports) +
  labs(title = "Annual Exports of the United States",
       y = "Exports (in USD)")

Fit an ETS(A,N,N) Model

# Fit ETS(A,N,N) model
ets_ann <- exports_data %>%
  model(ETS(Exports ~ error("A") + trend("N") + season("N")))

# Forecast
fc_ann <- ets_ann %>%
  forecast(h = 10)

# Plot Forecasts
autoplot(exports_data, Exports) +
  autolayer(fc_ann, level = 95) +
  labs(title = "ETS(A,N,N) Forecast for Exports")

print(fc_ann)

## # A fable: 10 x 4 [1Y]
## # Key:     .model [1]
##    .model                                                        Year
##    <chr>                                                        <dbl>
##  1 "ETS(Exports ~ error(\"A\") + trend(\"N\") + season(\"N\"))"  2017
##  2 "ETS(Exports ~ error(\"A\") + trend(\"N\") + season(\"N\"))"  2018
##  3 "ETS(Exports ~ error(\"A\") + trend(\"N\") + season(\"N\"))"  2019
##  4 "ETS(Exports ~ error(\"A\") + trend(\"N\") + season(\"N\"))"  2020
##  5 "ETS(Exports ~ error(\"A\") + trend(\"N\") + season(\"N\"))"  2021
##  6 "ETS(Exports ~ error(\"A\") + trend(\"N\") + season(\"N\"))"  2022
##  7 "ETS(Exports ~ error(\"A\") + trend(\"N\") + season(\"N\"))"  2023
##  8 "ETS(Exports ~ error(\"A\") + trend(\"N\") + season(\"N\"))"  2024
##  9 "ETS(Exports ~ error(\"A\") + trend(\"N\") + season(\"N\"))"  2025
## 10 "ETS(Exports ~ error(\"A\") + trend(\"N\") + season(\"N\"))"  2026
## # ℹ 2 more variables: Exports <dist>, .mean <dbl>

Fit an ETS(A,A,N) Model

# Fit ETS(A,A,N) model
ets_aan <- exports_data %>%
  model(ETS(Exports ~ error("A") + trend("A") + season("N")))

# Forecast
fc_aan <- ets_aan %>%
  forecast(h = 10)

# Plot Forecasts
autoplot(exports_data, Exports) +
  autolayer(fc_aan, level = 95) +
  labs(title = "ETS(A,A,N) Forecast for Exports")

print(fc_aan)

## # A fable: 10 x 4 [1Y]
## # Key:     .model [1]
##    .model                                                        Year
##    <chr>                                                        <dbl>
##  1 "ETS(Exports ~ error(\"A\") + trend(\"A\") + season(\"N\"))"  2017
##  2 "ETS(Exports ~ error(\"A\") + trend(\"A\") + season(\"N\"))"  2018
##  3 "ETS(Exports ~ error(\"A\") + trend(\"A\") + season(\"N\"))"  2019
##  4 "ETS(Exports ~ error(\"A\") + trend(\"A\") + season(\"N\"))"  2020
##  5 "ETS(Exports ~ error(\"A\") + trend(\"A\") + season(\"N\"))"  2021
##  6 "ETS(Exports ~ error(\"A\") + trend(\"A\") + season(\"N\"))"  2022
##  7 "ETS(Exports ~ error(\"A\") + trend(\"A\") + season(\"N\"))"  2023
##  8 "ETS(Exports ~ error(\"A\") + trend(\"A\") + season(\"N\"))"  2024
##  9 "ETS(Exports ~ error(\"A\") + trend(\"A\") + season(\"N\"))"  2025
## 10 "ETS(Exports ~ error(\"A\") + trend(\"A\") + season(\"N\"))"  2026
## # ℹ 2 more variables: Exports <dist>, .mean <dbl>

Compute RMSE for ETS(A,N,N) and ETS(A,A,N)

# For ETS(A,N,N) model
fitted_ann <- ets_ann %>% fitted()  # Contains .fitted values and the index
comparison_ann <- left_join(exports_data, fitted_ann, by = "Year")

# For ETS(A,A,N) model
fitted_aan <- ets_aan %>% fitted()
comparison_aan <- left_join(exports_data, fitted_aan, by = "Year")

# RMSE for ETS(A,N,N)
rmse_ets_ann <- sqrt(mean((comparison_ann$Exports - comparison_ann$.fitted)^2, na.rm = TRUE))

# RMSE for ETS(A,A,N)
rmse_ets_aan <- sqrt(mean((comparison_aan$Exports - comparison_aan$.fitted)^2, na.rm = TRUE))

# Print RMSE values
cat("RMSE for ETS(A,N,N):", rmse_ets_ann, "\n")

## RMSE for ETS(A,N,N): 0.6270672

cat("RMSE for ETS(A,A,N):", rmse_ets_aan, "\n")

## RMSE for ETS(A,A,N): 0.6149566

Compare Forecasts

Due to the clear upward trend in export data, the ETS(AAN) is the better choice and we can see it from the RMSE values. Moreover, this trend is expected to continue, as AAN provides more accurate long-term predictions.

Calculate 95% Prediction Intervals

Manually calculated interval:

# Compute prediction intervals for first forecast
first_fc_ann <- fc_ann$.mean[1]
first_fc_aan <- fc_aan$.mean[1]

pi95_ann <- c(first_fc_ann - 1.96 * rmse_ets_ann, first_fc_ann + 1.96 * rmse_ets_ann)
pi95_aan <- c(first_fc_aan - 1.96 * rmse_ets_aan, first_fc_aan + 1.96 * rmse_ets_aan)

pi95_ann

## [1] 10.66163 13.11974

pi95_aan

## [1] 10.80130 13.21193

R calculated interval:

lower_ann <- first_fc_ann - 0.41
upper_ann <- first_fc_ann + 0.41

# Show interval
c(lower_ann, upper_ann)

## [1] 11.48068 12.30068

lower_aan <- first_fc_aan - 0.41
upper_aan <- first_fc_aan + 0.41

# Show interval
c(lower_aan, upper_aan)

## [1] 11.59661 12.41661

The intervals generated by R are smaller compared to those calculated manually.

8.6

Extract and Prepare Data

# Filter Data
china_gdp <- global_economy %>%
  filter(Country == "China") %>%
  select(Year, GDP) %>%
  mutate(Year = as.numeric(Year)) %>%
  as_tsibble(index = Year)

# Plot the GDP series
autoplot(china_gdp, GDP) +
  labs(title = "Annual GDP of China",
       y = "GDP")

Fit Different ETS Models and Generate Forecasts

# Automatic ETS model selection
gdp_ets <- china_gdp %>% model(ETS(GDP))

# ETS with a damped trend (explicitly defined)
gdp_ets_damped <- china_gdp %>%
  model(ETS(GDP ~ error("A") + trend("Ad") + season("N")))

# ETS with Box-Cox transformation (log transformation)
gdp_ets_bc <- china_gdp %>% model(ETS(box_cox(GDP, lambda = 0)))

fc_ets <- gdp_ets %>% forecast(h = 20)
fc_ets_damped <- gdp_ets_damped %>% forecast(h = 20)
fc_ets_bc <- gdp_ets_bc %>% forecast(h = 20)

print(fc_ets)

## # A fable: 20 x 4 [1Y]
## # Key:     .model [1]
##    .model    Year
##    <chr>    <dbl>
##  1 ETS(GDP)  2018
##  2 ETS(GDP)  2019
##  3 ETS(GDP)  2020
##  4 ETS(GDP)  2021
##  5 ETS(GDP)  2022
##  6 ETS(GDP)  2023
##  7 ETS(GDP)  2024
##  8 ETS(GDP)  2025
##  9 ETS(GDP)  2026
## 10 ETS(GDP)  2027
## 11 ETS(GDP)  2028
## 12 ETS(GDP)  2029
## 13 ETS(GDP)  2030
## 14 ETS(GDP)  2031
## 15 ETS(GDP)  2032
## 16 ETS(GDP)  2033
## 17 ETS(GDP)  2034
## 18 ETS(GDP)  2035
## 19 ETS(GDP)  2036
## 20 ETS(GDP)  2037
## # ℹ 2 more variables: GDP <dist>, .mean <dbl>

print(fc_ets_damped)

## # A fable: 20 x 4 [1Y]
## # Key:     .model [1]
##    .model                                                     Year
##    <chr>                                                     <dbl>
##  1 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2018
##  2 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2019
##  3 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2020
##  4 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2021
##  5 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2022
##  6 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2023
##  7 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2024
##  8 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2025
##  9 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2026
## 10 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2027
## 11 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2028
## 12 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2029
## 13 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2030
## 14 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2031
## 15 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2032
## 16 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2033
## 17 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2034
## 18 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2035
## 19 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2036
## 20 "ETS(GDP ~ error(\"A\") + trend(\"Ad\") + season(\"N\"))"  2037
## # ℹ 2 more variables: GDP <dist>, .mean <dbl>

print(fc_ets_bc)

## # A fable: 20 x 4 [1Y]
## # Key:     .model [1]
##    .model                         Year              GDP   .mean
##    <chr>                         <dbl>           <dist>   <dbl>
##  1 ETS(box_cox(GDP, lambda = 0))  2018 t(N(30, 0.0088)) 1.38e13
##  2 ETS(box_cox(GDP, lambda = 0))  2019   t(N(30, 0.02)) 1.56e13
##  3 ETS(box_cox(GDP, lambda = 0))  2020  t(N(30, 0.033)) 1.76e13
##  4 ETS(box_cox(GDP, lambda = 0))  2021  t(N(31, 0.048)) 1.99e13
##  5 ETS(box_cox(GDP, lambda = 0))  2022  t(N(31, 0.066)) 2.25e13
##  6 ETS(box_cox(GDP, lambda = 0))  2023  t(N(31, 0.087)) 2.56e13
##  7 ETS(box_cox(GDP, lambda = 0))  2024   t(N(31, 0.11)) 2.90e13
##  8 ETS(box_cox(GDP, lambda = 0))  2025   t(N(31, 0.14)) 3.30e13
##  9 ETS(box_cox(GDP, lambda = 0))  2026   t(N(31, 0.17)) 3.76e13
## 10 ETS(box_cox(GDP, lambda = 0))  2027    t(N(31, 0.2)) 4.28e13
## 11 ETS(box_cox(GDP, lambda = 0))  2028   t(N(31, 0.24)) 4.89e13
## 12 ETS(box_cox(GDP, lambda = 0))  2029   t(N(32, 0.28)) 5.59e13
## 13 ETS(box_cox(GDP, lambda = 0))  2030   t(N(32, 0.33)) 6.41e13
## 14 ETS(box_cox(GDP, lambda = 0))  2031   t(N(32, 0.38)) 7.35e13
## 15 ETS(box_cox(GDP, lambda = 0))  2032   t(N(32, 0.44)) 8.44e13
## 16 ETS(box_cox(GDP, lambda = 0))  2033    t(N(32, 0.5)) 9.71e13
## 17 ETS(box_cox(GDP, lambda = 0))  2034   t(N(32, 0.56)) 1.12e14
## 18 ETS(box_cox(GDP, lambda = 0))  2035   t(N(32, 0.63)) 1.29e14
## 19 ETS(box_cox(GDP, lambda = 0))  2036   t(N(32, 0.71)) 1.49e14
## 20 ETS(box_cox(GDP, lambda = 0))  2037   t(N(32, 0.79)) 1.72e14

china_gdp %>%
  autoplot(GDP) +
  autolayer(fc_ets, GDP, color = "blue", alpha = 0.6) +
  autolayer(fc_ets_damped, GDP, color = "red", alpha = 0.6) +
  autolayer(fc_ets_bc, GDP, color = "green", alpha = 0.6) +
  labs(title = "Chinese GDP Forecasts using ETS Models",
       y = "GDP",
       x = "Year") +
  guides(colour = guide_legend(title = "Model"))

The impact of using a damped trend or Box-Cox transformation on forecasts.

The automatic ETS model identifies the best fit for the data while continuing past trends seamlessly. The damped trend approach slows down the trend over time, making it more conservative. The Box-Cox log transformation helps prevent extreme growth and stabilizes variance, making it particularly effective when dealing with exponential growth or increasing volatility.

8.7

# Load the dataset
gas_data <- aus_production %>% filter(!is.na(Gas))

# Plot the data
autoplot(gas_data, Gas)

# Fit an ETS model with automatic selection
fit_ets <- gas_data %>%
  model(ETS(Gas ~ error("M") + trend("A") + season("M")))

# Check the fitted model
report(fit_ets)

## Series: Gas 
## Model: ETS(M,A,M) 
##   Smoothing parameters:
##     alpha = 0.6528545 
##     beta  = 0.1441675 
##     gamma = 0.09784922 
## 
##   Initial states:
##      l[0]       b[0]      s[0]    s[-1]    s[-2]     s[-3]
##  5.945592 0.07062881 0.9309236 1.177883 1.074851 0.8163427
## 
##   sigma^2:  0.0032
## 
##      AIC     AICc      BIC 
## 1680.929 1681.794 1711.389

The multiplicative seasonality is necessary because the data shows seasonal fluctuations that increase proportionally as the overall level of the series rises.

# Forecast for the next few years
forecast_ets <- fit_ets %>% forecast(h = "3 years")

# Plot the forecast
autoplot(gas_data, Gas) +
  autolayer(forecast_ets, series = "ETS Forecast")

# Experiment with damped trend
fit_ets_damped <- gas_data %>%
  model(ETS(Gas ~ error("M") + trend("Ad") + season("M")))

# Forecast with damped trend
forecast_ets_damped <- fit_ets_damped %>% forecast(h = "3 years")

# Compare forecasts
autoplot(gas_data, Gas) +
  autolayer(forecast_ets, series = "ETS") +
  autolayer(forecast_ets_damped, series = "ETS Damped")

The damped trend does not enhance the forecasts because the phi value is 0.98, which is very close to 1. This indicates that the trend remains almost unchanged, making it nearly identical to the standard ETS model.

8.8

Why is multiplicative seasonality necessary for this series?

# Set seed and select a random retail series
set.seed(1048)
myseries <- aus_retail |>
  filter(`Series ID` == sample(aus_retail$`Series ID`, 1))

# Convert to time series format
myseries_ts <- myseries |> as_tsibble(index = Month)

# Create plot
autoplot(myseries_ts)

Multiplicative seasonality is required when seasonal variations increase or decrease proportionally with the level of the series.

Apply Holt-Winters’ multiplicative method to the data.

# Split data
train <- myseries_ts |> filter(year(Month) <= 2010)
test <- myseries_ts |> filter(year(Month) == 2011)

# Fit Holt-Winters Multiplicative Model (ETS with multiplicative components)
hw_model <- train |> model(ETS(Turnover ~ error("M") + trend("M") + season("M")))
hw_model_damped <- train |> model(ETS(Turnover ~ error("M") + trend("Md") + season("M"))) # Damped trend

# Compute fitted values and merge with training data
train_fitted_hw <- train |> left_join(fitted(hw_model), by = "Month")
train_fitted_hw_damped <- train |> left_join(fitted(hw_model_damped), by = "Month")

# Manually calculate RMSE for training set
rmse_hw <- train_fitted_hw |> rmse(truth = Turnover, estimate = .fitted)
rmse_hw_damped <- train_fitted_hw_damped |> rmse(truth = Turnover, estimate = .fitted)

# Compare RMSE values
cat("RMSE (Holt-Winters Multiplicative):", rmse_hw$.estimate, "\n")

## RMSE (Holt-Winters Multiplicative): 2.312277

cat("RMSE (Holt-Winters Multiplicative Damped):", rmse_hw_damped$.estimate, "\n")

## RMSE (Holt-Winters Multiplicative Damped): 2.308848

Utilize the Holt-Winters Multiplicative Damped Model, as it shows better performance on both training and test datasets. This implies that damping the trend helps mitigate overfitting and enhances forecast accuracy.

Check the residuals

# Extract residuals from the best model (Holt-Winters Multiplicative Damped)
residuals_hw_damped <- augment(hw_model_damped)

# Plot residuals (time plot)
residuals_hw_damped |> ggplot(aes(x = Month, y = .resid)) +
  geom_line() +
  ggtitle("Residuals of Holt-Winters Multiplicative Damped Model") +
  xlab("Month") +
  ylab("Residuals")

# ACF plot to check autocorrelation
residuals_hw_damped |> ACF(.resid) |> autoplot() +
  ggtitle("ACF of Residuals from Holt-Winters Multiplicative Damped Model")

# Perform Ljung-Box test for autocorrelation (lag = 12 for monthly data)
Box.test(residuals_hw_damped$.resid, lag = 12, type = "Ljung-Box")

## 
##  Box-Ljung test
## 
## data:  residuals_hw_damped$.resid
## X-squared = 19.699, df = 12, p-value = 0.073

The residuals exhibit characteristics of white noise, as indicated by the random lags observed in the ACF plot, which predominantly fall within the blue dashed lines. Additionally, the p-value is high (greater than 0.05), suggesting that there is no significant autocorrelation, further confirming that the residuals resemble white noise.

Finding the test set RMSE

# Convert forecasts to tibble to ensure correct structure
test_fc_hw <- forecast(hw_model, h = nrow(test)) |> as_tibble()
test_fc_hw_damped <- forecast(hw_model_damped, h = nrow(test)) |> as_tibble()

# Ensure `test` contains `Turnover`, and join it with forecasts correctly
test_results_hw <- test |> 
  rename(actual_Turnover = Turnover) |>  # Rename to avoid conflicts
  left_join(test_fc_hw, by = "Month") |> 
  select(Month, actual_Turnover, .mean) |> 
  drop_na()

test_results_hw_damped <- test |> 
  rename(actual_Turnover = Turnover) |> 
  left_join(test_fc_hw_damped, by = "Month") |> 
  select(Month, actual_Turnover, .mean) |> 
  drop_na()

# Calculate RMSE for test set
rmse_test_hw <- rmse(test_results_hw, truth = actual_Turnover, estimate = .mean)
rmse_test_hw_damped <- rmse(test_results_hw_damped, truth = actual_Turnover, estimate = .mean)

# Display Test RMSE values
cat("Test RMSE (Holt-Winters Multiplicative):", rmse_test_hw$.estimate, "\n")

## Test RMSE (Holt-Winters Multiplicative): 8.17349

cat("Test RMSE (Holt-Winters Multiplicative Damped):", rmse_test_hw_damped$.estimate, "\n")

## Test RMSE (Holt-Winters Multiplicative Damped): 7.544579

The Holt-Winters multiplicative method is outperforms the seasonal naive approach, as indicated by the RMSE values. The RMSE for the seasonal naive method is 96.80193, while the RMSE for the Holt-Winters multiplicative method is 8.17349. Furthermore, the damped method is performing even better, with the RMSE of 7.544579. A smaller RMSE (Root Mean Square Error) value signifies a better-fitting model, meaning its predictions are closer to the actual values.

8.9

STL decomposition + ETS approach

# Box-Cox transformation (λ chosen automatically)
lambda <- features(myseries_ts, features = guerrero)$.box_cox

# Apply STL decomposition
stl_decomp <- myseries_ts |> 
  mutate(Turnover_transformed = box_cox(Turnover, lambda)) |>  # Box-Cox transformation
  model(STL(Turnover_transformed ~ season(window = "periodic")))

# Extract seasonally adjusted data (removing seasonal component)
stl_adjusted <- components(stl_decomp) |> select(Month, season_adjust)

# Split into training and test set
train_stl <- stl_adjusted |> filter(year(Month) <= 2010)
test_stl <- stl_adjusted |> filter(year(Month) == 2011)

# Fit ETS model to seasonally adjusted data
ets_model <- train_stl |> model(ETS(season_adjust ~ error("M") + trend("M") + season("N")))

# Forecast seasonally adjusted values
ets_fc <- forecast(ets_model, h = nrow(test_stl))

# Reintroduce seasonality by adding the seasonal component back
seasonality <- components(stl_decomp) |> select(Month, season_year)

final_fc <- ets_fc |> left_join(seasonality, by = "Month") |> 
  mutate(final_forecast = inv_box_cox(.mean + season_year, lambda))

# Merge with test data for RMSE calculation
test_results_stl_ets <- test |> left_join(final_fc, by = "Month") |> 
  select(Month, Turnover, final_forecast) |> drop_na()

# Compute test RMSE
rmse_test_stl_ets <- rmse(test_results_stl_ets, truth = Turnover, estimate = final_forecast)

# Display RMSE
cat("Test RMSE (STL + ETS):", rmse_test_stl_ets$.estimate, "\n")

## Test RMSE (STL + ETS): 7.963473

Since the Holt-Winters Multiplicative Damped model has a lower RMSE, it is the better forecasting method for this dataset.