1 Tahap Persiapan

Melakukan Instalasi Packages yang Diperlukan.

library(forecast)

## Registered S3 method overwritten by 'quantmod':
##   method            from
##   as.zoo.data.frame zoo

library(TTR)
library(TSA)

## Registered S3 methods overwritten by 'TSA':
##   method       from    
##   fitted.Arima forecast
##   plot.Arima   forecast

## 
## Attaching package: 'TSA'

## The following objects are masked from 'package:stats':
## 
##     acf, arima

## The following object is masked from 'package:utils':
## 
##     tar

library(graphics)
library(tseries)
library(readxl)

dataawal <- read_xlsx("D:/Data R SEI/data ARW.xlsx")
data1 <- dataawal [-111:-120,]
data2 <- dataawal [-1:-110,]

data1 merupakan data yang akan digunakan untuk mengidentifikasi model dan meramal 10 waktu kedepan, sedangkan data2 akan digunakan untuk mengetes tingkat akurasi model.

data.ts <- ts(data1)
head(data.ts)

## Time Series:
## Start = 1 
## End = 6 
## Frequency = 1 
##      Sales (in thousands)
## [1,]              10618.1
## [2,]              10537.9
## [3,]              10209.3
## [4,]              10553.0
## [5,]               9934.9
## [6,]              10534.5

ts.plot(data.ts, xlab = "Time Period", ylab = "Sales", main = "Time Series Plot Data Sales")
points(data.ts)

Setelah proses persiapan sudah selesai, langkah selanjutnya adalah mengidentifikasi model yang sesuai.

2 Model ARIMA

adf.test(data.ts)

## Warning in adf.test(data.ts): p-value smaller than printed p-value

## 
##  Augmented Dickey-Fuller Test
## 
## data:  data.ts
## Dickey-Fuller = -5.9291, Lag order = 4, p-value = 0.01
## alternative hypothesis: stationary

acf(data.ts)

pacf(data.ts, lag.max = 50)

eacf(data.ts)

## AR/MA
##   0 1 2 3 4 5 6 7 8 9 10 11 12 13
## 0 o o x o o o o o o o o  o  o  o 
## 1 o o o o o o o o o o o  o  o  o 
## 2 o x o o o o o o o o o  o  o  o 
## 3 x o o o o o o o o o o  o  o  o 
## 4 x o o o o o o o o o o  o  o  o 
## 5 o o x o o o o o o o o  o  o  o 
## 6 x o o o o o o o o o o  o  o  o 
## 7 x x o o x o o o o o o  o  o  o

Berdasarkan Augmented Dickey-Fuller Test data yang digunakan sudah stasioner dikarenakan nilai p-value = 0,01 < 0.05 sehingga dapat langsung melihat plot ACF, PACF dan EACF untuk mendapatkan kandidat model. Berdasarkan ketiga plot tersebut, berikut kandidat model yang sesuai ACF = kandidat model 1 : ARIMA (0,0,3) PACF = kandidat model 2 : ARIMA (3,0,0) EACF = kandidat model 3 : ARIMA (1,0,1) EACF = kandidat model 4 : ARIMA (1,0,2) EACF = kandidat model 4 : ARIMA (3,0,1).

#Penentuan Model Terbaik Berdasarkan AIC

arima(data.ts, order = c(0,0,3), method = "ML")

## 
## Call:
## arima(x = data.ts, order = c(0, 0, 3), method = "ML")
## 
## Coefficients:
##          ma1      ma2      ma3   intercept
##       0.0141  -0.0518  -0.2326  10374.4514
## s.e.  0.1002   0.1171   0.0967     14.9337
## 
## sigma^2 estimated as 45079:  log likelihood = -745.56,  aic = 1499.12

arima(data.ts, order = c(3,0,0), method = "ML")

## 
## Call:
## arima(x = data.ts, order = c(3, 0, 0), method = "ML")
## 
## Coefficients:
##          ar1     ar2      ar3   intercept
##       0.0904  0.0086  -0.2312  10374.9540
## s.e.  0.0927  0.0929   0.0926     17.9023
## 
## sigma^2 estimated as 44745:  log likelihood = -745.15,  aic = 1498.3

arima(data.ts, order = c(1,0,1), method = "ML")

## 
## Call:
## arima(x = data.ts, order = c(1, 0, 1), method = "ML")
## 
## Coefficients:
##          ar1     ma1   intercept
##       0.0672  0.0246  10375.1957
## s.e.  0.4398  0.4314     22.7734
## 
## sigma^2 estimated as 47350:  log likelihood = -748.18,  aic = 1502.36

arima(data.ts, order = c(3,0,1), method = "ML")

## 
## Call:
## arima(x = data.ts, order = c(3, 0, 1), method = "ML")
## 
## Coefficients:
##          ar1      ar2      ar3      ma1   intercept
##       0.6498  -0.0437  -0.2197  -0.6094  10374.0433
## s.e.  0.2868   0.1149   0.1105   0.2950     12.8663
## 
## sigma^2 estimated as 43484:  log likelihood = -743.64,  aic = 1497.28

Berdasarkan nilai AIC, model yang mempunyai AIC terkecil adalah model ARIMA (3,0,1) sehingga model yang akan digunakan untuk peramalan adalah model ARIMA (3,0,1).

ARIMA_data <- Arima(data.ts, order = c(3,0,1), method = "ML")

3 Peramalan 10 Waktu ke Depan

Setelah mendapatkan model terbaik, selanjutnya dilakukan peramalan untuk 10 waktu ke depan.

hasil_forecast <- forecast(ARIMA_data)
hasil_forecast <- as.data.frame(hasil_forecast)
hasil_forecast

plot(hasil_forecast, main = "Forecast from ARIMA (3,0,1) With Non-Zero Mean")

Setiap panel mewakili titik prediksi tertentu bersama interval prediksinya.

Label seperti “Lo 80”, “Hi 80”, “Lo 95”, dan “Hi 95” menunjukkan batas bawah (low) dan batas atas (high) untuk interval kepercayaan 80% dan 95%.

4 Penilaian Akurasi dengan MAPE

Penilaian akurasi dilakukan dengan membandingkan data hasil ramalan dengan data aktual 10 amatan terakhir.

data_forecast1 <- hasil_forecast$`Point Forecast`
data_forecast1 <- as.data.frame(data_forecast1)
head(data_forecast1)

dataaktual <- as.data.frame(data2)
dataaktual

akurasi.arima <- accuracy(data_forecast1$data_forecast1,dataaktual$`Sales (in thousands)`)
akurasi.arima

##                ME     RMSE      MAE       MPE     MAPE
## Test set 53.57804 193.8149 161.3917 0.4821229 1.538676

Jika nilai MAPE kecil maka kesalahan hasil pendugaannya juga kecil. Peramalan penjualan menggunakan metode ARIMA dinilai memiliki kemampuan ramalan yang sangat akurat karena hasil dari MAPE adalah sebesar 1.538676%.

5 Simple Exponential Smoothing

plot(data.ts,main="Plot Semua Data")
points(data.ts)

data1.ses<-HoltWinters(data.ts,alpha=0.1, beta=FALSE, gamma=FALSE)
data1.ses

## Holt-Winters exponential smoothing without trend and without seasonal component.
## 
## Call:
## HoltWinters(x = data.ts, alpha = 0.1, beta = FALSE, gamma = FALSE)
## 
## Smoothing parameters:
##  alpha: 0.1
##  beta : FALSE
##  gamma: FALSE
## 
## Coefficients:
##       [,1]
## a 10393.24

SSE <- data1.ses$SSE
SSE

## [1] 5954375

MSE <- SSE/110
MSE

## [1] 54130.69

hasil_forecast.sess <- forecast(data1.ses)
hasil_forecast.ses <- as.data.frame(hasil_forecast.sess)
hasil_forecast.ses

plot(hasil_forecast.sess)

Garis biru mewakili prediksi titik, area berbayang biru tua menunjukkan interval prediksi 80% dan area berbayang biru muda menunjukkan interval prediksi 95% untuk prediksi titik.

data_forecast2 <- hasil_forecast.ses$`Point Forecast`
data_forecast2 <- as.data.frame(data_forecast2)
head(data_forecast2)

dataaktual <- as.data.frame(data2)
dataaktual

akurasi.ses <- accuracy(data_forecast2$data_forecast2,dataaktual$`Sales (in thousands)`)
akurasi.ses

##                ME     RMSE   MAE       MPE     MAPE
## Test set 31.73833 189.8569 161.3 0.2723997 1.540696

6 Perbandingan Model ARIMA dan Exponential Smoothing Forecasts

Setelah dilakukan peramalan dengan menggunakan dua metode, akan diamati nilai MAPE dari masing-masing metode. Metode dengan nilai MAPE paling kecil akan terpilih menjadi model terbaik.

akurasi.arima

##                ME     RMSE      MAE       MPE     MAPE
## Test set 53.57804 193.8149 161.3917 0.4821229 1.538676

akurasi.ses

##                ME     RMSE   MAE       MPE     MAPE
## Test set 31.73833 189.8569 161.3 0.2723997 1.540696

Hasil dari kedua metode tersebut menghasilkan nilai MAPE 1.538676% untuk metode ARIMA dan 1.540696% untuk metode Simple Exponential Smoothing. Dengan demikian, metode yang mempunyai MAPE lebih kecil adalah metode ARIMA (3,0,1) dengan nilai p=3,d=0,q=1.

7 Interval Prediksi ARIMA

Berikut interval prediksi dari hasil ramalan model ARIMA (3,0,1)

fit <- Arima(data.ts, order=c(3,0,1), method="ML")
fit

## Series: data.ts 
## ARIMA(3,0,1) with non-zero mean 
## 
## Coefficients:
##          ar1      ar2      ar3      ma1        mean
##       0.6498  -0.0437  -0.2197  -0.6094  10374.0433
## s.e.  0.2868   0.1149   0.1105   0.2950     12.8663
## 
## sigma^2 = 45555:  log likelihood = -743.64
## AIC=1499.28   AICc=1500.1   BIC=1515.49

hasil_forecast

interval.prediction <- hasil_forecast[,-1]
interval.prediction

plot(hasil_forecast$`Point Forecast`, type="n", ylim=range(hasil_forecast$`Lo 80`,hasil_forecast$`Hi 80`))
polygon(c(time(hasil_forecast$`Point Forecast`),rev(time(hasil_forecast$`Point Forecast`))), c(hasil_forecast$`Hi 80`,rev(hasil_forecast$`Lo 80`)), 
   col=rgb(0,0,0.6,0.2), border=FALSE)
lines(hasil_forecast$`Point Forecast`)
lines(fitted(fit),col='red')

out <- (hasil_forecast$`Point Forecast`< hasil_forecast$`Lo 80` | hasil_forecast$`Point Forecast` > hasil_forecast$`Hi 80`)

plot(hasil_forecast$`Point Forecast`, type="n", ylim=range(hasil_forecast$`Lo 95`,hasil_forecast$`Hi 95`))
polygon(c(time(hasil_forecast$`Point Forecast`),rev(time(hasil_forecast$`Point Forecast`))), c(hasil_forecast$`Hi 95`,rev(hasil_forecast$`Lo 95`)), 
   col=rgb(0,0,0.6,0.2), border=FALSE)
lines(hasil_forecast$`Point Forecast`)
lines(fitted(fit),col='red')

out <- (hasil_forecast$`Point Forecast`< hasil_forecast$`Lo 95` | hasil_forecast$`Point Forecast` > hasil_forecast$`Hi 95`)

Berdasarkan kedua plot yaitu plot interval prediksi 80% dan plot interval prediksi 95% menunjukkan hasil yang hampir sama hanya berbeda di rentang selangnya. Interval prediksi 95% memiliki rentang yang lebih luas dari pada interval prediksi 80%.

8 Reference

Montgomery, D.C., et.al. 2008. Forecasting Time Series Analysis 2nd. John Wiley

Latihan Analisis Runtun Waktu

Lusia Clara Sianturi

2024-10-30