# Load packages
# Core
library(tidyverse)
library(tidyquant)
# Source function
source("../00_scripts/simulate_accumulation.R")
Revise the code below.
symbols <- c("TSLA", "GM", "F", "VWAGY", "HMC")
prices <- tq_get(x = symbols,
get = "stock.prices",
from = "2012-12-31",
to = "2023-04-27")
asset_returns_tbl <- prices %>%
group_by(symbol) %>%
tq_transmute(select = adjusted,
mutate_fun = periodReturn,
period = "monthly",
type = "log") %>%
slice(-1) %>%
ungroup() %>%
set_names(c("asset", "date", "returns"))
Revise the code for weights.
# symbols
symbols <- asset_returns_tbl %>% distinct(asset) %>% pull()
symbols
## [1] "F" "GM" "HMC" "TSLA" "VWAGY"
# weights
weights <- c(0.21, 0.25, 0.2, 0.2, 0.14)
weights
## [1] 0.21 0.25 0.20 0.20 0.14
w_tbl <- tibble(symbols, weights)
w_tbl
## # A tibble: 5 × 2
## symbols weights
## <chr> <dbl>
## 1 F 0.21
## 2 GM 0.25
## 3 HMC 0.2
## 4 TSLA 0.2
## 5 VWAGY 0.14
portfolio_returns_tbl <- asset_returns_tbl %>%
tq_portfolio(assets_col = asset,
returns_col = returns,
weights = w_tbl,
rebalance_on = "months",
col_rename = "returns")
portfolio_returns_tbl
## # A tibble: 124 × 2
## date returns
## <date> <dbl>
## 1 2013-01-31 0.0285
## 2 2013-02-28 -0.0464
## 3 2013-03-28 0.0246
## 4 2013-04-30 0.118
## 5 2013-05-31 0.173
## 6 2013-06-28 -0.00187
## 7 2013-07-31 0.105
## 8 2013-08-30 0.0137
## 9 2013-09-30 0.0648
## 10 2013-10-31 -0.00692
## # … with 114 more rows
# Get mean portfolio return
mean_port_return <- mean(portfolio_returns_tbl$returns)
mean_port_return
## [1] 0.00784757
# Get standard deviation of portfolio returns
stddev_port_return <- sd(portfolio_returns_tbl$returns)
stddev_port_return
## [1] 0.07688214
No need
#Create a vector of 1s as a starting point
sims <- 51
starts <- rep(100, sims) %>%
set_names(paste0("sim", 1:sims))
starts
## sim1 sim2 sim3 sim4 sim5 sim6 sim7 sim8 sim9 sim10 sim11 sim12 sim13
## 100 100 100 100 100 100 100 100 100 100 100 100 100
## sim14 sim15 sim16 sim17 sim18 sim19 sim20 sim21 sim22 sim23 sim24 sim25 sim26
## 100 100 100 100 100 100 100 100 100 100 100 100 100
## sim27 sim28 sim29 sim30 sim31 sim32 sim33 sim34 sim35 sim36 sim37 sim38 sim39
## 100 100 100 100 100 100 100 100 100 100 100 100 100
## sim40 sim41 sim42 sim43 sim44 sim45 sim46 sim47 sim48 sim49 sim50 sim51
## 100 100 100 100 100 100 100 100 100 100 100 100
#Simulate
#For reproducible research
set.seed(1234)
monte_carlo_sim_51 <- starts %>%
#Simulate
map_dfc(.x = .,
.f = ~simulate_accumulation(initial_value = .x,
N = 240,
mean_return = mean_port_return,
sd_return = stddev_port_return)) %>%
#Add
mutate(month = 1:nrow(.)) %>%
select(month, everything()) %>%
# Rearrange column names
set_names(c("month", names(starts))) %>%
#Transform to long form
pivot_longer(cols = -month, names_to = "sim", values_to = "growth")
monte_carlo_sim_51
## # A tibble: 12,291 × 3
## month sim growth
## <int> <chr> <dbl>
## 1 1 sim1 100
## 2 1 sim2 100
## 3 1 sim3 100
## 4 1 sim4 100
## 5 1 sim5 100
## 6 1 sim6 100
## 7 1 sim7 100
## 8 1 sim8 100
## 9 1 sim9 100
## 10 1 sim10 100
## # … with 12,281 more rows
#Find quantiles
monte_carlo_sim_51 %>%
group_by(sim) %>%
summarise(growth = last(growth)) %>%
ungroup() %>%
pull(growth) %>%
quantile(probs = c(0, 0.25, 0.5, 0.75, 1)) %>%
round(2)
## 0% 25% 50% 75% 100%
## 7.46 109.95 323.59 525.40 2701.19
Line Plot of Simulations with Max, Median, and Min
monte_carlo_sim_51 %>%
ggplot(aes(x = month, y = growth, color = sim)) +
geom_line() +
theme(legend.position = "none") +
theme(plot.title = element_text(hjust = 0.5)) +
labs(title = "Simulating growth of $100 over 240 months")
Line plot with max, median, and min
#Step 1 Summarize data into max, median, and min of last value
sim_summary <- monte_carlo_sim_51 %>%
group_by(sim) %>%
summarise(growth = last(growth)) %>%
ungroup() %>%
summarise(max = max(growth),
median = median(growth),
min = min(growth))
sim_summary
## # A tibble: 1 × 3
## max median min
## <dbl> <dbl> <dbl>
## 1 2701. 324. 7.46
#Step 2 Plot
monte_carlo_sim_51 %>%
#Filter for max, median, and min sim
group_by(sim) %>%
filter(last(growth) == sim_summary$max |
last(growth) == sim_summary$median |
last(growth) == sim_summary$min) %>%
ungroup() %>%
#Plot
ggplot(aes(x = month, y = growth, color = sim)) +
geom_line() +
theme(legend.position = "none") +
theme(plot.title = element_text(hjust = 0.5)) +
theme(plot.subtitle = element_text(hjust = 0.5)) +
labs(title = "Simulating growth of $100 over 240 months", subtitle = "Maximum, Median, and Minimum Simulation")
Based on the Monte Carlo simulation results, how much should you expect from your $100 investment after 20 years? What is the best-case scenario? What is the worst-case scenario? What are limitations of this simulation analysis?
Looking at the maximum, median, and min simulation chart showed a mean of around $250. That would be a 250% return on the $100 investment in 20 years. This being the median, it would be around what you would expect from investing $100 in this portfolio. The maximum was around $2,750. Looking at the graph with more information, the maximum was $750 higher than the next closes return at the end of the 240 month period. The minimum was $0, losing all of the investment...
One limitation is using rnorm, which assumes normal distribution of returns, making the results more optimistic. A second limition is the dataset that we used, it was from 2012 to present, with a mean probably on the high side, making the analysis on the high side. You could expand the dates to include more of the past market...