Using monthly data from January 2014M1 to 2017M12 estimate the followings: 1. Select at least five stocks from different industries (for the list of the firms in different industries see, https://biz.yahoo.com/p/sum_conameu.html).
#QC'd
###The original stocks significantly underperformed the risk free rate. So, found a hnadful of stocks with returns close to or above the risk free rate so don't have to deal with a negative sharpe ratio###
#New Stocks for Portfolio
#Amazon.com, Inc. (AMZN)- Speciality Retail
#Facebook, Inc. (FB) - Internet Content & Information
#The Procter & Gamble Company (PG) - Household & Personal Products
#Costco Wholesale Corporation (COST) - Discount Stores
#Cigna Corporation (CI) - Health Care Plans
#Clean Environment
rm(list=ls(all=TRUE))
cat("\014")
library("fPortfolio")
library("quantmod")
library("timeSeries")
library("tseries")
library("stats")
#Import stock data from yahoo (see Q6 assignment 1)
#to=Sys.Date()
#make sure 12-02 so that the data includes the month of 12/2017, 12/01 excludes 12/2017
YahooData <- getSymbols.yahoo(c("AMZN","FB","PG","COST","CI","^TNX","SPY"),.GlobalEnv, from = "2014-01-01", to= "2017-12-02", periodicity="monthly", return.class = "timeSeries")
- Construct a portfolio of the selected stocks and graph the efficient frontier.
2a. Find the optimum weights using MPT.
cat("The optimal weights of the portfolio:")
The optimal weights of the portfolio:
print(optimalweight_matrix)
[,1]
AMZN 0.11961207
FB 0.37405787
PG 0.03631253
COST 0.17368825
CI 0.29632928
#Test that all weights add to 1:
#cat("Test that all weights add to 1:")
#print(colSums(optimalweight_matrix))
2b. and 2c. Using the optimum weights and daily adjusted closing prices at the end of 2017 allocate $100.00 among among the selected stocks. On 1/1/2014, the portfolio will have a value of 100 as an index.
#Import daily stock adj closing prices from yahoo
YahooData_Daily <- getSymbols.yahoo(c("AMZN","FB","PG","COST","CI"),.GlobalEnv, from = "2014-01-02", to = "2018-10-31", periodicity="daily", return.class = "timeSeries")
#Calculate Daily Adjusted Returns
#Note, since day 1 you have $100, and it isn't affected by the return of the previous day, left out the first day of the returns when importing data)
daily_rAMZN <- diff(log(AMZN$AMZN.Adjusted))
daily_rFB <- diff(log(FB$FB.Adjusted))
daily_rPG <- diff(log(PG$PG.Adjusted))
daily_rCOST <- diff(log(COST$COST.Adjusted))
daily_rCI <- diff(log(CI$CI.Adjusted))
#Create equation for daily optimal returns of the portfolio
return_optimal_portfolio_daily = optimalweight_matrix[1,1]*daily_rAMZN + optimalweight_matrix[2,1]*daily_rFB + optimalweight_matrix[3,1]*daily_rPG + optimalweight_matrix[4,1]*daily_rCOST + optimalweight_matrix[5,1]*daily_rCI
mean_return <- mean(return_optimal_portfolio_daily)*252*4
# round(return_optimal_portfolio_daily,5)
# 100*(1+return_optimal_portfolio_daily[1])*(1+return_optimal_portfolio_daily[2])*(1+return_optimal_portfolio_daily[3])
# class(return_optimal_portfolio_daily)
#Use for loop to generate holding values for every day of the data series:
#######################################################################
newreturn = 1 + return_optimal_portfolio_daily
newreturn[1] <- newreturn[1]*100 #the value of the second day
# head(newreturn)
# tail(newreturn)
newdailyreturn = cumprod(newreturn)
#head(newdailyreturn)
#tail(newdailyreturn)
#length(newdailyreturn)
#length(AMZN[,1])
#######################################################################
newdailyreturn2=c(newdailyreturn)
#head(newdailyreturn2)
returnwithdate= cbind(AMZN[,1],newdailyreturn2)
#tail(returnwithdate)
#head(returnwithdate)
# print(returnwithdate[,2])
#tail(returnwithdate[,2])
print("ss.1 column represents the holding value of the portfolio")
[1] "ss.1 column represents the holding value of the portfolio"
returnwithdate
GMT
AMZN.Open SS.1
2014-01-02 398.80 99.83901
2014-01-03 398.29 101.30262
2014-01-06 395.85 102.62884
2014-01-07 395.04 102.46624
2014-01-08 398.47 103.18915
2014-01-09 403.71 103.17600
2014-01-10 402.53 100.95463
2014-01-13 397.98 102.87094
2014-01-14 392.13 102.84933
2014-01-15 398.94 102.10209
2014-01-16 393.68 101.91754
2014-01-17 394.26 103.64125
2014-01-21 403.00 102.53339
2014-01-22 408.00 101.56272
2014-01-23 401.00 98.66167
2014-01-24 398.16 98.21961
2014-01-27 390.50 99.40708
2014-01-28 387.40 97.57683
2014-01-29 392.16 103.58041
2014-01-30 393.77 102.52654
2014-01-31 371.76 100.38556
2014-02-03 358.98 101.49730
2014-02-04 349.59 101.10384
2014-02-05 346.00 102.07947
2014-02-06 347.40 100.65346
2014-02-07 358.98 99.91535
2014-02-10 361.61 101.09760
2014-02-11 361.84 99.89278
2014-02-12 356.43 102.03801
2014-02-13 347.70 102.64373
2014-02-14 359.34 102.40720
2014-02-18 355.28 102.10368
2014-02-19 352.64 103.33227
2014-02-20 348.80 102.44620
2014-02-21 352.44 104.65663
2014-02-24 345.19 104.21698
2014-02-25 353.00 103.93542
2014-02-26 359.86 103.74866
2014-02-27 357.22 104.35682
2014-02-28 360.60 103.06916
2014-03-03 358.74 104.60608
2014-03-04 363.90 106.38755
2014-03-05 364.13 105.20581
2014-03-06 374.05 104.66683
2014-03-07 374.58 106.28163
2014-03-10 372.69 105.30136
2014-03-11 370.99 105.63416
2014-03-12 366.40 103.72777
2014-03-13 376.62 102.55897
2014-03-14 372.80 103.70142
2014-03-17 375.72 104.10021
2014-03-18 377.32 104.18329
2014-03-19 378.77 104.28609
2014-03-20 370.64 103.96187
2014-03-21 371.00 101.32948
2014-03-24 360.09 101.81212
2014-03-25 354.03 98.32478
2014-03-26 357.13 97.51387
2014-03-27 343.15 97.58487
2014-03-28 340.05 99.23006
2014-03-31 342.40 100.67596
2014-04-01 338.09 100.43989
2014-04-02 345.99 98.36953
2014-04-03 341.82 95.64622
2014-04-04 335.15 95.31309
2014-04-07 320.99 96.88087
2014-04-08 321.88 99.74062
2014-04-09 328.47 96.12147
2014-04-10 330.60 94.80340
2014-04-11 314.00 95.33169
2014-04-14 317.67 95.37899
2014-04-15 316.70 96.07128
2014-04-16 321.17 95.22272
2014-04-17 319.76 97.11714
2014-04-21 323.97 98.38302
2014-04-22 332.00 97.42753
2014-04-23 333.06 98.42860
2014-04-24 329.67 95.05403
2014-04-25 316.25 93.51827
2014-04-28 304.00 94.87603
2014-04-29 296.44 96.82243
2014-04-30 298.10 98.47057
2014-05-01 304.13 98.19423
2014-05-02 310.42 99.01459
2014-05-05 306.37 96.61136
2014-05-06 309.53 96.13950
2014-05-07 295.56 96.05353
2014-05-08 290.82 96.91111
2014-05-09 290.57 99.73289
2014-05-12 294.30 99.72130
2014-05-13 302.60 98.92365
2014-05-14 302.50 97.54376
2014-05-15 298.02 97.89226
2014-05-16 292.80 99.01216
2014-05-19 295.76 98.58482
2014-05-20 297.10 100.10977
2014-05-21 302.21 100.02679
2014-05-22 305.05 101.00308
2014-05-23 305.46 102.01303
2014-05-27 314.41 102.18201
...
[ reached getRmetricsOption('max.print') | getOption('max.print') -- omitted 1117 rows ]]
- Calculate the CAL equation and graph CAL and the efficient frontier.
#Calculating portfolio variance:
#https://zerodha.com/varsity/chapter/risk-part-4-correlation-matrix-portfolio-variance/
#Portfolio Variance = Sqrt (Transpose (Wt.SD) * Correlation Matrix * Wt. SD
#Calculate the standard deviation of the five assets' returns:
sd_rAMZN <- sd(rAMZN)
sd_rFB <- sd(rFB)
sd_rPG <- sd(rPG)
sd_rCOST <- sd(rCOST)
sd_rCI <- sd(rCI)
sd_matrix <- matrix(c(sd_rAMZN, sd_rFB, sd_rPG, sd_rCOST, sd_rCI))
range.names = c("AMZN", "FB", "PG", "COST", "CI")
cat("Standard Deviations")
Standard Deviations
dimnames(sd_matrix) = list(range.names)
sd_matrix
[,1]
AMZN 0.07515593
FB 0.05422324
PG 0.03537648
COST 0.04786995
CI 0.06180077
#Calculate weighted standard deviations
weighted_sd_matrix <- matrix(c(sd_rAMZN*optimalweight_matrix[1,1], sd_rFB*optimalweight_matrix[2,1], sd_rPG*optimalweight_matrix[3,1], sd_rCOST*optimalweight_matrix[4,1], sd_rCI*optimalweight_matrix[5,1]))
range.names = c("AMZN", "FB", "PG", "COST", "CI")
cat("Weighted Standard Deviations")
Weighted Standard Deviations
dimnames(weighted_sd_matrix) = list(range.names)
weighted_sd_matrix
[,1]
AMZN 0.008964656
FB 0.020963438
PG 0.000126609
COST 0.008132532
CI 0.019815722
#Compute the portfolio variance, when optimal wieghts are used, using this formula: "Portfolio Variance = Sqrt (Transpose (Wt.SD) * Correlation Matrix * Wt. SD"
Portfolio_Variance <- sqrt(t(weighted_sd_matrix)%*%cor_matrix%*%weighted_sd_matrix)
Portfolio_Variance
[,1]
[1,] 0.0328645
Portfolio_SD <- sqrt(Portfolio_Variance)
Portfolio_SD
[,1]
[1,] 0.1812857
#Mean return of optimal portfolio, using monthly returns:
return_optimal_portfolio_mean = optimalweight_matrix[1,1]*mean_rAMZN + optimalweight_matrix[2,1]*mean_rFB + optimalweight_matrix[3,1]*mean_rPG + optimalweight_matrix[4,1]*mean_rCOST + optimalweight_matrix[5,1]*mean_rCI
return_optimal_portfolio_mean
AMZN
0.02036808
#Calculate the sharpe ratio:
sharpe_ratio <- (return_optimal_portfolio_mean - Rf)/(Portfolio_SD)
print(sharpe_ratio)
[,1]
[1,] 0.1023876
#Put it all together to create the CAL:
cat("The capital allocation line:", "E(r) =" , Rf,"+", sharpe_ratio, "* Standard Deviation")
The capital allocation line: E(r) = 0.001806667 + 0.1023876 * Standard Deviation
#Now graph the CAL:
#Create discrete deviations for plotting purposes
basic_standard_deviation <- c(0,1,2,3)
rCAL <- Rf + sharpe_ratio*basic_standard_deviation
Recycling array of length 1 in array-vector arithmetic is deprecated.
Use c() or as.vector() instead.
plot(basic_standard_deviation, rCAL, col="Green", xlab="Standard Deviation", ylab="Expected Return", type="l")

#Plot Portfolio possibilities curve (efficient frontier):
rP = mean_rAMZN + mean_rFB + mean_rPG + mean_rCOST + mean_rCI
- Estimate the CAPM model of your portfolio using 1/2/2018-10/30/2018 data. Compare the estimated beta of the your CAPM model with market beta. Are they statistically different from each other?
*you are doing a regression of the risk premium of the portfolio to the risk premium of the market
riskprem_SPY_CAPM <- rSPY_CAPM - rF_CAPM
longer object length is not a multiple of shorter object length
- Graph the SML and compare the estimated Beta of the CAPM and the average return of your portfolio as a point relative to SML. Comment on performance of your portfolio.
#Graph the SML by calculating the average rf and mrp using the actual data.
#This method uses the average data to get the SML, but we should use the regression model to graph the CAPM
cat("The CAPM Formula is: ", mean(rTNX_CAPM), " + beta * ", mean(riskprem_SPY_CAPM))
The CAPM Formula is: 0.001797593 + beta * -0.001823117
SML_MRP = mean(rSPY_CAPM) - mean(rTNX_CAPM)
SML_MRP
[1] -0.001823762
beta_range = c(0,1,2,3,4,5)
SML_Line = mean(rTNX_CAPM) + beta_range*mean(riskprem_SPY_CAPM)
#This is the CAPM estimate of the optimal portfolios return
SML_Portfolio = mean(rTNX_CAPM) + Beta_Portfolio*mean(riskprem_SPY_CAPM)
plot(beta_range, SML_Line, col="Green", xlab="Beta", ylab="Expected Return", type="p")
#This is the CAPM estimate of the optimal portfolios return graphed
points(Beta_Portfolio, SML_Portfolio, type = "p")
#This is the actual return of the optimal portfolio graphed with the regression estimate of the optimal portfolios beta coefficient
points(Beta_Portfolio, mean(rP_CAPM), col="Red")

cat("The red dot indicates the actual return of the optimal portfolio graphed with the regression estimate of the portfolio's beta coefficient", "The black dot represents the CAPM estimate of the portfolios return graphed with the same beta estimate", "The actual portfolio rests below the SML. This indicates that the portfolio is overvalued. That is, the portfolio is receiving a lesser return for the same amount of risk. Based on CAPM theory, demand for the portfolio should decline, resulting in a lower price of the portfolios underlying returns. As a result, the return of the portfolio would increase until the portfolios point rests on the SML.")
The red dot indicates the actual return of the optimal portfolio graphed with the regression estimate of the portfolio's beta coefficient The black dot represents the CAPM estimate of the portfolios return graphed with the same beta estimate The actual portfolio rests below the SML. This indicates that the portfolio is overvalued. That is, the portfolio is receiving a lesser return for the same amount of risk. Based on CAPM theory, demand for the portfolio should decline, resulting in a lower price of the portfolios underlying returns. As a result, the return of the portfolio would increase until the portfolios point rests on the SML.
- Calculate CV, Sharpe, Treynor, and Sortino ratios for your portfolio and compare them to a similarly diversified portfolio of Vanguard, Fidelity, or any other similar portfolio.
library("PerformanceAnalytics")
Package PerformanceAnalytics (1.5.2) loaded.
Copyright (c) 2004-2018 Peter Carl and Brian G. Peterson, GPL-2 | GPL-3
https://github.com/braverock/PerformanceAnalytics
Attaching package: ‘PerformanceAnalytics’
The following objects are masked from ‘package:timeDate’:
kurtosis, skewness
The following object is masked from ‘package:graphics’:
legend
#Calculate the sharpe ratio:
sharpe_ratio <- (return_optimal_portfolio_mean - Rf)/(Portfolio_SD)
print(sharpe_ratio)
[,1]
[1,] 0.1023876
cat("The sharpe ratio is:", sharpe_ratio, " ")
The sharpe ratio is: 0.1023876
#Calculate Sortino Ratio
#http://braverock.com/brian/R/PerformanceAnalytics/html/SortinoRatio.html
#get monthly optimal returns to the portfolio
return_optimal_portfolio_monthly = optimalweight_matrix[1,1]*rAMZN + optimalweight_matrix[2,1]*rFB + optimalweight_matrix[3,1]*rPG + optimalweight_matrix[4,1]*rCOST + optimalweight_matrix[5,1]*rCI
sortino <- (SortinoRatio(return_optimal_portfolio_monthly, MAR = 0))
cat("The sortino ratio is:", sortino, " " )
The sortino ratio is: 1.605637
#treynor ratio = (rP - rF)/betaP
#Calculate Beta of the Portfolio
#remember beta measure volatility relative to the market. So FB is theoretically 30% less volatile than the market
Beta_AMZN <- 1.87
Beta_FB <- 0.70
Beta_PG <- 0.32
Beta_COST <- 1.17
Beta_CI <- 0.79
Weighted_Beta_Portfolio <- optimalweight_matrix[1,1]*Beta_AMZN + optimalweight_matrix[2,1]*Beta_FB + optimalweight_matrix[3,1]*Beta_PG + optimalweight_matrix[4,1]*Beta_COST + optimalweight_matrix[5,1]*Beta_CI
cat("The Beta of the Portfolio is:", Weighted_Beta_Portfolio, ". Thus,the portolio's returns are theoretically 17% more volatile than the market. ")
The Beta of the Portfolio is: 0.9469034 . Thus,the portolio's returns are theoretically 17% more volatile than the market.
treynor <- ((return_optimal_portfolio_mean-Rf)/Weighted_Beta_Portfolio)
cat("The treynor ratio is:", treynor, " ")
The treynor ratio is: 0.01960222
- Calculate 2% VaR as a percentage of the mean return of your portfolio when the risk horizon is one day and one month.
#Reimport data for intuitiveness:
YahooData <- getSymbols.yahoo(c("AMZN","FB","PG","COST","CI","^TNX","SPY"),.GlobalEnv, from = "2014-01-01", to= "2017-12-01", periodicity="monthly", return.class = "timeSeries")
pausing 1 second between requests for more than 5 symbols
pausing 1 second between requests for more than 5 symbols
pausing 1 second between requests for more than 5 symbols
#Calculate Stock Returns and Risk Premiums (Stock Return - Rf); Rf is rTNX
rAMZN <- diff(log(AMZN$AMZN.Adjusted))
rFB <- diff(log(FB$FB.Adjusted))
rPG <- diff(log(PG$PG.Adjusted))
rCOST <- diff(log(COST$COST.Adjusted))
rCI <- diff(log(CI$CI.Adjusted))
rTNX <- TNX$TNX.Adjusted/100/12
#override TNX, start at index two and go down from there, remember when calculating returns for AAPL in excel you got rid of the first value, same thing here
rTNX <- rTNX[2:length(rTNX)]
rSPY <- diff(log(SPY$SPY.Adjusted))
cat("From Question 2: The optimal weights of the portfolio:")
From Question 2: The optimal weights of the portfolio:
print(optimalweight_matrix)
[,1]
AMZN 0.119280757
FB 0.386613531
PG 0.003578903
COST 0.169888036
CI 0.320638772
#Derive the monthly returns and monthly standard defivation for the portfolio:
return_optimal_portfolio_monthly = optimalweight_matrix[1,1]*rAMZN + optimalweight_matrix[2,1]*rFB + optimalweight_matrix[3,1]*rPG + optimalweight_matrix[4,1]*rCOST + optimalweight_matrix[5,1]*rCI
return_optimal_portfolio_monthly
[1] 1.662481e-02 -4.905518e-02 -2.320710e-02 6.264793e-02 3.509477e-02 2.183685e-02 4.259766e-02 7.565185e-03
[9] 1.388802e-02 4.749194e-02 -8.730609e-03 1.846446e-02 6.991908e-02 4.396754e-02 -2.349331e-02 4.319699e-02
[17] 6.788134e-02 3.536462e-02 -3.718295e-02 -6.992076e-03 8.578983e-02 2.141323e-02 3.015053e-02 -3.025680e-02
[25] -1.304242e-02 3.709029e-02 1.669268e-02 -8.854597e-03 -7.171281e-03 5.149245e-02 1.417516e-03 1.197530e-02
[33] -3.381541e-02 -2.395472e-03 -1.594587e-06 9.001858e-02 3.744152e-02 9.679979e-03 5.734957e-02 2.439250e-02
[41] -5.745289e-03 5.681409e-02 1.880125e-02 1.211983e-02 5.051999e-02 4.717530e-02
#Monthly values:
monthly_return_portfolio <- mean(return_optimal_portfolio_monthly)
monthly_sd_portfolio <- sd(return_optimal_portfolio_monthly)
#Annual values:
annual_return_portfolio <- mean(return_optimal_portfolio_monthly)*(12)
annual_SD_portfolio <- sd(return_optimal_portfolio_monthly)*sqrt(12)
#10 day values (250 trading days):
tenday_return_portfolio <- annual_return_portfolio*(10/250)
tenday_sd_portfolio <- annual_SD_portfolio*sqrt(10/250)
#Derive mean monthly returns and monthly sd to the market (SPY):
#Monthly values:
monthly_return_SPY <- mean(rSPY)
monthly_sd_SPY <- sd(rSPY)
#Annual values:
annual_return_SPY <- mean(rSPY)*(12)
annual_SD_SPY <- sd(rSPY)*sqrt(12)
#10 day values (250 trading days):
tenday_return_SPY <- annual_return_SPY*(10/250)
tenday_sd_SPY <- annual_SD_SPY*sqrt(10/250)
#need a function that gives inverse of normal cumulative distributio. pnorm gives CDF and qnorm gives the inverse CDF
#Calculate Mothly VaR for the Market (SPY) and the optimal portfolio
#2% VaR for Optimal Portfolio with monthly time horizon
cat(" 2% VaR for Optimal Portfolio with monthly time horizon is: ",
qnorm(.02,monthly_return_portfolio,monthly_sd_portfolio))
2% VaR for Optimal Portfolio with monthly time horizon is: -0.04712735
cat("
")
#2% VaR for Optimal Portfolio with 10 day time horizon
cat("2% VaR for Optimal Portfolio with 10 day time horizon is:",
qnorm(.02,tenday_return_portfolio,tenday_sd_portfolio))
2% VaR for Optimal Portfolio with 10 day time horizon is: -0.03698553
- Using the CAPM equation of your portfolio do a five periods ex-post forecasting of the returns to your portfolio and compare your forecast to the actual returns. Find and report MAD, MAP, MASE, and RMS for your forecast.
AND
- Using the CAPM equation of your portfolio do a five periods ex-ante forecasting of the returns to your portfolio. Find and report MAD, MAP, MASE, and RMS of your forecast. You may use ES to forecast the risk premium of S&P500 for the required five periods.
#First, put your x and y into a data frame to simplify the forecasting code
question_9_data_Part1 <- data.frame(riskprem_portfolio_CAPM[1:203], riskprem_SPY_CAPM[1:203])
question_9_data_Part2 <- data.frame(riskprem_portfolio_CAPM[204:208], riskprem_SPY_CAPM[204:208])
question_9_data_Fullrange <- data.frame(riskprem_portfolio_CAPM, riskprem_SPY_CAPM)
############################################################################################
#Run the regression for ex-post forecast
reg_expost <- lm(riskprem_portfolio_CAPM ~ riskprem_SPY_CAPM, data=question_9_data_Part1)
#Ex-post forecast
pred <- predict(reg, newdata=question_9_data_Part2, se.fit=TRUE)
Error in predict(reg, newdata = question_9_data_Part2, se.fit = TRUE) :
object 'reg' not found
- Do a Naïve, MA3, MA5, WMA5, and ES of the returns to your portfolio for the period 10/30/ 2018 on. Find MAD, MAPE, MASE and RMS of your forecasts. Compare the forecasting efficiency criterion of your CAPM with smoothing techniques. Which one results in a better forecasting outcome?
library("fPortfolio")
library("quantmod")
library("timeSeries")
library("tseries")
library("stats")
#Import daily stock adj closing prices from yahoo
YahooData_Daily <- getSymbols.yahoo(c("AMZN","FB","PG","COST","CI", "SPY", "^TNX"),.GlobalEnv, from = "2018-10-30", to= Sys.Date(), periodicity="daily", return.class = "timeSeries")
#Calculate Daily Adjusted Returns
#Note, since day 1 you have $100, and it isn't affected by the return of the previous day, left out the first day of the returns when importing data)
rAMZN_smoothing <- diff(log(AMZN$AMZN.Adjusted))
rFB_smoothing <- diff(log(FB$FB.Adjusted))
rPG_smoothing <- diff(log(PG$PG.Adjusted))
rCOST_smoothing <- diff(log(COST$COST.Adjusted))
rCI_smoothing <- diff(log(CI$CI.Adjusted))
rTNX_smoothing <- TNX$TNX.Adjusted/100/12
#override TNX, start at index two and go down from there, remember when calculating returns for AAPL in excel you got rid of the first value, same thing here
rTNX_smoothing <- rTNX[2:length(rTNX)]
rSPY_smoothing <- diff(log(SPY$SPY.Adjusted))
(rF_smoothing <- rTNX_smoothing)
#Get daily returns of your portfolio for this date range:
rP_smoothing <- optimalweight_matrix[1,1]*rAMZN_smoothing + optimalweight_matrix[2,1]*rFB_smoothing + optimalweight_matrix[3,1]*rPG_smoothing + optimalweight_matrix[4,1]*rCOST_smoothing + optimalweight_matrix[5,1]*rCI_smoothing
rP_smoothing
#Naive Forecast:
library(forecast)
Naive_forecast <- plot(snaive(rP_smoothing,2))
snaive(rP_smoothing,2)
accuracy(snaive(rP_smoothing,2))
#MA3 Forecast
library(forecast)
ma3 <- ma(rP_smoothing, order=2)
ma3
plot(rP_smoothing)
lines(ma(rP_smoothing, order=2), col="red")
#Do we need to do this way or harsh's way?
accuracy(ma3, rP_smoothing)
#MA5 Forecast
ma5 <- ma(rP_smoothing, order=5)
plot(rP_smoothing)
lines(ma(rP_smoothing, order=5), col="red")
accuracy(ma5, rP_smoothing)
#ES - Expontential Smoothing
#Alpha is the dampenining parameter
fit1 <- ses(rP_smoothing, alpha=0.2, initial="simple", h=3)
fit2 <- ses(rP_smoothing, alpha=0.6, initial="simple", h=3)
fit3 <- ses(rP_smoothing, h=3)
plot(fit1, main="", fcol="white", type="o")
lines(fitted(fit1), col="blue", type="o")
lines(fitted(fit2), col="red", type="o")
lines(fitted(fit3), col="green", type="o")
lines(fit1$mean, col="blue", type="o")
lines(fit2$mean, col="red", type="o")
lines(fit3$mean, col="green", type="o")
legend("topleft",lty=1, col=c(1,"blue","red","green"),
c("data", expression(alpha == 0.2), expression(alpha == 0.6),
expression(alpha == 0.89)),pch=1)
#Accuracy Measures to get MAD MASE, etc.
accuracy(fit1)
accuracy(fit2)
accuracy(fit3)
#Compare the accuracy of all the forecasting models
#CAPM_regression error
accuracy(CAPM_regression)
#Error in Naive Forecasting Model
print("Naive Forecasting Model")
accuracy(snaive(rP_smoothing,3))
#Error in MA3 Forecasting Model
print("MA3 Forecasting Model")
accuracy(ma3, rP_smoothing)
#Error in MA5 Forecasting Model
print("MA5 Forecasting Model")
accuracy(ma5, rP_smoothing)
#Error in Exponential Smoothing Forecast Model
print("Exponential Smoothing Forecast Model")
accuracy(fit1)
accuracy(fit2)
accuracy(fit3)
#cat("
#","The forecasting models have different error levels. It appears that the MA3 model has to smallest RMSE")
#Compare the accuracy of all the forecasting models
#CAPM_regression error
print("CAPM Model")
accuracy(CAPM_regression)
#CAPM Ex-post forecast error
accuracy(reg_expost)
#Error in Naive Forecasting Model
print("Naive Forecasting Model")
accuracy(snaive(rP_smoothing,3))
#Error in MA3 Forecasting Model
print("MA3 Forecasting Model")
accuracy(ma3, rP_smoothing)
#Error in MA5 Forecasting Model
print("MA5 Forecasting Model")
accuracy(ma5, rP_smoothing)
#Error in Exponential Smoothing Forecast Model
print("Exponential Smoothing Forecast Model")
accuracy(fit1)
accuracy(fit2)
accuracy(fit3)
#cat("
#","The forecasting models have different error levels. It appears that the MA3 model has to smallest RMSE")
---
title: "FBE 506B Semester Project - DRAFT 2018-10-18 - positive risk premium edit"
output:
  html_notebook: default
  word_document: default
---

---
title: "FBE 506B Semester Project - DRAFT 2018-10-15"
output: html_notebook
---

Using monthly data from January 2014M1 to 2017M12 estimate the followings:
1. Select at least five stocks from different industries (for the list of the firms in different industries see, https://biz.yahoo.com/p/sum_conameu.html).

```{r}

#QC'd 


###The original stocks significantly underperformed the risk free rate. So, found a hnadful of stocks with returns close to or above the risk free rate so don't have to deal with a negative sharpe ratio###  

#New Stocks for Portfolio
#Amazon.com, Inc. (AMZN)- Speciality Retail 
#Facebook, Inc. (FB) - Internet Content & Information 
#The Procter & Gamble Company (PG) - Household & Personal Products  
#Costco Wholesale Corporation (COST) - Discount Stores  
#Cigna Corporation (CI) - Health Care Plans

#Clean Environment
rm(list=ls(all=TRUE))
cat("\014")

library("fPortfolio")
library("quantmod")
library("timeSeries")
library("tseries")
library("stats")


#Import stock data from yahoo (see Q6 assignment 1)
#to=Sys.Date()
#make sure 12-02 so that the data includes the month of 12/2017, 12/01 excludes 12/2017
YahooData <- getSymbols.yahoo(c("AMZN","FB","PG","COST","CI","^TNX","SPY"),.GlobalEnv, from = "2014-01-01", to= "2017-12-02", periodicity="monthly", return.class = "timeSeries")

```


2. Construct a portfolio of the selected stocks and graph the efficient frontier.

  2a. Find the optimum weights using MPT.

```{r}
#QC: need to find efficient frontier, did everyone else get .0018 as RF? and .008 as the market risk premium? 


#Calculate Stock Returns and Risk Premiums (Stock Return - Rf); Rf is rTNX 
rAMZN <- diff(log(AMZN$AMZN.Adjusted))
rFB <- diff(log(FB$FB.Adjusted))
rPG <- diff(log(PG$PG.Adjusted))
rCOST <- diff(log(COST$COST.Adjusted))
rCI <- diff(log(CI$CI.Adjusted))
rTNX <- TNX$TNX.Adjusted/100/12
#override TNX, start at index two and go down from there, remember when calculating returns for AAPL in excel you got rid of the first value, same thing here  
rTNX <- rTNX[2:length(rTNX)]
rSPY <- diff(log(SPY$SPY.Adjusted))


#Find the mean returns of each stock and the risk premium 
mean_rAMZN <- mean(rAMZN)
mean_rFB <- mean(rFB)
mean_rPG <- mean(rPG)
mean_rCOST <- mean(rCOST)
mean_rCI <- mean(rCI)
Rm <- mean(rSPY)
Rf <- mean(rTNX)
Market_RiskPrem <- Rm - Rf 
premAMZN <- mean_rAMZN- Rf
premFB <- mean_rFB- Rf
premPG <- mean_rPG - Rf
premCOST <- mean_rCOST - Rf
premCI <- mean_rCI - Rf

#Create a covariance matrix from which you can build out the efficient frontier:
#https://www.youtube.com/watch?v=hqQVYlq1nmk


portfolio <- data.frame(rAMZN, rFB, rPG,rCOST,rCI)
range.names = c("AMZN", "FB", "PG", "COST", "CI")
names(portfolio) = range.names
covmatrix = matrix(c(cov(portfolio)), nrow= 5, ncol=5)
covmatrix
dimnames(covmatrix) = list(range.names, range.names)
inverse_covmatrix <- solve(covmatrix)
inverse_covmatrix

#Convert to correlation matrix to confirm numbers line up
cor_matrix <- cov2cor(covmatrix)



#Create Risk Premium Vector, NOTE: the order of elements in the vector = order of elements in cov matrix 

risk_premvector <- matrix(c(premAMZN, premFB, premPG, premCOST, premCI), nrow=5,ncol=1)
risk_premvector


#Multiply inverse cov matrix by risk premium vector to get unstandardizd optimal weights of the portfolio: 

unstandardized_weights <- inverse_covmatrix %*% risk_premvector
unstandardized_weights 
#Add all elements in the unstandardized weight vector

colSums(unstandardized_weights)

#Now calculate optimal weights
w_AMZN <- unstandardized_weights[1,1] / colSums(unstandardized_weights)
w_FB <- unstandardized_weights[2,1] / colSums(unstandardized_weights)
w_PG <- unstandardized_weights[3,1] / colSums(unstandardized_weights)
w_COST <- unstandardized_weights[4,1] / colSums(unstandardized_weights)
w_CI <- unstandardized_weights[5,1] / colSums(unstandardized_weights)
optimalweight_matrix <- matrix(c(w_AMZN, w_FB, w_PG, w_COST, w_CI), nrow=5, ncol=1)
range.names = c("AMZN", "FB", "PG", "COST", "CI")
dimnames(optimalweight_matrix) = list(range.names)


cat("The optimal weights of the portfolio:")
print(optimalweight_matrix)

#Test that all weights add to 1: 
#cat("Test that all weights add to 1:")
#print(colSums(optimalweight_matrix))

```

  2b. and 2c. Using the optimum weights and daily adjusted closing prices at the end of 2017 allocate $100.00            among among the selected stocks. On 1/1/2014, the portfolio will have a value of 100 as an index.  

```{r}

#Import daily stock adj closing prices from yahoo 
YahooData_Daily <- getSymbols.yahoo(c("AMZN","FB","PG","COST","CI"),.GlobalEnv, from = "2014-01-02", to = "2018-10-31", periodicity="daily", return.class = "timeSeries")

#Calculate Daily Adjusted Returns 
#Note, since day 1 you have $100, and it isn't affected by the return of the previous day, left out the first day of the returns when importing data)

daily_rAMZN <- diff(log(AMZN$AMZN.Adjusted)) 
daily_rFB <- diff(log(FB$FB.Adjusted))
daily_rPG <- diff(log(PG$PG.Adjusted))
daily_rCOST <- diff(log(COST$COST.Adjusted))
daily_rCI <- diff(log(CI$CI.Adjusted))



#Create equation for daily optimal returns of the portfolio

return_optimal_portfolio_daily = optimalweight_matrix[1,1]*daily_rAMZN + optimalweight_matrix[2,1]*daily_rFB + optimalweight_matrix[3,1]*daily_rPG + optimalweight_matrix[4,1]*daily_rCOST + optimalweight_matrix[5,1]*daily_rCI 
mean_return <- mean(return_optimal_portfolio_daily)*252*4

# round(return_optimal_portfolio_daily,5)
# 100*(1+return_optimal_portfolio_daily[1])*(1+return_optimal_portfolio_daily[2])*(1+return_optimal_portfolio_daily[3])

# class(return_optimal_portfolio_daily)

#Use for loop to generate holding values for every day of the data series:

#######################################################################

newreturn = 1 + return_optimal_portfolio_daily
newreturn[1] <- newreturn[1]*100 #the value of the second day
# head(newreturn)
# tail(newreturn)
newdailyreturn = cumprod(newreturn)
#head(newdailyreturn)
#tail(newdailyreturn)
#length(newdailyreturn)
#length(AMZN[,1])

#######################################################################
newdailyreturn2=c(newdailyreturn)
#head(newdailyreturn2)
returnwithdate= cbind(AMZN[,1],newdailyreturn2)
#tail(returnwithdate)
#head(returnwithdate)
# print(returnwithdate[,2])
#tail(returnwithdate[,2])
print("ss.1 column represents the holding value of the portfolio")
returnwithdate           

```

3. Calculate the CAL equation and graph CAL and the efficient frontier.

```{r}

#Calculating portfolio variance: 
#https://zerodha.com/varsity/chapter/risk-part-4-correlation-matrix-portfolio-variance/

#Portfolio Variance = Sqrt (Transpose (Wt.SD) * Correlation Matrix * Wt. SD

#Calculate the standard deviation of the five assets' returns: 

sd_rAMZN <- sd(rAMZN)
sd_rFB <- sd(rFB)
sd_rPG <- sd(rPG)
sd_rCOST <- sd(rCOST)
sd_rCI <- sd(rCI)
sd_matrix <- matrix(c(sd_rAMZN, sd_rFB, sd_rPG, sd_rCOST, sd_rCI)) 
range.names = c("AMZN", "FB", "PG", "COST", "CI")
cat("Standard Deviations")
dimnames(sd_matrix) = list(range.names)
sd_matrix

#Calculate weighted standard deviations 

weighted_sd_matrix <- matrix(c(sd_rAMZN*optimalweight_matrix[1,1], sd_rFB*optimalweight_matrix[2,1], sd_rPG*optimalweight_matrix[3,1], sd_rCOST*optimalweight_matrix[4,1], sd_rCI*optimalweight_matrix[5,1])) 
range.names = c("AMZN", "FB", "PG", "COST", "CI")
cat("Weighted Standard Deviations")
dimnames(weighted_sd_matrix) = list(range.names)
weighted_sd_matrix

#Compute the portfolio variance, when optimal wieghts are used, using this formula: "Portfolio Variance = Sqrt (Transpose (Wt.SD) * Correlation Matrix * Wt. SD"

Portfolio_Variance <- sqrt(t(weighted_sd_matrix)%*%cor_matrix%*%weighted_sd_matrix)
Portfolio_Variance
Portfolio_SD <- sqrt(Portfolio_Variance)
Portfolio_SD 

#Mean return of optimal portfolio, using monthly returns:

return_optimal_portfolio_mean = optimalweight_matrix[1,1]*mean_rAMZN + optimalweight_matrix[2,1]*mean_rFB + optimalweight_matrix[3,1]*mean_rPG + optimalweight_matrix[4,1]*mean_rCOST + optimalweight_matrix[5,1]*mean_rCI
return_optimal_portfolio_mean


#Calculate the sharpe ratio: 

sharpe_ratio <- (return_optimal_portfolio_mean - Rf)/(Portfolio_SD)
print(sharpe_ratio)

#Put it all together to create the CAL: 

cat("The capital allocation line:", "E(r) =" , Rf,"+", sharpe_ratio, "* Standard Deviation") 

#Now graph the CAL: 

#Create discrete deviations for plotting purposes
basic_standard_deviation <- c(0,1,2,3)
rCAL <- Rf + sharpe_ratio*basic_standard_deviation
plot(basic_standard_deviation, rCAL, col="Green", xlab="Standard Deviation", ylab="Expected Return", type="l")

#Plot Portfolio possibilities curve (efficient frontier):

rP = mean_rAMZN + mean_rFB + mean_rPG + mean_rCOST + mean_rCI



```


4. Estimate the CAPM model of your portfolio using 1/2/2018-10/30/2018 data.  Compare the estimated beta of the your CAPM model with market beta. Are they statistically different from each other? 


*you are doing a regression of the risk premium of the portfolio to the risk premium of the market 

```{r}

library("fPortfolio")
library("quantmod")
library("timeSeries")
library("tseries")
library("stats")

#Import daily stock adj closing prices from yahoo 
YahooData_Daily <- getSymbols.yahoo(c("AMZN","FB","PG","COST","CI", "SPY", "^TNX"),.GlobalEnv, from = "2018-01-02", to="2018-10-30", periodicity="daily", return.class = "timeSeries")

#Calculate Daily Adjusted Returns 
#Note, since day 1 you have $100, and it isn't affected by the return of the previous day, left out the first day of the returns when importing data)

rAMZN_CAPM <- diff(log(AMZN$AMZN.Adjusted))  
rFB_CAPM <- diff(log(FB$FB.Adjusted))
rPG_CAPM <- diff(log(PG$PG.Adjusted))
rCOST_CAPM <- diff(log(COST$COST.Adjusted))
rCI_CAPM <- diff(log(CI$CI.Adjusted))
rTNX_CAPM <- TNX$TNX.Adjusted/100/12
#override TNX, start at index two and go down from there, remember when calculating returns for AAPL in excel you got rid of the first value, same thing here
rTNX_CAPM <- rTNX[2:length(rTNX)]
rSPY_CAPM <- diff(log(SPY$SPY.Adjusted))
(rF_CAPM <- rTNX_CAPM)


#This is the actual return to the portfolio
rP_CAPM <- optimalweight_matrix[1,1]*rAMZN_CAPM + optimalweight_matrix[2,1]*rFB_CAPM + optimalweight_matrix[3,1]*rPG_CAPM + optimalweight_matrix[4,1]*rCOST_CAPM + optimalweight_matrix[5,1]*rCI_CAPM
rP_CAPM

riskprem_portfolio_CAPM <- rP_CAPM - rF_CAPM

#risk premium of SPY is the market risk premium 
riskprem_SPY_CAPM <- rSPY_CAPM - rF_CAPM


#Now that you have your independent and dependent variables (x=risk premiun market, y= risk premium of the portfolio), regress the data to find the beta estimate for your portfolio: 

CAPM_regression <- lm(riskprem_portfolio_CAPM ~ riskprem_SPY_CAPM)
summary(CAPM_regression)

#Summary notes of the regression show that the alpha and beta of CAPM are:
Alpha <-  -0.000806
Beta_Portfolio <- 0.527691

cat("The CAPM Formula is: ", mean(rTNX_CAPM), " + beta * ", mean(riskprem_SPY_CAPM))


#Test that the Beta of the portfolio is not statistically different that the beta (1) of the market
Beta_Market <- 1
SE_Beta_Portfolio <- 0.063053

cat( "Calculate the t statistic to test the null hypothesis that Beta of the portfolio is not statistically different than beta of the market") 

tstat <- (Beta_Portfolio-Beta_Market)/(SE_Beta_Portfolio)
tstat

cat("The t-stat is", tstat, "    ")

#Ho: Beta_Portfolio = 1
#Ha: B_Portfolio != 1 

cat("Since summary regression shows t-value of beta1 is 7.49 > 1.96, reject the null hypothesis, thus, Beta of the portfolio is statistically different than the Beta of the market")

```
5.  Graph the SML and compare the estimated Beta of the CAPM and the average return of your portfolio as a point relative to SML. Comment on performance of your portfolio.

```{r}

#Graph the SML by calculating the average rf and mrp using the actual data. 



#This method uses the average data to get the SML, but we should use the regression model to graph the CAPM

cat("The CAPM Formula is: ", mean(rTNX_CAPM), " + beta * ", mean(riskprem_SPY_CAPM))

SML_MRP = mean(rSPY_CAPM) - mean(rTNX_CAPM)
SML_MRP
beta_range = c(0,1,2,3,4,5) 
SML_Line = mean(rTNX_CAPM) + beta_range*mean(riskprem_SPY_CAPM)
#This is the CAPM estimate of the optimal portfolios return
SML_Portfolio = mean(rTNX_CAPM) + Beta_Portfolio*mean(riskprem_SPY_CAPM)
plot(beta_range, SML_Line, col="Green", xlab="Beta", ylab="Expected Return", type="p")
#This is the CAPM estimate of the optimal portfolios return graphed
points(Beta_Portfolio, SML_Portfolio, type = "p")
#This is the actual return of the optimal portfolio graphed with the regression estimate of the optimal portfolios beta coefficient
points(Beta_Portfolio, mean(rP_CAPM), col="Red")

cat("The red dot indicates the actual return of the optimal portfolio graphed with the regression estimate of the portfolio's beta coefficient", "The black dot represents the CAPM estimate of the portfolios return graphed with the same beta estimate", "The actual portfolio rests below the SML. This indicates that the portfolio is overvalued. That is, the portfolio is receiving a lesser return for the same amount of risk. Based on CAPM theory, demand for the portfolio should decline, resulting in a lower price of the portfolios underlying returns. As a result, the return of the portfolio would increase until the portfolios point rests on the SML.")

```


6. Calculate CV, Sharpe, Treynor, and Sortino ratios for your portfolio and compare them to a similarly diversified portfolio of Vanguard, Fidelity, or any other similar portfolio.

```{r}

library("PerformanceAnalytics")


#Calculate the sharpe ratio: 

sharpe_ratio <- (return_optimal_portfolio_mean - Rf)/(Portfolio_SD)
print(sharpe_ratio)

cat("The sharpe ratio is:", sharpe_ratio, "     ")

#Calculate Sortino Ratio 
#http://braverock.com/brian/R/PerformanceAnalytics/html/SortinoRatio.html

#get monthly optimal returns to the portfolio

return_optimal_portfolio_monthly = optimalweight_matrix[1,1]*rAMZN + optimalweight_matrix[2,1]*rFB + optimalweight_matrix[3,1]*rPG + optimalweight_matrix[4,1]*rCOST + optimalweight_matrix[5,1]*rCI

 
sortino <- (SortinoRatio(return_optimal_portfolio_monthly, MAR = 0))

cat("The sortino ratio is:", sortino, "     " )

#treynor ratio = (rP - rF)/betaP 

#Calculate Beta of the Portfolio
#remember beta measure volatility relative to the market. So FB is theoretically 30% less volatile than the market 

Beta_AMZN <- 1.87
Beta_FB <- 0.70
Beta_PG <- 0.32
Beta_COST <- 1.17 
Beta_CI <- 0.79
Weighted_Beta_Portfolio <- optimalweight_matrix[1,1]*Beta_AMZN + optimalweight_matrix[2,1]*Beta_FB + optimalweight_matrix[3,1]*Beta_PG + optimalweight_matrix[4,1]*Beta_COST + optimalweight_matrix[5,1]*Beta_CI
cat("The Beta of the Portfolio is:", Weighted_Beta_Portfolio, ". Thus,the portolio's returns are theoretically 17% more volatile than the market.     ")

treynor <- ((return_optimal_portfolio_mean-Rf)/Weighted_Beta_Portfolio)
cat("The treynor ratio is:", treynor, "     ")

```


7. Calculate 2% VaR as a percentage of the mean return of your portfolio when the risk horizon is one day and one month. 

```{r}
#Reimport data for intuitiveness:  

YahooData <- getSymbols.yahoo(c("AMZN","FB","PG","COST","CI","^TNX","SPY"),.GlobalEnv, from = "2014-01-01", to= "2017-12-01", periodicity="monthly", return.class = "timeSeries")

#Calculate Stock Returns and Risk Premiums (Stock Return - Rf); Rf is rTNX 
rAMZN <- diff(log(AMZN$AMZN.Adjusted))
rFB <- diff(log(FB$FB.Adjusted))
rPG <- diff(log(PG$PG.Adjusted))
rCOST <- diff(log(COST$COST.Adjusted))
rCI <- diff(log(CI$CI.Adjusted))
rTNX <- TNX$TNX.Adjusted/100/12
#override TNX, start at index two and go down from there, remember when calculating returns for AAPL in excel you got rid of the first value, same thing here  
rTNX <- rTNX[2:length(rTNX)]
rSPY <- diff(log(SPY$SPY.Adjusted))

cat("From Question 2: The optimal weights of the portfolio:")
print(optimalweight_matrix)

#Derive the monthly returns and monthly standard defivation for the portfolio: 

return_optimal_portfolio_monthly = optimalweight_matrix[1,1]*rAMZN + optimalweight_matrix[2,1]*rFB + optimalweight_matrix[3,1]*rPG + optimalweight_matrix[4,1]*rCOST + optimalweight_matrix[5,1]*rCI 
return_optimal_portfolio_monthly

#Monthly values:
monthly_return_portfolio <- mean(return_optimal_portfolio_monthly)
monthly_sd_portfolio <- sd(return_optimal_portfolio_monthly)
#Annual values:
annual_return_portfolio <-   mean(return_optimal_portfolio_monthly)*(12)
annual_SD_portfolio <-  sd(return_optimal_portfolio_monthly)*sqrt(12)
#10 day values (250 trading days): 
tenday_return_portfolio <- annual_return_portfolio*(10/250)
tenday_sd_portfolio <- annual_SD_portfolio*sqrt(10/250)


#Derive mean monthly returns and monthly sd to the market (SPY): 

#Monthly values:
monthly_return_SPY <- mean(rSPY)
monthly_sd_SPY <- sd(rSPY)
#Annual values:
annual_return_SPY <- mean(rSPY)*(12)
annual_SD_SPY <-  sd(rSPY)*sqrt(12)
#10 day values (250 trading days): 
tenday_return_SPY <- annual_return_SPY*(10/250)
tenday_sd_SPY <- annual_SD_SPY*sqrt(10/250)

#need a function that gives inverse of normal cumulative distributio. pnorm gives CDF and qnorm gives the inverse CDF

#Calculate Mothly VaR for the Market (SPY) and the optimal portfolio

#2% VaR for Optimal Portfolio with monthly time horizon 
cat("   2% VaR for Optimal Portfolio with monthly time horizon is: ", 
qnorm(.02,monthly_return_portfolio,monthly_sd_portfolio))

cat("
    ")

#2% VaR for Optimal Portfolio with 10 day time horizon 
cat("2% VaR for Optimal Portfolio with 10 day time horizon is:",
qnorm(.02,tenday_return_portfolio,tenday_sd_portfolio))




```



9.  Using the CAPM equation of your portfolio do a five periods ex-post forecasting of the returns to your portfolio and compare your forecast to the actual returns. Find and report MAD, MAP, MASE, and RMS for your forecast.

AND

10. Using the CAPM equation of your portfolio do a five periods ex-ante forecasting of the returns to your portfolio. Find and report MAD, MAP, MASE, and RMS of your forecast. You may use ES to forecast the risk premium of S&P500 for the required five periods.

```{r}

#First, put your x and y into a data frame to simplify the forecasting code 

question_9_data_Part1 <- data.frame(riskprem_portfolio_CAPM[1:203], riskprem_SPY_CAPM[1:203])
question_9_data_Part2 <- data.frame(riskprem_portfolio_CAPM[204:208], riskprem_SPY_CAPM[204:208])
question_9_data_Fullrange <- data.frame(riskprem_portfolio_CAPM, riskprem_SPY_CAPM)

############################################################################################

#Run the regression for ex-post forecast   
reg_expost <- lm(riskprem_portfolio_CAPM ~ riskprem_SPY_CAPM, data=question_9_data_Part1)
#Ex-post forecast 
pred <- predict(reg, newdata=question_9_data_Part2, se.fit=TRUE) 
pred

plot(riskprem_portfolio_CAPM, type="l", col="red")
lines(reg$fitted.values, col="blue")

accuracy(reg_expost)

############################################################################################

#Run the regression for ex-ante forecast

#For Ex-ante Forecasting Use all the Data in Sample (data) and run the regression
reg_exante <- lm(riskprem_portfolio_CAPM ~ riskprem_SPY_CAPM, data=question_9_data_Fullrange)
#Before Forecasting add "forecast" to the Library then Forecast
library("forecast")
fore_exante <- forecast(reg_exante, newdata=data.frame(question_9_data_Fullrange), se,fit=TRUE)
fore_exante
accuracy(reg_exante)
plot(fore_exante, type="l")
############################################################################################

```


11. Do a Naïve, MA3, MA5, WMA5, and ES of the returns to your portfolio for the period 10/30/ 2018 on. Find MAD, MAPE, MASE and RMS of your forecasts. Compare the forecasting efficiency criterion of your CAPM with smoothing techniques. Which one results in a better forecasting outcome?

```{r}

library("fPortfolio")
library("quantmod")
library("timeSeries")
library("tseries")
library("stats")

#Import daily stock adj closing prices from yahoo 
YahooData_Daily <- getSymbols.yahoo(c("AMZN","FB","PG","COST","CI", "SPY", "^TNX"),.GlobalEnv, from = "2018-10-30", to= Sys.Date(), periodicity="daily", return.class = "timeSeries")

#Calculate Daily Adjusted Returns 
#Note, since day 1 you have $100, and it isn't affected by the return of the previous day, left out the first day of the returns when importing data)

rAMZN_smoothing <- diff(log(AMZN$AMZN.Adjusted))  
rFB_smoothing <- diff(log(FB$FB.Adjusted))
rPG_smoothing <- diff(log(PG$PG.Adjusted))
rCOST_smoothing <- diff(log(COST$COST.Adjusted))
rCI_smoothing <- diff(log(CI$CI.Adjusted))
rTNX_smoothing <- TNX$TNX.Adjusted/100/12
#override TNX, start at index two and go down from there, remember when calculating returns for AAPL in excel you got rid of the first value, same thing here
rTNX_smoothing <- rTNX[2:length(rTNX)]
rSPY_smoothing <- diff(log(SPY$SPY.Adjusted))
(rF_smoothing <- rTNX_smoothing)


#Get daily returns of your portfolio for this date range: 

rP_smoothing <- optimalweight_matrix[1,1]*rAMZN_smoothing + optimalweight_matrix[2,1]*rFB_smoothing + optimalweight_matrix[3,1]*rPG_smoothing + optimalweight_matrix[4,1]*rCOST_smoothing + optimalweight_matrix[5,1]*rCI_smoothing
rP_smoothing

#Naive Forecast: 
library(forecast)
Naive_forecast <- plot(snaive(rP_smoothing,2))
snaive(rP_smoothing,2)
accuracy(snaive(rP_smoothing,2))

#MA3 Forecast 
library(forecast)
ma3 <- ma(rP_smoothing, order=2)
ma3
plot(rP_smoothing)
lines(ma(rP_smoothing, order=2), col="red")
#Do we need to do this way or harsh's way?
accuracy(ma3, rP_smoothing)

#MA5 Forecast 

ma5 <- ma(rP_smoothing, order=5)
plot(rP_smoothing)
lines(ma(rP_smoothing, order=5), col="red")
accuracy(ma5, rP_smoothing)

#ES - Expontential Smoothing 

#Alpha is the dampenining parameter
fit1 <- ses(rP_smoothing, alpha=0.2, initial="simple", h=3)
fit2 <- ses(rP_smoothing, alpha=0.6, initial="simple", h=3)
fit3 <- ses(rP_smoothing, h=3)
plot(fit1, main="", fcol="white", type="o")
lines(fitted(fit1), col="blue", type="o")
lines(fitted(fit2), col="red", type="o")
lines(fitted(fit3), col="green", type="o")
lines(fit1$mean, col="blue", type="o")
lines(fit2$mean, col="red", type="o")
lines(fit3$mean, col="green", type="o")
legend("topleft",lty=1, col=c(1,"blue","red","green"), 
       c("data", expression(alpha == 0.2), expression(alpha == 0.6),
         expression(alpha == 0.89)),pch=1)

#Accuracy Measures to get MAD MASE, etc. 
accuracy(fit1)
accuracy(fit2)
accuracy(fit3)


#Compare the accuracy of all the forecasting models


#CAPM_regression error 

accuracy(CAPM_regression)

#Error in Naive Forecasting Model 
print("Naive Forecasting Model")
accuracy(snaive(rP_smoothing,3))


#Error in MA3 Forecasting Model
print("MA3 Forecasting Model")
accuracy(ma3, rP_smoothing)

#Error in MA5 Forecasting Model 
print("MA5 Forecasting Model")
accuracy(ma5, rP_smoothing)

#Error in Exponential Smoothing Forecast Model 
print("Exponential Smoothing Forecast Model")
accuracy(fit1)
accuracy(fit2)
accuracy(fit3)


#cat("
    #","The forecasting models have different error levels. It appears that the MA3 model has to smallest RMSE")


```


```{r}

#Compare the accuracy of all the forecasting models

#CAPM_regression error 

print("CAPM Model")
accuracy(CAPM_regression)

#CAPM Ex-post forecast error

accuracy(reg_expost)

#Error in Naive Forecasting Model 
print("Naive Forecasting Model")
accuracy(snaive(rP_smoothing,3))


#Error in MA3 Forecasting Model
print("MA3 Forecasting Model")
accuracy(ma3, rP_smoothing)

#Error in MA5 Forecasting Model 
print("MA5 Forecasting Model")
accuracy(ma5, rP_smoothing)

#Error in Exponential Smoothing Forecast Model 
print("Exponential Smoothing Forecast Model")
accuracy(fit1)
accuracy(fit2)
accuracy(fit3)


#cat("
    #","The forecasting models have different error levels. It appears that the MA3 model has to smallest RMSE")

```





