Get access to the Probablity Lab
kobe<-read.csv("C:\\Users\\lizza\\Documents\\CUNY - Data Analytics\\DATA 606 - Probablity and Statistics\\Week 2 Lab\\kobe.csv")
#Use the head function to obtain the first several rows of a data matrix or data frame
head(kobe)
## vs game quarter time
## 1 ORL 1 1 9:47
## 2 ORL 1 1 9:07
## 3 ORL 1 1 8:11
## 4 ORL 1 1 7:41
## 5 ORL 1 1 7:03
## 6 ORL 1 1 6:01
## description basket
## 1 Kobe Bryant makes 4-foot two point shot H
## 2 Kobe Bryant misses jumper M
## 3 Kobe Bryant misses 7-foot jumper M
## 4 Kobe Bryant makes 16-foot jumper (Derek Fisher assists) H
## 5 Kobe Bryant makes driving layup H
## 6 Kobe Bryant misses jumper M
#Sequence of hits and misses from his 9 shot attemtpts in the first quarter
kobe$basket[1:9]
## [1] H M M H H M M M M
## Levels: H M
What does a streak length of 1 mean, i.e. how many hits and misses are in a streak of 1? What about a streak length of 0?
#Received error
#Error in calc_streak(kobe$basket) : could not find function "calc_streak"
#kobe_streak <- calc_streak(kobe$basket)
#barplot(table(kobe_streak))
Describe the distribution of Kobe’s streak lengths from the 2009 NBA finals. What was his typical streak length? How long was his longest streak of baskets?
Simulations in R
#R creates rando numbers to simulate flipping a fair coin
outcomes <-c("heads","tails")
sample(outcomes, size=1, replace=TRUE)
## [1] "heads"
#The vector outcomes can be thought of as a hat with two slips of paper in it: one slip says heads and the other says tails. The function sample draws one slip from the hat and tells us if it was a head or a tail.
#The size argument tells R how many samples to draw
#Replace=TRUE indicates we put the slip of paper back in the hat before drawing again
sim_fair_coin <-sample(outcomes, size=100, replace=TRUE)
sim_fair_coin
## [1] "tails" "tails" "tails" "tails" "heads" "tails" "tails" "tails"
## [9] "heads" "heads" "tails" "heads" "tails" "tails" "tails" "tails"
## [17] "tails" "tails" "tails" "heads" "tails" "heads" "tails" "heads"
## [25] "tails" "tails" "heads" "heads" "tails" "tails" "heads" "heads"
## [33] "tails" "heads" "heads" "heads" "tails" "heads" "heads" "heads"
## [41] "tails" "tails" "tails" "tails" "heads" "tails" "tails" "tails"
## [49] "heads" "tails" "tails" "tails" "tails" "heads" "heads" "tails"
## [57] "heads" "heads" "heads" "tails" "heads" "heads" "heads" "heads"
## [65] "heads" "heads" "tails" "heads" "heads" "tails" "tails" "heads"
## [73] "tails" "heads" "heads" "heads" "tails" "tails" "heads" "heads"
## [81] "tails" "heads" "tails" "tails" "heads" "tails" "heads" "tails"
## [89] "heads" "heads" "tails" "heads" "heads" "tails" "tails" "tails"
## [97] "heads" "tails" "tails" "heads"
table(sim_fair_coin)
## sim_fair_coin
## heads tails
## 47 53
#Say we're trying to simulate an unfair coin that we know only lands heads 20% of the time. We can adjust for this by adding an argument called prob, which provides a vector of two probability weights.
sim_unfair_coin <-sample(outcomes, size=100, replace=TRUE, prob=c(0.2,0.8))
sim_unfair_coin
## [1] "heads" "tails" "tails" "tails" "tails" "tails" "heads" "tails"
## [9] "tails" "tails" "heads" "tails" "tails" "tails" "tails" "tails"
## [17] "tails" "tails" "tails" "tails" "tails" "tails" "tails" "tails"
## [25] "tails" "heads" "tails" "heads" "tails" "heads" "tails" "tails"
## [33] "tails" "tails" "tails" "tails" "tails" "heads" "tails" "tails"
## [41] "tails" "tails" "tails" "tails" "tails" "tails" "tails" "tails"
## [49] "tails" "tails" "tails" "tails" "heads" "tails" "tails" "tails"
## [57] "tails" "tails" "tails" "tails" "tails" "heads" "heads" "tails"
## [65] "tails" "heads" "tails" "tails" "heads" "tails" "tails" "tails"
## [73] "tails" "tails" "tails" "tails" "tails" "tails" "heads" "tails"
## [81] "heads" "tails" "tails" "heads" "heads" "tails" "tails" "tails"
## [89] "tails" "heads" "heads" "heads" "tails" "tails" "tails" "tails"
## [97] "tails" "tails" "tails" "tails"
table(sim_unfair_coin)
## sim_unfair_coin
## heads tails
## 19 81
#Heads will have a probability of 20% and tails 80%
In your simulation of flipping the unfair coin 100 times, how many flips came up heads?
Tails populated 74 times while Heads populated 26
Simulating the Independent Shooter
#To simulate a single shot from an independent shooter with a shooting percentage of 50% we type
outcomes <- c("H","M")
sim_basket <- sample(outcomes, size=1, replace= TRUE)
sim_basket
## [1] "M"
table(sim_basket)
## sim_basket
## M
## 1
What change needs to be made to the sample function so that it reflects a shooting percentage of 45%? Make this adjustment, then run a simulation to sample 133 shots. Assign the output of this simulation to a new object called sim_basket.
outcomes <- c("H","M")
sim_basket <- sample(outcomes, size=133, replace=TRUE, prob=c(0.45,0.55))
sim_basket
## [1] "M" "M" "H" "H" "H" "M" "H" "H" "H" "M" "H" "H" "H" "H" "H" "H" "H"
## [18] "M" "H" "M" "M" "H" "H" "M" "M" "M" "M" "M" "H" "M" "H" "M" "M" "M"
## [35] "M" "M" "M" "M" "M" "M" "H" "H" "M" "M" "M" "H" "M" "M" "H" "H" "M"
## [52] "M" "M" "M" "H" "H" "M" "H" "H" "H" "H" "M" "H" "H" "M" "M" "M" "M"
## [69] "M" "M" "M" "M" "M" "M" "M" "M" "M" "H" "M" "M" "M" "M" "H" "H" "H"
## [86] "M" "H" "H" "M" "M" "M" "H" "M" "M" "H" "H" "H" "H" "H" "H" "H" "M"
## [103] "M" "H" "H" "H" "H" "M" "M" "M" "H" "M" "H" "M" "M" "M" "M" "H" "M"
## [120] "M" "M" "M" "M" "H" "H" "M" "M" "M" "H" "H" "M" "M" "M"
table(sim_basket)
## sim_basket
## H M
## 56 77
Comparison
kobe$basket
## [1] H M M H H M M M M H H H M H H M M H H H M M H M H H H M M M M M M H M
## [36] H M M H H H H M H M M H M M H M M H M H H M M H M H H M H M M M H M M
## [71] M M H M H M M H M M H H M M M M H H H M M H M M H M H H M H M M H M M
## [106] M H M H H H M H H H M H M H M M M M M M H M H M M M M H
## Levels: H M
sim_basket
## [1] "M" "M" "H" "H" "H" "M" "H" "H" "H" "M" "H" "H" "H" "H" "H" "H" "H"
## [18] "M" "H" "M" "M" "H" "H" "M" "M" "M" "M" "M" "H" "M" "H" "M" "M" "M"
## [35] "M" "M" "M" "M" "M" "M" "H" "H" "M" "M" "M" "H" "M" "M" "H" "H" "M"
## [52] "M" "M" "M" "H" "H" "M" "H" "H" "H" "H" "M" "H" "H" "M" "M" "M" "M"
## [69] "M" "M" "M" "M" "M" "M" "M" "M" "M" "H" "M" "M" "M" "M" "H" "H" "H"
## [86] "M" "H" "H" "M" "M" "M" "H" "M" "M" "H" "H" "H" "H" "H" "H" "H" "M"
## [103] "M" "H" "H" "H" "H" "M" "M" "M" "H" "M" "H" "M" "M" "M" "M" "H" "M"
## [120] "M" "M" "M" "M" "H" "H" "M" "M" "M" "H" "H" "M" "M" "M"