#Case-scenario 1
#This is the fourth season of outfielder Luis Robert with the Chicago White Socks. If during the first three seasons he hit 11, 13, and 12 home runs, how many does he need on this season for his overall average to be at least 20?

#Solution
# Home-runs so far
HR_before <- c(11, 13, 12)
# Average Number of Home-runs per season wanted
wanted_HR <- 20
# Number of seasons
n_seasons <- 4
# Needed Home-runs on season 4
x_4 <- n_seasons*wanted_HR - sum(HR_before)
# Minimum number of Home-runs needed by Robert
x_4
[1] 44
# Robert's performance
Robert_HRs <- c(11, 13, 12,44)
# Find mean
mean(Robert_HRs)
[1] 20
# Find standard deviation
sd(Robert_HRs)
[1] 16.02082
# Find the maximum number of home-runs during the four seasons period
max(Robert_HRs)
[1] 44
# Find the minimum number of home-runs during the four seasons period
min(Robert_HRs)
[1] 11
summary(Robert_HRs)
   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
  11.00   11.75   12.50   20.00   20.75   44.00 
#Question 1
#Now, I must complete the problem below which represents a similar case scenario. 

#This is the sixth season of outfielder Juan Soto in the majors. If during the first five seasons he received 79, 108,41,145, and 135 walks, how many does he need on this season for his overall number of walks per season to be at least 100?

# Walks for Juan Soto
Soto_walks <- c(79, 108, 41, 145, 135)
n_seasons  <- 6
desired_walks <- 100

# Sum of the first five seasons
sum_first5 <- sum(Soto_walks)

# Solve for x6
x_6 <- n_seasons * desired_walks - sum_first5
x_6
[1] 92
#Case-scenario 2
The average salary of 10 baseball players is 72,000 dollars a week and the average salary of 4 soccer players is 84,000. Find the mean salary of all 14 professional players.
n_1 <- 10
n_2 <- 4
y_1 <- 72000
y_2 <- 84000
# Mean salary overall
salary_ave <-  (n_1*y_1 + n_2*y_2)/(n_1+n_2)
salary_ave
[1] 75428.57
#The average salary of 7 basketball players is 102,000 dollars a week and the average salary of 9 NFL players is 91,000. Find the mean salary of all 16 professional players.

n_bb  <- 7     # number of basketball players
y_bb  <- 102000 # average basketball salary
n_nfl <- 9     # number of NFL players
y_nfl <- 91000  # average NFL salary

# Combine
combined_mean <- (n_bb*y_bb + n_nfl*y_nfl)/(n_bb + n_nfl)
combined_mean
[1] 95812.5
#Case-scenario 3
#The frequency distribution below lists the number of active players in the Barclays Premier League and the time left in their contract.

Years   Number of players
6   28
5   72
4   201
3   109
2   56
1   34

Q1.Find the mean,the median and the standard deviation.

Q2. What percentage of the data lies within one standard deviation of the mean?

Q3. What percentage of the data lies within two standard deviations of the mean?

Q4. What percent of the data lies within three standard deviations of the mean?

Q5. Draw a histogram to illustrate the data.
contract_length <- read.table("allcontracts.csv", header = TRUE, sep = ",")
contract_years <- contract_length$years
# Mean 
contracts_mean  <- mean(contract_years)
contracts_mean
[1] 3.458918
# Median
contracts_median <- median(contract_years)
contracts_median
[1] 3
# Find number of observations
contracts_n <- length(contract_years)
# Find standard deviation
contracts_sd <- sd(contract_years)
contracts_w1sd <- sum((contract_years - contracts_mean)/contracts_sd < 1)/ contracts_n
# Percentage of observation within one standard deviation of the mean
contracts_w1sd
[1] 0.8416834
## Difference from empirical 
contracts_w1sd - 0.68
[1] 0.1616834
## Within 2 sd
contracts_w2sd <- sum((contract_years - contracts_mean)/ contracts_sd < 2)/contracts_n
contracts_w2sd
[1] 1
## Difference from empirical 
contracts_w2sd - 0.95
[1] 0.05
## Within 3 sd 
contracts_w3sd <- sum((contract_years - contracts_mean)/ contracts_sd < 3)/contracts_n
contracts_w3sd
[1] 1
## Difference from empirical 
contracts_w3sd - 0.9973
[1] 0.0027
# Create histogram
hist(contract_years,xlab = "Years Left in Contract",col = "green",border = "red", xlim = c(0,8), ylim = c(0,225),
   breaks = 5)

# 1) Read the CSV file

doubles_data <- read.csv("doubles_hit.csv", header = TRUE)
# 2) Extract the relevant column

my_doubles <- doubles_data$doubles  
# 3) Calculate basic statistics

doubles_mean   <- mean(my_doubles)    # Mean
doubles_median <- median(my_doubles)  # Median
doubles_sd     <- sd(my_doubles)      # Standard Deviation
doubles_n      <- length(my_doubles)  # Number of observations

# Print out results
doubles_mean
[1] 23.55
doubles_median
[1] 23.5
doubles_sd
[1] 13.37371
doubles_n
[1] 100
# 4) Calculate % of data within 1, 2, and 3 SDs of the mean using absolute value ensures we look at both sides of the mean.
doubles_w1sd <- sum(abs(my_doubles - doubles_mean) / doubles_sd < 1) / doubles_n
doubles_w2sd <- sum(abs(my_doubles - doubles_mean) / doubles_sd < 2) / doubles_n
doubles_w3sd <- sum(abs(my_doubles - doubles_mean) / doubles_sd < 3) / doubles_n

doubles_w1sd
[1] 0.58
doubles_w2sd
[1] 1
doubles_w3sd
[1] 1
# Optionally compare to Empirical Rule (68%, 95%, 99.7%)
doubles_w1sd - 0.68
[1] -0.1
doubles_w2sd - 0.95
[1] 0.05
doubles_w3sd - 0.9973
[1] 0.0027
# 5) Draw a histogram of the doubles hit

hist(my_doubles,
     main  = "Histogram of Doubles Hit",
     xlab  = "Number of Doubles",
     breaks = 10   
     )

LS0tCnRpdGxlOiAiR2V0dGluZyBTdGFydGVkIFdpdGggUiBQYXJ0IDIiCm91dHB1dDogaHRtbF9ub3RlYm9vawotLS0KCgpgYGB7cn0KI0Nhc2Utc2NlbmFyaW8gMQojVGhpcyBpcyB0aGUgZm91cnRoIHNlYXNvbiBvZiBvdXRmaWVsZGVyIEx1aXMgUm9iZXJ0IHdpdGggdGhlIENoaWNhZ28gV2hpdGUgU29ja3MuIElmIGR1cmluZyB0aGUgZmlyc3QgdGhyZWUgc2Vhc29ucyBoZSBoaXQgMTEsIDEzLCBhbmQgMTIgaG9tZSBydW5zLCBob3cgbWFueSBkb2VzIGhlIG5lZWQgb24gdGhpcyBzZWFzb24gZm9yIGhpcyBvdmVyYWxsIGF2ZXJhZ2UgdG8gYmUgYXQgbGVhc3QgMjA/CgojU29sdXRpb24KIyBIb21lLXJ1bnMgc28gZmFyCkhSX2JlZm9yZSA8LSBjKDExLCAxMywgMTIpCiMgQXZlcmFnZSBOdW1iZXIgb2YgSG9tZS1ydW5zIHBlciBzZWFzb24gd2FudGVkCndhbnRlZF9IUiA8LSAyMAojIE51bWJlciBvZiBzZWFzb25zCm5fc2Vhc29ucyA8LSA0CiMgTmVlZGVkIEhvbWUtcnVucyBvbiBzZWFzb24gNAp4XzQgPC0gbl9zZWFzb25zKndhbnRlZF9IUiAtIHN1bShIUl9iZWZvcmUpCiMgTWluaW11bSBudW1iZXIgb2YgSG9tZS1ydW5zIG5lZWRlZCBieSBSb2JlcnQKeF80CmBgYApgYGB7cn0KIyBSb2JlcnQncyBwZXJmb3JtYW5jZQpSb2JlcnRfSFJzIDwtIGMoMTEsIDEzLCAxMiw0NCkKIyBGaW5kIG1lYW4KbWVhbihSb2JlcnRfSFJzKQpgYGAKYGBge3J9CiMgRmluZCBzdGFuZGFyZCBkZXZpYXRpb24Kc2QoUm9iZXJ0X0hScykKYGBgCmBgYHtyfQojIEZpbmQgdGhlIG1heGltdW0gbnVtYmVyIG9mIGhvbWUtcnVucyBkdXJpbmcgdGhlIGZvdXIgc2Vhc29ucyBwZXJpb2QKbWF4KFJvYmVydF9IUnMpCmBgYApgYGB7cn0KIyBGaW5kIHRoZSBtaW5pbXVtIG51bWJlciBvZiBob21lLXJ1bnMgZHVyaW5nIHRoZSBmb3VyIHNlYXNvbnMgcGVyaW9kCm1pbihSb2JlcnRfSFJzKQpgYGAKYGBge3J9CnN1bW1hcnkoUm9iZXJ0X0hScykKYGBgCmBgYHtyfQojUXVlc3Rpb24gMQojTm93LCBJIG11c3QgY29tcGxldGUgdGhlIHByb2JsZW0gYmVsb3cgd2hpY2ggcmVwcmVzZW50cyBhIHNpbWlsYXIgY2FzZSBzY2VuYXJpby4gCgojVGhpcyBpcyB0aGUgc2l4dGggc2Vhc29uIG9mIG91dGZpZWxkZXIgSnVhbiBTb3RvIGluIHRoZSBtYWpvcnMuIElmIGR1cmluZyB0aGUgZmlyc3QgZml2ZSBzZWFzb25zIGhlIHJlY2VpdmVkIDc5LCAxMDgsNDEsMTQ1LCBhbmQgMTM1IHdhbGtzLCBob3cgbWFueSBkb2VzIGhlIG5lZWQgb24gdGhpcyBzZWFzb24gZm9yIGhpcyBvdmVyYWxsIG51bWJlciBvZiB3YWxrcyBwZXIgc2Vhc29uIHRvIGJlIGF0IGxlYXN0IDEwMD8KCiMgV2Fsa3MgZm9yIEp1YW4gU290bwpTb3RvX3dhbGtzIDwtIGMoNzksIDEwOCwgNDEsIDE0NSwgMTM1KQpuX3NlYXNvbnMgIDwtIDYKZGVzaXJlZF93YWxrcyA8LSAxMDAKCiMgU3VtIG9mIHRoZSBmaXJzdCBmaXZlIHNlYXNvbnMKc3VtX2ZpcnN0NSA8LSBzdW0oU290b193YWxrcykKCiMgU29sdmUgZm9yIHg2CnhfNiA8LSBuX3NlYXNvbnMgKiBkZXNpcmVkX3dhbGtzIC0gc3VtX2ZpcnN0NQp4XzYKYGBgCgpgYGB7cn0KI0Nhc2Utc2NlbmFyaW8gMgpUaGUgYXZlcmFnZSBzYWxhcnkgb2YgMTAgYmFzZWJhbGwgcGxheWVycyBpcyA3MiwwMDAgZG9sbGFycyBhIHdlZWsgYW5kIHRoZSBhdmVyYWdlIHNhbGFyeSBvZiA0IHNvY2NlciBwbGF5ZXJzIGlzIDg0LDAwMC4gRmluZCB0aGUgbWVhbiBzYWxhcnkgb2YgYWxsIDE0IHByb2Zlc3Npb25hbCBwbGF5ZXJzLgpgYGAKCgpgYGB7cn0Kbl8xIDwtIDEwCm5fMiA8LSA0CnlfMSA8LSA3MjAwMAp5XzIgPC0gODQwMDAKIyBNZWFuIHNhbGFyeSBvdmVyYWxsCnNhbGFyeV9hdmUgPC0gIChuXzEqeV8xICsgbl8yKnlfMikvKG5fMStuXzIpCnNhbGFyeV9hdmUKYGBgCgoKYGBge3J9CiNUaGUgYXZlcmFnZSBzYWxhcnkgb2YgNyBiYXNrZXRiYWxsIHBsYXllcnMgaXMgMTAyLDAwMCBkb2xsYXJzIGEgd2VlayBhbmQgdGhlIGF2ZXJhZ2Ugc2FsYXJ5IG9mIDkgTkZMIHBsYXllcnMgaXMgOTEsMDAwLiBGaW5kIHRoZSBtZWFuIHNhbGFyeSBvZiBhbGwgMTYgcHJvZmVzc2lvbmFsIHBsYXllcnMuCgpuX2JiICA8LSA3ICAgICAjIG51bWJlciBvZiBiYXNrZXRiYWxsIHBsYXllcnMKeV9iYiAgPC0gMTAyMDAwICMgYXZlcmFnZSBiYXNrZXRiYWxsIHNhbGFyeQpuX25mbCA8LSA5ICAgICAjIG51bWJlciBvZiBORkwgcGxheWVycwp5X25mbCA8LSA5MTAwMCAgIyBhdmVyYWdlIE5GTCBzYWxhcnkKCiMgQ29tYmluZQpjb21iaW5lZF9tZWFuIDwtIChuX2JiKnlfYmIgKyBuX25mbCp5X25mbCkvKG5fYmIgKyBuX25mbCkKY29tYmluZWRfbWVhbgoKYGBgCgoKYGBge3J9CiNDYXNlLXNjZW5hcmlvIDMKI1RoZSBmcmVxdWVuY3kgZGlzdHJpYnV0aW9uIGJlbG93IGxpc3RzIHRoZSBudW1iZXIgb2YgYWN0aXZlIHBsYXllcnMgaW4gdGhlIEJhcmNsYXlzIFByZW1pZXIgTGVhZ3VlIGFuZCB0aGUgdGltZSBsZWZ0IGluIHRoZWlyIGNvbnRyYWN0LgoKWWVhcnMJTnVtYmVyIG9mIHBsYXllcnMKNgkyOAo1CTcyCjQJMjAxCjMJMTA5CjIJNTYKMQkzNAoKUTEuRmluZCB0aGUgbWVhbix0aGUgbWVkaWFuIGFuZCB0aGUgc3RhbmRhcmQgZGV2aWF0aW9uLgoKUTIuIFdoYXQgcGVyY2VudGFnZSBvZiB0aGUgZGF0YSBsaWVzIHdpdGhpbiBvbmUgc3RhbmRhcmQgZGV2aWF0aW9uIG9mIHRoZSBtZWFuPwoKUTMuIFdoYXQgcGVyY2VudGFnZSBvZiB0aGUgZGF0YSBsaWVzIHdpdGhpbiB0d28gc3RhbmRhcmQgZGV2aWF0aW9ucyBvZiB0aGUgbWVhbj8KClE0LiBXaGF0IHBlcmNlbnQgb2YgdGhlIGRhdGEgbGllcyB3aXRoaW4gdGhyZWUgc3RhbmRhcmQgZGV2aWF0aW9ucyBvZiB0aGUgbWVhbj8KClE1LiBEcmF3IGEgaGlzdG9ncmFtIHRvIGlsbHVzdHJhdGUgdGhlIGRhdGEuCmBgYAoKCmBgYHtyfQpjb250cmFjdF9sZW5ndGggPC0gcmVhZC50YWJsZSgiYWxsY29udHJhY3RzLmNzdiIsIGhlYWRlciA9IFRSVUUsIHNlcCA9ICIsIikKY29udHJhY3RfeWVhcnMgPC0gY29udHJhY3RfbGVuZ3RoJHllYXJzCmBgYAoKYGBge3J9CiMgTWVhbiAKY29udHJhY3RzX21lYW4gIDwtIG1lYW4oY29udHJhY3RfeWVhcnMpCmNvbnRyYWN0c19tZWFuCmBgYAoKYGBge3J9CiMgTWVkaWFuCmNvbnRyYWN0c19tZWRpYW4gPC0gbWVkaWFuKGNvbnRyYWN0X3llYXJzKQpjb250cmFjdHNfbWVkaWFuCmBgYApgYGB7cn0KIyBGaW5kIG51bWJlciBvZiBvYnNlcnZhdGlvbnMKY29udHJhY3RzX24gPC0gbGVuZ3RoKGNvbnRyYWN0X3llYXJzKQojIEZpbmQgc3RhbmRhcmQgZGV2aWF0aW9uCmNvbnRyYWN0c19zZCA8LSBzZChjb250cmFjdF95ZWFycykKYGBgCgpgYGB7cn0KY29udHJhY3RzX3cxc2QgPC0gc3VtKChjb250cmFjdF95ZWFycyAtIGNvbnRyYWN0c19tZWFuKS9jb250cmFjdHNfc2QgPCAxKS8gY29udHJhY3RzX24KIyBQZXJjZW50YWdlIG9mIG9ic2VydmF0aW9uIHdpdGhpbiBvbmUgc3RhbmRhcmQgZGV2aWF0aW9uIG9mIHRoZSBtZWFuCmNvbnRyYWN0c193MXNkCmBgYApgYGB7cn0KIyMgRGlmZmVyZW5jZSBmcm9tIGVtcGlyaWNhbCAKY29udHJhY3RzX3cxc2QgLSAwLjY4CmBgYApgYGB7cn0KIyMgV2l0aGluIDIgc2QKY29udHJhY3RzX3cyc2QgPC0gc3VtKChjb250cmFjdF95ZWFycyAtIGNvbnRyYWN0c19tZWFuKS8gY29udHJhY3RzX3NkIDwgMikvY29udHJhY3RzX24KY29udHJhY3RzX3cyc2QKYGBgCmBgYHtyfQojIyBEaWZmZXJlbmNlIGZyb20gZW1waXJpY2FsIApjb250cmFjdHNfdzJzZCAtIDAuOTUKYGBgCmBgYHtyfQojIyBXaXRoaW4gMyBzZCAKY29udHJhY3RzX3czc2QgPC0gc3VtKChjb250cmFjdF95ZWFycyAtIGNvbnRyYWN0c19tZWFuKS8gY29udHJhY3RzX3NkIDwgMykvY29udHJhY3RzX24KY29udHJhY3RzX3czc2QKYGBgCmBgYHtyfQojIyBEaWZmZXJlbmNlIGZyb20gZW1waXJpY2FsIApjb250cmFjdHNfdzNzZCAtIDAuOTk3MwpgYGAKYGBge3J9CiMgQ3JlYXRlIGhpc3RvZ3JhbQpoaXN0KGNvbnRyYWN0X3llYXJzLHhsYWIgPSAiWWVhcnMgTGVmdCBpbiBDb250cmFjdCIsY29sID0gImdyZWVuIixib3JkZXIgPSAicmVkIiwgeGxpbSA9IGMoMCw4KSwgeWxpbSA9IGMoMCwyMjUpLAogICBicmVha3MgPSA1KQpgYGAKYGBge3J9CiMgMSkgUmVhZCB0aGUgQ1NWIGZpbGUKCmRvdWJsZXNfZGF0YSA8LSByZWFkLmNzdigiZG91Ymxlc19oaXQuY3N2IiwgaGVhZGVyID0gVFJVRSkKYGBgCgpgYGB7cn0KIyAyKSBFeHRyYWN0IHRoZSByZWxldmFudCBjb2x1bW4KCm15X2RvdWJsZXMgPC0gZG91Ymxlc19kYXRhJGRvdWJsZXMgIApgYGAKCmBgYHtyfQojIDMpIENhbGN1bGF0ZSBiYXNpYyBzdGF0aXN0aWNzCgpkb3VibGVzX21lYW4gICA8LSBtZWFuKG15X2RvdWJsZXMpICAgICMgTWVhbgpkb3VibGVzX21lZGlhbiA8LSBtZWRpYW4obXlfZG91YmxlcykgICMgTWVkaWFuCmRvdWJsZXNfc2QgICAgIDwtIHNkKG15X2RvdWJsZXMpICAgICAgIyBTdGFuZGFyZCBEZXZpYXRpb24KZG91Ymxlc19uICAgICAgPC0gbGVuZ3RoKG15X2RvdWJsZXMpICAjIE51bWJlciBvZiBvYnNlcnZhdGlvbnMKCiMgUHJpbnQgb3V0IHJlc3VsdHMKZG91Ymxlc19tZWFuCmRvdWJsZXNfbWVkaWFuCmRvdWJsZXNfc2QKZG91Ymxlc19uCmBgYApgYGB7cn0KIyA0KSBDYWxjdWxhdGUgJSBvZiBkYXRhIHdpdGhpbiAxLCAyLCBhbmQgMyBTRHMgb2YgdGhlIG1lYW4gdXNpbmcgYWJzb2x1dGUgdmFsdWUgZW5zdXJlcyB3ZSBsb29rIGF0IGJvdGggc2lkZXMgb2YgdGhlIG1lYW4uCmRvdWJsZXNfdzFzZCA8LSBzdW0oYWJzKG15X2RvdWJsZXMgLSBkb3VibGVzX21lYW4pIC8gZG91Ymxlc19zZCA8IDEpIC8gZG91Ymxlc19uCmRvdWJsZXNfdzJzZCA8LSBzdW0oYWJzKG15X2RvdWJsZXMgLSBkb3VibGVzX21lYW4pIC8gZG91Ymxlc19zZCA8IDIpIC8gZG91Ymxlc19uCmRvdWJsZXNfdzNzZCA8LSBzdW0oYWJzKG15X2RvdWJsZXMgLSBkb3VibGVzX21lYW4pIC8gZG91Ymxlc19zZCA8IDMpIC8gZG91Ymxlc19uCgpkb3VibGVzX3cxc2QKZG91Ymxlc193MnNkCmRvdWJsZXNfdzNzZAoKIyBPcHRpb25hbGx5IGNvbXBhcmUgdG8gRW1waXJpY2FsIFJ1bGUgKDY4JSwgOTUlLCA5OS43JSkKZG91Ymxlc193MXNkIC0gMC42OApkb3VibGVzX3cyc2QgLSAwLjk1CmRvdWJsZXNfdzNzZCAtIDAuOTk3MwpgYGAKYGBge3J9CiMgNSkgRHJhdyBhIGhpc3RvZ3JhbSBvZiB0aGUgZG91YmxlcyBoaXQKCmhpc3QobXlfZG91YmxlcywKICAgICBtYWluICA9ICJIaXN0b2dyYW0gb2YgRG91YmxlcyBIaXQiLAogICAgIHhsYWIgID0gIk51bWJlciBvZiBEb3VibGVzIiwKICAgICBicmVha3MgPSAxMCAgIAogICAgICkKYGBgCgoKCg==