#Task 1 — Create Subsets
data(iris)
#1. Create a subset called setosa containing only observations where
Species == “setosa”.
setosa <- subset(iris, Species == "setosa")
#2. Create a subset called versicolor containing only observations
where Species == “versicolor”.
versicolor <- subset(iris, Species == "versicolor")
#3. Report: The sample size of each subset. The sample mean of
Sepal.Length for each subset.
n_setosa <- nrow(setosa)
n_versicolor <- nrow(versicolor)
mean_setosa <- mean(setosa$Sepal.Length)
mean_versicolor <- mean(versicolor$Sepal.Length)
n_setosa
[1] 50
n_versicolor
[1] 50
mean_setosa
[1] 5.006
mean_versicolor
[1] 5.936
#Task 2-One-Sample t-Test Confidence Interval #1.
versicolor_test <- t.test(versicolor$Sepal.Length, conf.level = 0.90)
versicolor_test
One Sample t-test
data: versicolor$Sepal.Length
t = 81.318, df = 49, p-value < 2.2e-16
alternative hypothesis: true mean is not equal to 0
90 percent confidence interval:
5.813616 6.058384
sample estimates:
mean of x
5.936
#2. # Sample mean: 5.936 # 90% confidence interval: (5.813616,
6.058384) # Degrees of freedom: 49
versicolor_test$estimate
mean of x
5.936
versicolor_test$conf.int
[1] 5.813616 6.058384
attr(,"conf.level")
[1] 0.9
versicolor_test$parameter
df
49
#Task 3 - Two-Sample Welch t-Test #1.
two_sample_test <- t.test(setosa$Sepal.Length, versicolor$Sepal.Length)
two_sample_test
Welch Two Sample t-test
data: setosa$Sepal.Length and versicolor$Sepal.Length
t = -10.521, df = 86.538, p-value < 2.2e-16
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
-1.1057074 -0.7542926
sample estimates:
mean of x mean of y
5.006 5.936
two_sample_test$estimate
mean of x mean of y
5.006 5.936
two_sample_test$conf.int
[1] -1.1057074 -0.7542926
attr(,"conf.level")
[1] 0.95
two_sample_test$p.value
[1] 3.746743e-17
#2 #The estimated difference in means (setosa − versicolor):0.93 #
95% confidence interval for the difference: (-1.1057074 -0.7542926) #
p-value: 3.746743e-17
#3 #The estimated difference in means is approximately -0.93, meaning
that setosa sepals are about 0.93 units shorter than versicolor sepals.
The 95% confidence interval for the difference is (-1.106, -.754). Since
this confidence interval does not include 0, it suggests a difference
between groups. The p-value is extremely small (3.75e-17), which is much
smaller than .05. Therefore, it is statistically significant that the
mean Sepal.Length differs between setosa and versicolor. The data
provided evidence that versicolor flowers have longer sepals on average
than setosa flowers.
#Task 4 #(a) #1.In this context the Type I error that occurs is that
when it comes to rejecting the null hypothesis that the means are equal
it’s difficult as they are equal.
#2. If α = 0.05, the probability of making a Type I error would be
5%.
#3. Rejecting the null hypothesis would be a mistake as it says that
they are different when they are actually the same.
#(b)
data(iris)
setosa <- iris[iris$Species == "setosa", "Sepal.Length"]
versicolor <- iris[iris$Species == "versicolor", "Sepal.Length"]
#Pooled
pooled <- c(setosa, versicolor)
set.seed(2026)
nrep <- 100
rejections <- integer(nrep)
for (i in 1:nrep) {
# shuffle values
shuffled <- sample(pooled)
#Two group of size 50
g1 <- shuffled[1:50]
g2 <- shuffled[51:100]
#t-test
t_res <- t.test(g1, g2)
rejections[i] <- as.integer(t_res$p.value < 0.05)
}
num_rejections <- sum(rejections)
Prop_rejections <- mean(rejections)
num_rejections
[1] 6
Prop_rejections
[1] 0.06
LS0tCnRpdGxlOiAiUiBwcm9qZWN0IDIiCiNOYW1lczogU2FyYWggSGFtaWx0b24sIERpYW5hIFF1ZXphZGEsIERhbmllbGEgQ2FsaXh0byAgCm91dHB1dDoKICBodG1sX25vdGVib29rOiBkZWZhdWx0CiAgcGRmX2RvY3VtZW50OiBkZWZhdWx0Ci0tLQojVGFzayAxIOKAlCBDcmVhdGUgU3Vic2V0cwpgYGB7cn0KZGF0YShpcmlzKQpgYGAKIzEuIENyZWF0ZSBhIHN1YnNldCBjYWxsZWQgc2V0b3NhIGNvbnRhaW5pbmcgb25seSBvYnNlcnZhdGlvbnMgd2hlcmUgU3BlY2llcyA9PSAic2V0b3NhIi4KYGBge3J9CnNldG9zYSA8LSBzdWJzZXQoaXJpcywgU3BlY2llcyA9PSAic2V0b3NhIikKYGBgCiMyLiBDcmVhdGUgYSBzdWJzZXQgY2FsbGVkIHZlcnNpY29sb3IgY29udGFpbmluZyBvbmx5IG9ic2VydmF0aW9ucyB3aGVyZSBTcGVjaWVzID09ICJ2ZXJzaWNvbG9yIi4KYGBge3J9CnZlcnNpY29sb3IgPC0gc3Vic2V0KGlyaXMsIFNwZWNpZXMgPT0gInZlcnNpY29sb3IiKQpgYGAKIzMuIFJlcG9ydDogVGhlIHNhbXBsZSBzaXplIG9mIGVhY2ggc3Vic2V0LiBUaGUgc2FtcGxlIG1lYW4gb2YgU2VwYWwuTGVuZ3RoIGZvciBlYWNoIHN1YnNldC4KYGBge3J9Cm5fc2V0b3NhIDwtIG5yb3coc2V0b3NhKQpuX3ZlcnNpY29sb3IgPC0gbnJvdyh2ZXJzaWNvbG9yKQpgYGAKCmBgYHtyfQptZWFuX3NldG9zYSA8LSBtZWFuKHNldG9zYSRTZXBhbC5MZW5ndGgpCm1lYW5fdmVyc2ljb2xvciA8LSBtZWFuKHZlcnNpY29sb3IkU2VwYWwuTGVuZ3RoKQpgYGAKCmBgYHtyfQpuX3NldG9zYQpuX3ZlcnNpY29sb3IKbWVhbl9zZXRvc2EKbWVhbl92ZXJzaWNvbG9yCmBgYAojVGFzayAyLU9uZS1TYW1wbGUgdC1UZXN0IENvbmZpZGVuY2UgSW50ZXJ2YWwKIzEuCmBgYHtyfQp2ZXJzaWNvbG9yX3Rlc3QgPC0gdC50ZXN0KHZlcnNpY29sb3IkU2VwYWwuTGVuZ3RoLCBjb25mLmxldmVsID0gMC45MCkKCnZlcnNpY29sb3JfdGVzdApgYGAKIzIuCiMgU2FtcGxlIG1lYW46IDUuOTM2CiMgOTAlIGNvbmZpZGVuY2UgaW50ZXJ2YWw6ICg1LjgxMzYxNiwgNi4wNTgzODQpCiMgRGVncmVlcyBvZiBmcmVlZG9tOiA0OQoKYGBge3J9CnZlcnNpY29sb3JfdGVzdCRlc3RpbWF0ZSAgIAp2ZXJzaWNvbG9yX3Rlc3QkY29uZi5pbnQKdmVyc2ljb2xvcl90ZXN0JHBhcmFtZXRlciAKYGBgCiNUYXNrIDMgLSBUd28tU2FtcGxlIFdlbGNoIHQtVGVzdAojMS4KYGBge3J9CnR3b19zYW1wbGVfdGVzdCA8LSB0LnRlc3Qoc2V0b3NhJFNlcGFsLkxlbmd0aCwgdmVyc2ljb2xvciRTZXBhbC5MZW5ndGgpCgp0d29fc2FtcGxlX3Rlc3QKCmBgYAoKYGBge3J9CnR3b19zYW1wbGVfdGVzdCRlc3RpbWF0ZQp0d29fc2FtcGxlX3Rlc3QkY29uZi5pbnQKdHdvX3NhbXBsZV90ZXN0JHAudmFsdWUKYGBgCiMyIAojVGhlIGVzdGltYXRlZCBkaWZmZXJlbmNlIGluIG1lYW5zIChzZXRvc2Eg4oiSIHZlcnNpY29sb3IpOjAuOTMKIyA5NSUgY29uZmlkZW5jZSBpbnRlcnZhbCBmb3IgdGhlIGRpZmZlcmVuY2U6ICgtMS4xMDU3MDc0IC0wLjc1NDI5MjYpCiMgcC12YWx1ZTogMy43NDY3NDNlLTE3CgojMyAKI1RoZSBlc3RpbWF0ZWQgZGlmZmVyZW5jZSBpbiBtZWFucyBpcyBhcHByb3hpbWF0ZWx5IC0wLjkzLCBtZWFuaW5nIHRoYXQgc2V0b3NhIHNlcGFscyBhcmUgYWJvdXQgMC45MyB1bml0cyBzaG9ydGVyIHRoYW4gdmVyc2ljb2xvciBzZXBhbHMuIFRoZSA5NSUgY29uZmlkZW5jZSBpbnRlcnZhbCBmb3IgdGhlIGRpZmZlcmVuY2UgaXMgKC0xLjEwNiwgLS43NTQpLiBTaW5jZSB0aGlzIGNvbmZpZGVuY2UgaW50ZXJ2YWwgZG9lcyBub3QgaW5jbHVkZSAwLCBpdCBzdWdnZXN0cyBhIGRpZmZlcmVuY2UgYmV0d2VlbiBncm91cHMuIFRoZSBwLXZhbHVlIGlzIGV4dHJlbWVseSBzbWFsbCAoMy43NWUtMTcpLCB3aGljaCBpcyBtdWNoIHNtYWxsZXIgdGhhbiAuMDUuIFRoZXJlZm9yZSwgaXQgaXMgc3RhdGlzdGljYWxseSBzaWduaWZpY2FudCB0aGF0IHRoZSBtZWFuIFNlcGFsLkxlbmd0aCBkaWZmZXJzIGJldHdlZW4gc2V0b3NhIGFuZCB2ZXJzaWNvbG9yLiBUaGUgZGF0YSBwcm92aWRlZCBldmlkZW5jZSB0aGF0IHZlcnNpY29sb3IgZmxvd2VycyBoYXZlIGxvbmdlciBzZXBhbHMgb24gYXZlcmFnZSB0aGFuIHNldG9zYSBmbG93ZXJzLgoKI1Rhc2sgNAojKGEpCiMxLkluIHRoaXMgY29udGV4dCB0aGUgVHlwZSBJIGVycm9yIHRoYXQgb2NjdXJzIGlzIHRoYXQgd2hlbiBpdCBjb21lcyB0byByZWplY3RpbmcgdGhlIG51bGwgaHlwb3RoZXNpcyB0aGF0IHRoZSBtZWFucyBhcmUgZXF1YWwgaXQncyBkaWZmaWN1bHQgYXMgdGhleSBhcmUgZXF1YWwuCgojMi4gSWYgzrEgPSAwLjA1LCB0aGUgcHJvYmFiaWxpdHkgb2YgbWFraW5nIGEgVHlwZSBJIGVycm9yIHdvdWxkIGJlIDUlLiAKCiMzLiBSZWplY3RpbmcgdGhlIG51bGwgaHlwb3RoZXNpcyB3b3VsZCBiZSBhIG1pc3Rha2UgYXMgaXQgc2F5cyB0aGF0IHRoZXkgYXJlIGRpZmZlcmVudCB3aGVuIHRoZXkgYXJlIGFjdHVhbGx5IHRoZSBzYW1lLgoKIyhiKQpgYGB7cn0KZGF0YShpcmlzKQoKc2V0b3NhIDwtIGlyaXNbaXJpcyRTcGVjaWVzID09ICJzZXRvc2EiLCAiU2VwYWwuTGVuZ3RoIl0KdmVyc2ljb2xvciA8LSBpcmlzW2lyaXMkU3BlY2llcyA9PSAidmVyc2ljb2xvciIsICJTZXBhbC5MZW5ndGgiXQoKI1Bvb2xlZCAKcG9vbGVkIDwtIGMoc2V0b3NhLCB2ZXJzaWNvbG9yKQoKc2V0LnNlZWQoMjAyNikKCm5yZXAgPC0gMTAwCnJlamVjdGlvbnMgPC0gaW50ZWdlcihucmVwKQoKZm9yIChpIGluIDE6bnJlcCkgewojIHNodWZmbGUgdmFsdWVzCiAgc2h1ZmZsZWQgPC0gc2FtcGxlKHBvb2xlZCkKCiNUd28gZ3JvdXAgb2Ygc2l6ZSA1MAogIGcxIDwtIHNodWZmbGVkWzE6NTBdCiAgZzIgPC0gc2h1ZmZsZWRbNTE6MTAwXQoKI3QtdGVzdAogIHRfcmVzIDwtIHQudGVzdChnMSwgZzIpCiAgCiAgcmVqZWN0aW9uc1tpXSA8LSBhcy5pbnRlZ2VyKHRfcmVzJHAudmFsdWUgPCAwLjA1KQp9CgpudW1fcmVqZWN0aW9ucyA8LSBzdW0ocmVqZWN0aW9ucykKUHJvcF9yZWplY3Rpb25zIDwtIG1lYW4ocmVqZWN0aW9ucykKCm51bV9yZWplY3Rpb25zIApQcm9wX3JlamVjdGlvbnMKYGBgCgoK