library(openintro)
## Warning: package 'openintro' was built under R version 4.2.3
## Loading required package: airports
## Warning: package 'airports' was built under R version 4.2.3
## Loading required package: cherryblossom
## Warning: package 'cherryblossom' was built under R version 4.2.3
## Loading required package: usdata
## Warning: package 'usdata' was built under R version 4.2.3
# Auto-print the yrbss data set (available after library(openintro)) to
# preview its first rows and column types.
yrbss
## # A tibble: 13,583 × 13
## age gender grade hispanic race height weight helme…¹ text_…² physi…³
## <int> <chr> <chr> <chr> <chr> <dbl> <dbl> <chr> <chr> <int>
## 1 14 female 9 not Black or A… NA NA never 0 4
## 2 14 female 9 not Black or A… NA NA never <NA> 2
## 3 15 female 9 hispanic Native Haw… 1.73 84.4 never 30 7
## 4 15 female 9 not Black or A… 1.6 55.8 never 0 0
## 5 15 female 9 not Black or A… 1.5 46.7 did no… did no… 2
## 6 15 female 9 not Black or A… 1.57 67.1 did no… did no… 1
## 7 15 female 9 not Black or A… 1.65 132. did no… <NA> 4
## 8 14 male 9 not Black or A… 1.88 71.2 never <NA> 4
## 9 15 male 9 not Black or A… 1.75 63.5 never <NA> 5
## 10 15 male 10 not Black or A… 1.37 97.1 did no… <NA> 0
## # … with 13,573 more rows, 3 more variables: hours_tv_per_school_day <chr>,
## # strength_training_7d <int>, school_night_hours_sleep <chr>, and abbreviated
## # variable names ¹helmet_12m, ²text_while_driving_30d, ³physically_active_7d
# Show the compact structure of yrbss: one line per column with its type
# and first few values.
str(yrbss)
## tibble [13,583 × 13] (S3: tbl_df/tbl/data.frame)
## $ age : int [1:13583] 14 14 15 15 15 15 15 14 15 15 ...
## $ gender : chr [1:13583] "female" "female" "female" "female" ...
## $ grade : chr [1:13583] "9" "9" "9" "9" ...
## $ hispanic : chr [1:13583] "not" "not" "hispanic" "not" ...
## $ race : chr [1:13583] "Black or African American" "Black or African American" "Native Hawaiian or Other Pacific Islander" "Black or African American" ...
## $ height : num [1:13583] NA NA 1.73 1.6 1.5 1.57 1.65 1.88 1.75 1.37 ...
## $ weight : num [1:13583] NA NA 84.4 55.8 46.7 ...
## $ helmet_12m : chr [1:13583] "never" "never" "never" "never" ...
## $ text_while_driving_30d : chr [1:13583] "0" NA "30" "0" ...
## $ physically_active_7d : int [1:13583] 4 2 7 0 2 1 4 4 5 0 ...
## $ hours_tv_per_school_day : chr [1:13583] "5+" "5+" "5+" "2" ...
## $ strength_training_7d : int [1:13583] 0 0 0 0 1 0 2 0 3 0 ...
## $ school_night_hours_sleep: chr [1:13583] "8" "6" "<5" "6" ...
# Keep only complete cases: any row with an NA in any column is dropped.
yrbss1 <- na.omit(yrbss)

# Mean age per gender on the complete-case data (base R).
# The grouping list is left unnamed, so the result columns print as
# `Group.1` (gender) and `x` (mean age).
aggregate(
  x = yrbss1$age,
  by = list(yrbss1$gender),
  FUN = mean
)
## Group.1 x
## 1 female 16.15362
## 2 male 16.28290
# Or, equivalently, compute the same group means with dplyr:
library(dplyr)
##
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
##
## filter, lag
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
# Mean age per gender using dplyr verbs on the complete-case data.
# The summary expression is left unnamed so the column prints as `mean(age)`.
summarise(
  group_by(yrbss1, gender),
  mean(age)
)
## # A tibble: 2 × 2
## gender `mean(age)`
## <chr> <dbl>
## 1 female 16.2
## 2 male 16.3
# Simulate the sampling distribution of the mean.
# A synthetic population of 10,000 normal draws (mean 3.75, sd 9) is
# resampled with replacement into `n_samples` samples of `sample_size`
# observations each; the mean of every sample is then plotted.
set.seed(123) # fixed seed so the simulated values are reproducible
n_samples <- 1000L
sample_size <- 100L
pop <- rnorm(10000, mean = 3.75, sd = 9)

# One sample per row: n_samples rows x sample_size columns.
samples <- matrix(
  sample(pop, size = n_samples * sample_size, replace = TRUE),
  nrow = n_samples
)
sample_means <- rowMeans(samples)

# The title is built from n_samples so it always matches the number of
# means plotted (the previous hard-coded title said 100 while 1000 were drawn).
hist(
  sample_means,
  breaks = 30,
  main = paste("Histogram of", n_samples, "Sample Means"),
  xlab = "Sample Mean",
  col = "skyblue"
)