Please create an Rmd file and an HTML file using the R code above (Q16). (Put your name for “Author”.)
# Read yrbs2019.csv from the exam folder.
# NOTE(review): setwd() ties this script to one machine's folder layout;
# kept as-is because later code may rely on the working directory.
setwd("~/UB/CEP525/FinalExam")
data <- read.csv("yrbs2019.csv")

# Keep columns 1-5 and 100-122 (q1-q5 and qn8-qn30 in the str() output),
# then lower-case the column names.
df <- data[c(1:5, 100:122)]
names(df) <- tolower(names(df))
str(df)
## 'data.frame': 13677 obs. of 28 variables:
## $ q1 : chr "16 years old" "15 years old" "15 years old" "15 years old" ...
## $ q2 : chr "Male" "Male" "Female" "Male" ...
## $ q3 : chr "10th grade" "10th grade" "10th grade" "10th grade" ...
## $ q4 : chr "Yes" "No" "No" "No" ...
## $ q5 : chr "A" "A D" " B E" " E" ...
## $ qn8 : int 2 2 2 2 2 2 2 2 2 1 ...
## $ qn9 : int 2 1 2 2 2 2 2 2 1 2 ...
## $ qn10: int 2 2 2 NA NA NA 2 NA NA 2 ...
## $ qn11: int 2 2 2 NA NA NA 1 NA NA 1 ...
## $ qn12: int 2 2 2 2 2 2 2 2 2 2 ...
## $ qn13: int 2 2 2 2 2 2 2 2 2 2 ...
## $ qn14: int 2 2 2 2 2 2 2 2 2 2 ...
## $ qn15: int 2 2 2 2 2 1 2 2 2 2 ...
## $ qn16: int 2 2 2 2 2 2 2 1 2 2 ...
## $ qn17: int 2 2 2 2 2 2 1 2 2 1 ...
## $ qn18: int 2 2 2 2 2 2 2 2 2 2 ...
## $ qn19: int 2 2 2 2 2 2 2 2 2 2 ...
## $ qn20: int 2 2 2 2 2 2 2 2 2 2 ...
## $ qn21: int 2 2 NA 2 NA NA 2 2 2 2 ...
## $ qn22: int 2 2 NA 2 NA NA 2 2 2 2 ...
## $ qn23: int 2 1 2 2 2 1 1 NA 1 2 ...
## $ qn24: int 2 2 2 2 2 2 2 NA 1 2 ...
## $ qn25: int 2 2 2 1 2 1 1 NA 1 1 ...
## $ qn26: int 2 2 2 2 2 1 1 NA 1 2 ...
## $ qn27: int 2 2 2 2 2 1 1 NA 1 2 ...
## $ qn28: int 2 2 2 2 2 2 1 NA 2 2 ...
## $ qn29: int 2 2 2 2 2 2 2 2 2 2 ...
## $ qn30: int 2 2 2 1 2 2 2 2 2 2 ...
dim(df)
## [1] 13677 28

# Recode blank answers in the five demographic columns (q1-q5) as NA and
# store each column as a factor.
#
# An exact `== ""` comparison is not enough: in the summary() output recorded
# below, q5 keeps an unlabeled level with 1245 rows and shows no NA's row, so
# its blanks are presumably whitespace-only strings rather than zero-length
# ones (TODO confirm against the raw file). Whitespace-only strings are
# therefore matched as well. Non-blank values are NOT trimmed, so the
# existing factor levels are unchanged.
#
# NOTE: the recorded summary() output below predates this change; re-knit to
# refresh the q5 column (the unlabeled level becomes NA's).
df[, 1:5] <- lapply(df[, 1:5], function(x) {
  # trimws() leaves NA as NA and nzchar(NA) is TRUE, so values that are
  # already missing are never selected here.
  x[!nzchar(trimws(x))] <- NA
  factor(x)
})
summary(df[, 1:5])
## q1 q2 q3
## 16 years old :3628 Female:6885 10th grade :3717
## 15 years old :3473 Male :6641 11th grade :3322
## 17 years old :3102 NA's : 151 12th grade :2850
## 14 years old :1699 9th grade :3637
## 18 years old or older:1616 Ungraded or other grade: 39
## (Other) : 87 NA's : 112
## NA's : 72
## q4 q5
## No :10342 E :8000
## Yes : 3044 C :2279
## NA's: 291 :1245
## B : 672
## A : 385
## C E : 261
## (Other): 835