library(dplyr)
## 
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(ggplot2)

Data Prep

NHIS_DATA<-read.csv("C:/Users/12055/Downloads/SD4 NHIS Data ALT.csv")
NHIS_Data<-NHIS_DATA%>%
  mutate(K6= ifelse(K6>=99, NA,
         ifelse(K6<5,"Low Risk",
                   ifelse(K6>=5 & K6<13,"Moderate Risk", NA 
                   ))),
sexorien= ifelse(sexorien==1,"GayOrLesbian",
                ifelse(sexorien==2,"Straight",
                       ifelse(sexorien==3, "Bisexual",
                              ifelse(sexorien==4, "Other", NA)))),
health= ifelse(health==1, "Excellent",
                        ifelse(health==2, "Very Good",
                ifelse(health==3,"Good",
                        ifelse(health==4,"Fair",NA
                        )))),
 health=factor(health, levels=c("Excellent", "Very Good", "Good", "Fair", "Poor")))%>%
  rename(K6Category= K6) 

Mean K6 Score

NHIS_DATA%>%
  filter(!is.na(health))%>%
 summarize(averageK6=mean(K6))
##   averageK6
## 1  6.266265

Percent health & sexual orientation

NHIS_Data=na.omit(NHIS_Data)

table(NHIS_Data$health)%>%
  prop.table()
## 
## Excellent Very Good      Good      Fair      Poor 
## 0.2728631 0.3398502 0.2811228 0.1061639 0.0000000
table(NHIS_Data$sexorien)%>%
  prop.table()
## 
##     Bisexual GayOrLesbian        Other     Straight 
##  0.008097341  0.016584394  0.002976964  0.972341301