library(tidyverse)
## Warning: package 'ggplot2' was built under R version 4.0.4
library(openintro)

Load the youth risk dataset

CSV file: https://vincentarelbundock.github.io/Rdatasets/csv/Stat2Data/YouthRisk2009.csv

library(tidyverse)

# Build the full path to the CSV rather than calling setwd(): changing the
# working directory is a global side effect, and knitr restores it after the
# chunk finishes, so later chunks cannot rely on it anyway.
# Edit `data_dir` to point at the folder that holds YouthRisk2009.csv.
data_dir <- "C:/AarynZimmerman/Biostatistics Project"
youth <- read.csv(file.path(data_dir, "YouthRisk2009.csv"))

# Print a compact overview of the data: one line per column
glimpse(youth)
## Rows: 500
## Columns: 7
## $ X           <int> 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, ...
## $ Sleep       <chr> "", "8 hours", "5 hours", "5 hours", "7 hours", "4 or l...
## $ Sleep7      <int> NA, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1, ...
## $ SmokeLife   <chr> "No", "Yes", "Yes", "Yes", "Yes", "No", "No", "No", "Ye...
## $ SmokeDaily  <chr> "", "Yes", "Yes", "Yes", "No", "No", "No", "No", "No", ...
## $ MarijuaEver <int> 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 1...
## $ Age         <int> 16, 16, 17, 18, 17, 15, 17, 17, 16, 16, 18, 15, 15, 16,...
# Open `youth` in a data viewer for browsing.
# NOTE(review): view() presumably comes from tibble (attached via tidyverse)
# and is aimed at interactive sessions; confirm it is wanted in a knitted
# report.
view(youth)

LS0tDQp0aXRsZTogIllvdXRoIFJpc2sgQmVoYXZpb3IiDQphdXRob3I6ICJBYXJ5biBaaW1tZXJtYW4iDQpkYXRlOiAiYHIgU3lzLkRhdGUoKWAiDQpvdXRwdXQ6IG9wZW5pbnRybzo6bGFiX3JlcG9ydA0KLS0tDQoNCmBgYHtyIGxvYWQtcGFja2FnZXMsIG1lc3NhZ2U9RkFMU0V9DQpsaWJyYXJ5KHRpZHl2ZXJzZSkNCmxpYnJhcnkob3BlbmludHJvKQ0KYGBgDQoNCiMjIyBMb2FkIHRoZSB5b3V0aCByaXNrIGRhdGFzZXQNCiMjIyBTb3VyY2U6IGh0dHBzOi8vdmluY2VudGFyZWxidW5kb2NrLmdpdGh1Yi5pby9SZGF0YXNldHMvZG9jL1N0YXQyRGF0YS9Zb3V0aFJpc2syMDA5Lmh0bWwNCiMjIyBDU1YgZmlsZTogIGh0dHBzOi8vdmluY2VudGFyZWxidW5kb2NrLmdpdGh1Yi5pby9SZGF0YXNldHMvY3N2L1N0YXQyRGF0YS9Zb3V0aFJpc2syMDA5LmNzdg0KDQoNCg0KYGBge3IgY29kZS1jaHVuay1sYWJlbH0NCmxpYnJhcnkodGlkeXZlcnNlKQ0Kc2V0d2QoIkM6L0FhcnluWmltbWVybWFuL0Jpb3N0YXRpc3RpY3MgUHJvamVjdCIpDQp5b3V0aCA8LXJlYWQuY3N2KCJZb3V0aFJpc2syMDA5LmNzdiIpDQpgYGANCmBgYHtyfQ0KI3ZpZXcgdGhlIGRhdGENCmdsaW1wc2UoeW91dGgpDQoNCmBgYA0KYGBge3J9DQp2aWV3KHlvdXRoKQ0KYGBgDQoNCg0KLi4uDQoNCg==