Analysis of Body Type with Gender

Nikitha Nair s3790431

Last updated: 27 October, 2019

Introduction

Introduction Cont.

Problem Statement

Data

Data Cont.

Descriptive Statistics and Visualisation

BODY_MEASUREMENTS <- read.csv("C:/Users/Niki/Desktop/Statistics/Assignment3/500-person-gender-height-weight-bodymassindex/500_Person_Gender_Height_Weight_Index.csv",stringsAsFactors = FALSE)
head(BODY_MEASUREMENTS)
summary(BODY_MEASUREMENTS)
##     Gender              Height          Weight        Index      
##  Length:500         Min.   :140.0   Min.   : 50   Min.   :0.000  
##  Class :character   1st Qu.:156.0   1st Qu.: 80   1st Qu.:3.000  
##  Mode  :character   Median :170.5   Median :106   Median :4.000  
##                     Mean   :169.9   Mean   :106   Mean   :3.748  
##                     3rd Qu.:184.0   3rd Qu.:136   3rd Qu.:5.000  
##                     Max.   :199.0   Max.   :160   Max.   :5.000
BODY_MEASUREMENTS= BODY_MEASUREMENTS %>% filter(BODY_MEASUREMENTS$Gender!='unknown') 
BODY_MEASUREMENTS$Gender <- factor(BODY_MEASUREMENTS$Gender, levels=c("Male","Female"), 
                            labels = c("MALE","FEMALE"))
BODY_MEASUREMENTS
BODY_MEASUREMENTS$Index <- factor(BODY_MEASUREMENTS$Index, levels=c("0","1","2","3","4","5"), 
                                   labels = c("Extremely Weak","Weak","Normal","Overweight","Obesity","Extreme Obesity"))
colSums(is.na(BODY_MEASUREMENTS))
## Gender Height Weight  Index 
##      0      0      0      0

Decsriptive Statistics Cont.

table(BODY_MEASUREMENTS$Index,BODY_MEASUREMENTS$Gender)
##                  
##                   MALE FEMALE
##   Extremely Weak     6      7
##   Weak              15      7
##   Normal            28     41
##   Overweight        32     36
##   Obesity           59     71
##   Extreme Obesity  105     93
BODYTYPE = table(BODY_MEASUREMENTS$Index,BODY_MEASUREMENTS$Gender) %>% prop.table()
barplot(BODYTYPE,main="Gender with BodyType",ylab="Different Body Type proportion With Gender",
        ylim=c(0,.6),
        legend=rownames(BODYTYPE),beside=TRUE,
        args.legend=c(x = "topright",horiz=FALSE,title="BODY TYPE"),xlab="Gender", col = brewer.pal(5, name = "Blues"))

Hypothesis Testing

CHI <- chisq.test(table(BODY_MEASUREMENTS$Index,BODY_MEASUREMENTS$Gender)) 
CHI
## 
##  Pearson's Chi-squared test
## 
## data:  table(BODY_MEASUREMENTS$Index, BODY_MEASUREMENTS$Gender)
## X-squared = 7.3085, df = 5, p-value = 0.1987
CHI$observed
##                  
##                   MALE FEMALE
##   Extremely Weak     6      7
##   Weak              15      7
##   Normal            28     41
##   Overweight        32     36
##   Obesity           59     71
##   Extreme Obesity  105     93
CHI$expected
##                  
##                    MALE FEMALE
##   Extremely Weak   6.37   6.63
##   Weak            10.78  11.22
##   Normal          33.81  35.19
##   Overweight      33.32  34.68
##   Obesity         63.70  66.30
##   Extreme Obesity 97.02 100.98
qchisq(p = .95,df = 5)
## [1] 11.0705
pchisq(q = 7.3085,df = 5,lower.tail = FALSE)
## [1] 0.1986891

Hypthesis Testing Cont.

Discussion

References