R Markdown

Question A

# Load Marathon.csv: fields are separated by semicolons, decimals are written
# with a comma, and the first row holds the column names.
mydata <- read.table(
  file = "Marathon.csv",
  header = TRUE,
  sep = ";",
  dec = ","
)

# Preview the first rows to check that the import worked.
head(mydata)
##   ID Weight Height Pressure Beat Hemoglobin Hematocrit Cholesterol Glucose
## 1  1     72  179.0      105   64        160         50         4.9     4.7
## 2  2     68  178.0      105   60        158         51         4.8     4.9
## 3  3     64  174.0      109   54        155         51         4.5     7.0
## 4  4     63  174.0      112   54        153         58         8.0     7.2
## 5  5     61  173.5      100   53        152         59         4.6     6.7
## 6  6     60  173.0       99   53        158         49         3.9     6.0
##   Gender
## 1      1
## 2      0
## 3      0
## 4      0
## 5      0
## 6      0

Question B

Question C

# Arithmetic mean of the Height column.
mean(mydata[["Height"]])
## [1] 176.9571

The average height of the people in the sample is 176.96 cm.

# Sample standard deviation of the Height column.
sd(mydata[["Height"]])
## [1] 5.85156

The standard deviation, which is a measure of variability, equals 5.85 cm. Assuming that height is normally distributed, about 68.3% of people are expected to have a height within 176.96 cm ± 5.85 cm (i.e., between 171.11 cm and 182.81 cm).

# Recode Gender from its 0/1 coding into a labelled factor (0 -> "F", 1 -> "M").
mydata$Gender <- factor(
  mydata$Gender,
  levels = c(0, 1),
  labels = c("F", "M")
)
library(psych)
# Descriptive statistics of Glucose, reported separately for each Gender level.
describeBy(mydata$Glucose, group = mydata$Gender)
## 
##  Descriptive statistics by group 
## group: F
##    vars  n mean   sd median trimmed  mad min max range skew kurtosis   se
## X1    1 14 5.96 0.93    5.8    5.97 1.33 4.6 7.2   2.6 0.12    -1.62 0.25
## ------------------------------------------------------------ 
## group: M
##    vars  n mean  sd median trimmed  mad min max range skew kurtosis   se
## X1    1 21 4.54 0.7    4.6    4.45 0.74 3.8   6   2.2 0.97    -0.13 0.15

Question F

library(pastecs)
# Descriptive statistics (median, mean, SE, CI, variance, sd, coefficient of
# variation) for every measurement column.
# - ID and Gender are excluded by name rather than by position (1 and 10), so
#   the call keeps working if the column order changes.
# - `basic = FALSE` states explicitly that the basic block is omitted; the
#   previous positional `-1` had the same effect but hid the intent.
stat.desc(
  mydata[, !(names(mydata) %in% c("ID", "Gender")), drop = FALSE],
  basic = FALSE
)
##                  Weight       Height     Pressure        Beat   Hemoglobin
## median       68.0000000 177.00000000 108.00000000 55.00000000 157.00000000
## mean         67.8571429 176.95714286 109.65714286 56.20000000 155.57142857
## SE.mean       1.2984431   0.98909419   1.79258175  0.67213444   1.44552960
## CI.mean.0.95  2.6387538   2.01008124   3.64296442  1.36594153   2.93766959
## var          59.0084034  34.24075630 112.46722689 15.81176471  73.13445378
## std.dev       7.6816927   5.85156016  10.60505667  3.97640097   8.55186844
## coef.var      0.1132039   0.03306767   0.09671104  0.07075447   0.05497069
##               Hematocrit Cholesterol   Glucose
## median       51.00000000   4.7000000 4.8000000
## mean         51.45714286   4.7885714 5.1042857
## SE.mean       0.81924628   0.1692679 0.1786783
## CI.mean.0.95  1.66490875   0.3439938 0.3631180
## var          23.49075630   1.0028067 1.1174076
## std.dev       4.84672635   1.0014024 1.0570750
## coef.var      0.09418957   0.2091234 0.2070956