Librerias

library(readxl)
library(dplyr)
## 
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(MASS)
## 
## Attaching package: 'MASS'
## The following object is masked from 'package:dplyr':
## 
##     select
library(ggplot2)

Importar datos

data<-read_excel('C:/Users/rusoc/OneDrive/Escritorio/TEC/Mineria de datos/Diet.xlsx')
str(data)
## tibble [78 × 4] (S3: tbl_df/tbl/data.frame)
##  $ gender      : chr [1:78] "M" "M" "F" "F" ...
##  $ Diet        : chr [1:78] "B" "B" "A" "A" ...
##  $ weight      : num [1:78] 60 103 58 60 64 64 65 66 67 69 ...
##  $ weight6weeks: num [1:78] 60 103 54.2 54 63.3 61.1 62.2 64 65 60.5 ...
table(data$Diet)
## 
##  A  B  C 
## 24 27 27

Vamos a crear una nueva columna para ver la perdida de peso que hubo en las 6 semanas.

data2 <- data%>% mutate(perdida_peso= data$weight-data$weight6weeks)
data2
## # A tibble: 78 × 5
##    gender Diet  weight weight6weeks perdida_peso
##    <chr>  <chr>  <dbl>        <dbl>        <dbl>
##  1 M      B         60         60          0    
##  2 M      B        103        103          0    
##  3 F      A         58         54.2        3.80 
##  4 F      A         60         54          6    
##  5 F      A         64         63.3        0.700
##  6 F      A         64         61.1        2.9  
##  7 F      A         65         62.2        2.80 
##  8 F      A         66         64          2    
##  9 F      A         67         65          2    
## 10 F      A         69         60.5        8.5  
## # ℹ 68 more rows
aggregate(perdida_peso~Diet, data = data2, FUN = mean)
##   Diet perdida_peso
## 1    A     3.300000
## 2    B     3.025926
## 3    C     5.148148

Creamos boxplox

ggplot(data = data2, aes(x=Diet, y=perdida_peso, color=Diet)) + geom_boxplot() + theme_bw()

anova = aov(data2$perdida_peso ~ data2$Diet)
summary(anova)
##             Df Sum Sq Mean Sq F value  Pr(>F)   
## data2$Diet   2   71.1   35.55   6.197 0.00323 **
## Residuals   75  430.2    5.74                   
## ---
## Signif. codes:  0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1

H0: σ1= σ2= σ3=…… σC = 0 (son iguales) H1: No todas las σj son 0 (no son iguales)

Resultado= Rechazamos la H0, el p-value es menor a 0.05