# Kelompok 1 - Analisis Multivariat, Topik 5 (MANOVA), Sains Data 2023E
# Dosen Pembimbing: Ike Fitriyaningsih, M.Si
# Load library
library(ggplot2)
## Warning: package 'ggplot2' was built under R version 4.4.2
library(corrplot)
## Warning: package 'corrplot' was built under R version 4.4.3
## corrplot 0.95 loaded
library(car)
## Warning: package 'car' was built under R version 4.4.3
## Loading required package: carData
## Warning: package 'carData' was built under R version 4.4.3
library(dplyr)
## Warning: package 'dplyr' was built under R version 4.4.2
##
## Attaching package: 'dplyr'
## The following object is masked from 'package:car':
##
## recode
## The following objects are masked from 'package:stats':
##
## filter, lag
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
library(MVN)
## Warning: package 'MVN' was built under R version 4.4.3
library(biotools)
## Warning: package 'biotools' was built under R version 4.4.3
## Loading required package: MASS
## Warning: package 'MASS' was built under R version 4.4.3
##
## Attaching package: 'MASS'
## The following object is masked from 'package:dplyr':
##
## select
## ---
## biotools version 4.3
# Read the log-transformed dataset; string columns are imported as factors.
# NOTE(review): the path is absolute and specific to one machine - confirm it
# exists wherever this script is run.
df <- read.csv(
  file = "C:/Users/shoba/OneDrive/Dokumen/Annas/TUGAS KULIAH/SEMESTER 4/ANALISIS MULTIVARIAT/UAS/hasil_transformasi_log.csv",
  stringsAsFactors = TRUE
)
# Ensure both grouping variables are factors, whatever type they were read as.
df[c("Attrition", "JobRole")] <- lapply(df[c("Attrition", "JobRole")], as.factor)
# Keep only the columns used by the analysis: the two factors and the
# log-transformed numeric variables.
data_manova <- df[c(
  "Attrition", "JobRole", "Age_log",
  "YearsWithCurrManager_log", "TotalWorkingYears_log", "YearsAtCompany_log"
)]
# Pearson correlation between the three dependent variables.
dependent_vars <- df[c(
  "YearsWithCurrManager_log",
  "TotalWorkingYears_log",
  "YearsAtCompany_log"
)]
cor_matrix <- cor(x = dependent_vars, method = "pearson")
# Plot the correlation matrix as coloured cells with the coefficients printed
# in black on top.
corrplot(
  corr = cor_matrix,
  method = "color",
  addCoef.col = "black",
  tl.cex = 0.8,
  number.cex = 0.7
)
# Bar chart of the row count per Attrition level (levels on the x axis).
ggplot(data = df, mapping = aes(x = Attrition)) +
  geom_bar(fill = "steelblue") +
  labs(title = "Distribusi Attrition")
# Bar chart of the row count per JobRole level; the role is mapped to the
# y axis, so the bars run horizontally.
ggplot(data = df, mapping = aes(y = JobRole)) +
  geom_bar(fill = "darkgreen") +
  labs(title = "Distribusi JobRole")
# Names of the numeric (log-transformed) variables to plot.
num_cols <- c("YearsWithCurrManager_log", "TotalWorkingYears_log", "YearsAtCompany_log")
# Draw one boxplot per numeric variable.
for (col in num_cols) {
  # `.data[[col]]` looks the column up by its string name. It replaces
  # `aes_string()`, which has been deprecated since ggplot2 3.0.0 and emitted a
  # deprecation warning here.
  # The x-axis label is set explicitly so it remains the plain column name, as
  # it was with `aes_string()`.
  p <- ggplot(df, aes(x = .data[[col]])) +
    geom_boxplot(fill = "tomato") +
    labs(x = col) +
    ggtitle(paste("Boxplot", col)) +
    theme_minimal()
  # Inside a loop a ggplot object is not auto-printed, so print it explicitly.
  print(p)
}
# Auxiliary linear model, fitted only so that variance inflation factors can be
# computed for the two factors used as predictors.
model_vif <- lm(
  formula = YearsAtCompany_log ~ Attrition + JobRole,
  data = data_manova
)
# Compute and display the VIF for each term of the auxiliary model.
car::vif(model_vif)
## GVIF Df GVIF^(1/(2*Df))
## Attrition 1.053785 1 1.02654
## JobRole 1.053785 8 1.00328
# Extract the three dependent variables.
y_vars <- data_manova[c(
  "YearsWithCurrManager_log",
  "TotalWorkingYears_log",
  "YearsAtCompany_log"
)]
# Multivariate normality check on the dependent variables (Royston test).
MVN::mvn(data = y_vars, mvnTest = "royston")
## $multivariateNormality
## Test H p value MVN
## 1 Royston 286.984 3.596275e-62 NO
##
## $univariateNormality
## Test Variable Statistic p value Normality
## 1 Anderson-Darling YearsWithCurrManager_log 41.2963 <0.001 NO
## 2 Anderson-Darling TotalWorkingYears_log 30.2756 <0.001 NO
## 3 Anderson-Darling YearsAtCompany_log 19.0728 <0.001 NO
##
## $Descriptives
## n Mean Std.Dev Median Min Max 25th
## YearsWithCurrManager_log 1253 1.262275 0.7765269 1.098612 0 2.708050 1.098612
## TotalWorkingYears_log 1253 2.123745 0.6082434 2.302585 0 3.091042 1.791759
## YearsAtCompany_log 1253 1.682448 0.6692273 1.791759 0 2.890372 1.098612
## 75th Skew Kurtosis
## YearsWithCurrManager_log 2.079442 -0.3306121 -0.9572467
## TotalWorkingYears_log 2.484907 -1.0514642 1.0581523
## YearsAtCompany_log 2.197225 -0.5473811 -0.3451232
# Box's M test of the dependent variables, grouped by Attrition.
# NOTE(review): only Attrition is used for grouping here, while the MANOVA
# model further down also includes JobRole - confirm this is intended.
biotools::boxM(
  data = y_vars,
  grouping = data_manova[["Attrition"]]
)
##
## Box's M-test for Homogeneity of Covariance Matrices
##
## data: y_vars
## Chi-Sq (approx.) = 38.684, df = 6, p-value = 8.256e-07
# Scatterplot matrix of the dependent variables, with a smoothed curve in each
# panel, to inspect whether the pairwise relationships look linear.
pairs(
  x = y_vars,
  panel = panel.smooth,
  main = "Scatterplot Matrix - Linearitas"
)
# Fit the MANOVA: the three log-transformed responses are bound into one
# response matrix and modelled by Attrition and JobRole (main effects only).
# NOTE(review): the tests reported by summary() presumably follow the order of
# the terms in the formula - confirm the ordering is intended.
manova_model <- manova(
  formula = cbind(YearsWithCurrManager_log, TotalWorkingYears_log, YearsAtCompany_log) ~
    Attrition + JobRole,
  data = data_manova
)
# Summarise the fit using Wilks' lambda as the test statistic.
summary(object = manova_model, test = "Wilks")
## Df Wilks approx F num Df den Df Pr(>F)
## Attrition 1 0.92517 33.459 3 1241.0 < 2.2e-16 ***
## JobRole 8 0.77716 13.622 24 3599.9 < 2.2e-16 ***
## Residuals 1243
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
# 1. YearsWithCurrManager_log
# One-way ANOVA of the response on JobRole, followed by Tukey HSD pairwise
# comparisons between job roles at the 95% family-wise confidence level.
# NOTE(review): this post-hoc model contains JobRole only, whereas the MANOVA
# model also includes Attrition - confirm this is intended.
aov_mgr <- aov(
  formula = YearsWithCurrManager_log ~ JobRole,
  data = data_manova
)
tukey_mgr <- TukeyHSD(aov_mgr, which = "JobRole", conf.level = 0.95)
print(tukey_mgr)
## Tukey multiple comparisons of means
## 95% family-wise confidence level
##
## Fit: aov(formula = YearsWithCurrManager_log ~ JobRole, data = data_manova)
##
## $JobRole
## diff lwr
## Human Resources-Healthcare Representative -0.17093286 -0.56782843
## Laboratory Technician-Healthcare Representative -0.23511538 -0.50425630
## Manager-Healthcare Representative -0.08639629 -0.65462039
## Manufacturing Director-Healthcare Representative 0.14796548 -0.16097201
## Research Director-Healthcare Representative 0.27621941 -0.17797620
## Research Scientist-Healthcare Representative -0.19371075 -0.45804049
## Sales Executive-Healthcare Representative 0.09169211 -0.17130153
## Sales Representative-Healthcare Representative -0.61650728 -0.95767704
## Laboratory Technician-Human Resources -0.06418251 -0.42232894
## Manager-Human Resources 0.08453657 -0.53085815
## Manufacturing Director-Human Resources 0.31889835 -0.07004175
## Research Director-Human Resources 0.44715228 -0.06482984
## Research Scientist-Human Resources -0.02277788 -0.37732301
## Sales Executive-Human Resources 0.26262498 -0.09092514
## Sales Representative-Human Resources -0.44557441 -0.86057904
## Manager-Laboratory Technician 0.14871908 -0.39314936
## Manufacturing Director-Laboratory Technician 0.38308086 0.12581611
## Research Director-Laboratory Technician 0.51133479 0.09057781
## Research Scientist-Laboratory Technician 0.04140463 -0.16012204
## Sales Executive-Laboratory Technician 0.32680749 0.12703653
## Sales Representative-Laboratory Technician -0.38139190 -0.67658606
## Manufacturing Director-Manager 0.23436178 -0.32833436
## Research Director-Manager 0.36261571 -0.29120248
## Research Scientist-Manager -0.10731445 -0.64680939
## Sales Executive-Manager 0.17808841 -0.36075315
## Sales Representative-Manager -0.53011098 -1.11112852
## Research Director-Manufacturing Director 0.12825393 -0.31900659
## Research Scientist-Manufacturing Director -0.34167623 -0.59390337
## Sales Executive-Manufacturing Director -0.05627337 -0.30709994
## Sales Representative-Manufacturing Director -0.76447276 -1.09635395
## Research Scientist-Research Director -0.46993016 -0.88762600
## Sales Executive-Research Director -0.18452730 -0.60137890
## Sales Representative-Research Director -0.89272669 -1.36282924
## Sales Executive-Research Scientist 0.28540286 0.09216256
## Sales Representative-Research Scientist -0.42279653 -0.71361085
## Sales Representative-Sales Executive -0.70819939 -0.99779982
## upr p adj
## Human Resources-Healthcare Representative 0.22596270 0.9197163
## Laboratory Technician-Healthcare Representative 0.03402555 0.1436848
## Manager-Healthcare Representative 0.48182780 0.9999356
## Manufacturing Director-Healthcare Representative 0.45690297 0.8612000
## Research Director-Healthcare Representative 0.73041503 0.6210805
## Research Scientist-Healthcare Representative 0.07061900 0.3568647
## Sales Executive-Healthcare Representative 0.35468575 0.9766103
## Sales Representative-Healthcare Representative -0.27533751 0.0000009
## Laboratory Technician-Human Resources 0.29396392 0.9997765
## Manager-Human Resources 0.69993129 0.9999705
## Manufacturing Director-Human Resources 0.70783845 0.2103729
## Research Director-Human Resources 0.95913439 0.1439027
## Research Scientist-Human Resources 0.33176725 0.9999999
## Sales Executive-Human Resources 0.61617509 0.3378407
## Sales Representative-Human Resources -0.03056978 0.0245682
## Manager-Laboratory Technician 0.69058752 0.9951391
## Manufacturing Director-Laboratory Technician 0.64034561 0.0001420
## Research Director-Laboratory Technician 0.93209177 0.0052262
## Research Scientist-Laboratory Technician 0.24293130 0.9993831
## Sales Executive-Laboratory Technician 0.52657845 0.0000151
## Sales Representative-Laboratory Technician -0.08619774 0.0020573
## Manufacturing Director-Manager 0.79705791 0.9331706
## Research Director-Manager 1.01643390 0.7321371
## Research Scientist-Manager 0.43218049 0.9995139
## Sales Executive-Manager 0.71692997 0.9833046
## Sales Representative-Manager 0.05090656 0.1063304
## Research Director-Manufacturing Director 0.57551445 0.9934465
## Research Scientist-Manufacturing Director -0.08944908 0.0009178
## Sales Executive-Manufacturing Director 0.19455320 0.9988282
## Sales Representative-Manufacturing Director -0.43259156 0.0000000
## Research Scientist-Research Director -0.05223432 0.0143909
## Sales Executive-Research Director 0.23232430 0.9070256
## Sales Representative-Research Director -0.42262413 0.0000002
## Sales Executive-Research Scientist 0.47864316 0.0001692
## Sales Representative-Research Scientist -0.13198220 0.0002355
## Sales Representative-Sales Executive -0.41859896 0.0000000
# 2. TotalWorkingYears_log
# One-way ANOVA of the response on JobRole, followed by Tukey HSD pairwise
# comparisons between job roles at the 95% family-wise confidence level.
# NOTE(review): this post-hoc model contains JobRole only, whereas the MANOVA
# model also includes Attrition - confirm this is intended.
aov_total <- aov(
  formula = TotalWorkingYears_log ~ JobRole,
  data = data_manova
)
tukey_total <- TukeyHSD(aov_total, which = "JobRole", conf.level = 0.95)
print(tukey_total)
## Tukey multiple comparisons of means
## 95% family-wise confidence level
##
## Fit: aov(formula = TotalWorkingYears_log ~ JobRole, data = data_manova)
##
## $JobRole
## diff lwr
## Human Resources-Healthcare Representative -0.42917602 -0.712159016
## Laboratory Technician-Healthcare Representative -0.54579668 -0.737691765
## Manager-Healthcare Representative 0.27732115 -0.127817576
## Manufacturing Director-Healthcare Representative -0.11437378 -0.334643461
## Research Director-Healthcare Representative 0.21186279 -0.111974642
## Research Scientist-Healthcare Representative -0.51410423 -0.702568989
## Sales Executive-Healthcare Representative -0.15916546 -0.346677580
## Sales Representative-Healthcare Representative -1.04015704 -1.283408044
## Laboratory Technician-Human Resources -0.11662067 -0.371975884
## Manager-Human Resources 0.70649716 0.267726210
## Manufacturing Director-Human Resources 0.31480223 0.037491405
## Research Director-Human Resources 0.64103880 0.276000113
## Research Scientist-Human Resources -0.08492821 -0.337715733
## Sales Executive-Human Resources 0.27001056 0.017932475
## Sales Representative-Human Resources -0.61098102 -0.906875625
## Manager-Laboratory Technician 0.82311783 0.436770456
## Manufacturing Director-Laboratory Technician 0.43142290 0.247995422
## Research Director-Laboratory Technician 0.75765947 0.457663488
## Research Scientist-Laboratory Technician 0.03169245 -0.111994268
## Sales Executive-Laboratory Technician 0.38663123 0.244196312
## Sales Representative-Laboratory Technician -0.49436035 -0.704831162
## Manufacturing Director-Manager -0.39169493 -0.792892264
## Research Director-Manager -0.06545836 -0.531624908
## Research Scientist-Manager -0.79142538 -1.176080463
## Sales Executive-Manager -0.43648660 -0.820675836
## Sales Representative-Manager -1.31747818 -1.731738515
## Research Director-Manufacturing Director 0.32623657 0.007343802
## Research Scientist-Manufacturing Director -0.39973045 -0.579566156
## Sales Executive-Manufacturing Director -0.04479167 -0.223628788
## Sales Representative-Manufacturing Director -0.92578325 -1.162411590
## Research Scientist-Research Director -0.72596702 -1.023780432
## Sales Executive-Research Director -0.37102824 -0.668239719
## Sales Representative-Research Director -1.25201982 -1.587198756
## Sales Executive-Research Scientist 0.35493877 0.217160158
## Sales Representative-Research Scientist -0.52605281 -0.733400830
## Sales Representative-Sales Executive -0.88099158 -1.087474107
## upr p adj
## Human Resources-Healthcare Representative -0.146193017 0.0000947
## Laboratory Technician-Healthcare Representative -0.353901601 0.0000000
## Manager-Healthcare Representative 0.682459868 0.4552212
## Manufacturing Director-Healthcare Representative 0.105895894 0.7975895
## Research Director-Healthcare Representative 0.535700213 0.5205237
## Research Scientist-Healthcare Representative -0.325639474 0.0000000
## Sales Executive-Healthcare Representative 0.028346664 0.1721905
## Sales Representative-Healthcare Representative -0.796906032 0.0000000
## Laboratory Technician-Human Resources 0.138734551 0.8906316
## Manager-Human Resources 1.145268114 0.0000227
## Manufacturing Director-Human Resources 0.592113061 0.0129017
## Research Director-Human Resources 1.006077490 0.0000021
## Research Scientist-Human Resources 0.167859303 0.9814676
## Sales Executive-Human Resources 0.522088643 0.0252013
## Sales Representative-Human Resources -0.315086418 0.0000000
## Manager-Laboratory Technician 1.209465202 0.0000000
## Manufacturing Director-Laboratory Technician 0.614850378 0.0000000
## Research Director-Laboratory Technician 1.057655448 0.0000000
## Research Scientist-Laboratory Technician 0.175379172 0.9989641
## Sales Executive-Laboratory Technician 0.529066139 0.0000000
## Sales Representative-Laboratory Technician -0.283889547 0.0000000
## Manufacturing Director-Manager 0.009502405 0.0619265
## Research Director-Manager 0.400708186 0.9999650
## Research Scientist-Manager -0.406770292 0.0000000
## Sales Executive-Manager -0.052297372 0.0127727
## Sales Representative-Manager -0.903217852 0.0000000
## Research Director-Manufacturing Director 0.645129335 0.0403321
## Research Scientist-Manufacturing Director -0.219894740 0.0000000
## Sales Executive-Manufacturing Director 0.134045439 0.9974281
## Sales Representative-Manufacturing Director -0.689154919 0.0000000
## Research Scientist-Research Director -0.428153601 0.0000000
## Sales Executive-Research Director -0.073816767 0.0035233
## Sales Representative-Research Director -0.916840889 0.0000000
## Sales Executive-Research Scientist 0.492717389 0.0000000
## Sales Representative-Research Scientist -0.318704783 0.0000000
## Sales Representative-Sales Executive -0.674509053 0.0000000
# 3. YearsAtCompany_log
# One-way ANOVA of the response on JobRole, followed by Tukey HSD pairwise
# comparisons between job roles at the 95% family-wise confidence level.
# NOTE(review): this post-hoc model contains JobRole only, whereas the MANOVA
# model also includes Attrition - confirm this is intended.
aov_company <- aov(
  formula = YearsAtCompany_log ~ JobRole,
  data = data_manova
)
tukey_company <- TukeyHSD(aov_company, which = "JobRole", conf.level = 0.95)
print(tukey_company)
## Tukey multiple comparisons of means
## 95% family-wise confidence level
##
## Fit: aov(formula = YearsAtCompany_log ~ JobRole, data = data_manova)
##
## $JobRole
## diff lwr
## Human Resources-Healthcare Representative -0.179473386 -0.51674090
## Laboratory Technician-Healthcare Representative -0.320457696 -0.54916393
## Manager-Healthcare Representative -0.044252901 -0.52710922
## Manufacturing Director-Healthcare Representative 0.030186772 -0.23233715
## Research Director-Healthcare Representative 0.190758834 -0.19520020
## Research Scientist-Healthcare Representative -0.263114370 -0.48773225
## Sales Executive-Healthcare Representative 0.034032976 -0.18944952
## Sales Representative-Healthcare Representative -0.675725723 -0.96563947
## Laboratory Technician-Human Resources -0.140984310 -0.44532422
## Manager-Human Resources 0.135220485 -0.38771972
## Manufacturing Director-Human Resources 0.209660158 -0.12084710
## Research Director-Human Resources 0.370232220 -0.06483169
## Research Scientist-Human Resources -0.083640984 -0.38492063
## Sales Executive-Human Resources 0.213506363 -0.08692776
## Sales Representative-Human Resources -0.496252336 -0.84890828
## Manager-Laboratory Technician 0.276204795 -0.18425544
## Manufacturing Director-Laboratory Technician 0.350644467 0.13203017
## Research Director-Laboratory Technician 0.511216530 0.15367244
## Research Scientist-Laboratory Technician 0.057343325 -0.11390676
## Sales Executive-Laboratory Technician 0.354490672 0.18473253
## Sales Representative-Laboratory Technician -0.355268027 -0.60611336
## Manufacturing Director-Manager 0.074439673 -0.40371919
## Research Director-Manager 0.235011735 -0.32057935
## Research Scientist-Manager -0.218861469 -0.67730479
## Sales Executive-Manager 0.078285878 -0.37960222
## Sales Representative-Manager -0.631472822 -1.12520055
## Research Director-Manufacturing Director 0.160572063 -0.21949378
## Research Scientist-Manufacturing Director -0.293301142 -0.50763466
## Sales Executive-Manufacturing Director 0.003846205 -0.20929716
## Sales Representative-Manufacturing Director -0.705912494 -0.98793315
## Research Scientist-Research Director -0.453873205 -0.80881605
## Sales Executive-Research Director -0.156725858 -0.51095129
## Sales Representative-Research Director -0.866484557 -1.26596073
## Sales Executive-Research Scientist 0.297147347 0.13293871
## Sales Representative-Research Scientist -0.412611352 -0.65973486
## Sales Representative-Sales Executive -0.709758699 -0.95585069
## upr p adj
## Human Resources-Healthcare Representative 0.15779413 0.7746607
## Laboratory Technician-Healthcare Representative -0.09175146 0.0004908
## Manager-Healthcare Representative 0.43860342 0.9999987
## Manufacturing Director-Healthcare Representative 0.29271069 0.9999926
## Research Director-Healthcare Representative 0.57671787 0.8385656
## Research Scientist-Healthcare Representative -0.03849649 0.0086532
## Sales Executive-Healthcare Representative 0.25751547 0.9999349
## Sales Representative-Healthcare Representative -0.38581197 0.0000000
## Laboratory Technician-Human Resources 0.16335560 0.8824082
## Manager-Human Resources 0.65816069 0.9967831
## Manufacturing Director-Human Resources 0.54016741 0.5639844
## Research Director-Human Resources 0.80529613 0.1695560
## Research Scientist-Human Resources 0.21763866 0.9947421
## Sales Executive-Human Resources 0.51394048 0.4008358
## Sales Representative-Human Resources -0.14359639 0.0004520
## Manager-Laboratory Technician 0.73666503 0.6389447
## Manufacturing Director-Laboratory Technician 0.56925877 0.0000251
## Research Director-Laboratory Technician 0.86876062 0.0003304
## Research Scientist-Laboratory Technician 0.22859341 0.9818546
## Sales Executive-Laboratory Technician 0.52424882 0.0000000
## Sales Representative-Laboratory Technician -0.10442269 0.0003987
## Manufacturing Director-Manager 0.55259853 0.9999229
## Research Director-Manager 0.79060282 0.9272106
## Research Scientist-Manager 0.23958185 0.8633832
## Sales Executive-Manager 0.53617398 0.9998431
## Sales Representative-Manager -0.13774510 0.0024205
## Research Director-Manufacturing Director 0.54063790 0.9276903
## Research Scientist-Manufacturing Director -0.07896762 0.0007641
## Sales Executive-Manufacturing Director 0.21698957 1.0000000
## Sales Representative-Manufacturing Director -0.42389184 0.0000000
## Research Scientist-Research Director -0.09893036 0.0024285
## Sales Executive-Research Director 0.19749958 0.9072720
## Sales Representative-Research Director -0.46700838 0.0000000
## Sales Executive-Research Scientist 0.46135598 0.0000008
## Sales Representative-Research Scientist -0.16548784 0.0000088
## Sales Representative-Sales Executive -0.46366671 0.0000000