Tutorial:https://github.com/immerse-ucsb/lca_enum Package:https://cran.r-project.org/web/packages/MplusAutomation/index.html ————————————————————————

#DATA ##Load packages

##Variable LPA RESS = ress_rum, ress_eng, ress_reap, ress_sup, ress_rel, ress_dis average frequency of use of each strategy (average of 4 items per strategy)

##Prepare Data

# Load your dataset
getwd()
[1] "C:/Users/Lenovo/Documents/data"

#Descriptive Analysis

Descriptive Statistics for Continuous Variables
Variable N Mean SD Min Max Median
ress_rum 244 4.34 1.51 1 7.00 4.50
ress_eng 244 2.73 1.18 1 6.25 2.50
ress_reap 244 3.75 1.33 1 7.00 3.75
ress_sup 244 4.12 1.64 1 7.00 4.00
ress_rel 244 3.36 1.54 1 7.00 3.25
ress_dis 244 4.18 1.63 1 7.00 4.25
descriptives_table <- purrr::map_dfr(
  c("ress_rum", "ress_eng", "ress_reap", "ress_sup", "ress_rel", "ress_dis"),
  ~ df_ress %>%
    summarise(
      variable = .x,
      n    = sum(!is.na(.data[[.x]])),
      mean = mean(.data[[.x]], na.rm = TRUE),
      sd   = sd(.data[[.x]], na.rm = TRUE),
      min  = min(.data[[.x]], na.rm = TRUE),
      max  = max(.data[[.x]], na.rm = TRUE),
      med  = median(.data[[.x]], na.rm = TRUE)
    )
) %>%
  dplyr::mutate(
    dplyr::across(
      c(mean, sd, min, max, med),
      ~ round(.x, 2)
    )
  ) %>%
  gt::gt(rowname_col = "variable") %>%
  gt::tab_stubhead(label = md("*Variable*")) %>%
  gt::tab_header(
    md("Descriptive Statistics for Continuous Variables")
  ) %>%
  gt::cols_label(
    n    = md("*N*"),
    mean = md("*Mean*"),
    sd   = md("*SD*"),
    min  = md("*Min*"),
    max  = md("*Max*"),
    med  = md("*Median*")
  )

# Display table
descriptives_table


# Save table as image
gtsave(descriptives_table, here::here("figures", "descriptives_table.png"))

#NUMERATION

IMPORTANT: Before moving forward, make sure to open each output document to ensure models were estimated normally. Review: files> data>enum los output (.out) revisar que no salga error (warning esta bien), que el n muestral es correcto y que diga “THE MODEL ESTIMATION TERMINATED NORMALLY”

Model Fit Summary Table1
Classes Par LL BIC aBIC CAIC AWE BLRT VLMR BF cmPk
1-Class 12 −2,630.01 5,325.99 5,287.95 5,337.99 5,427.96 0.00 <.001
2-Class 19 −2,545.99 5,196.43 5,136.20 5,215.43 5,357.88 <.001 <.001 0.00 <.001
3-Class 26 −2,515.47 5,173.86 5,091.44 5,199.86 5,394.78 <.001 0.14 0.00 <.001
4-Class 33 −2,485.63 5,152.66 5,048.05 5,185.66 5,433.07 <.001 0.24 0.14 0.12
5-Class 40 −2,464.42 5,148.73 5,021.93 5,188.73 5,488.61 <.001 0.10 >100 0.88
6-Class 47 −2,451.95 5,162.26 5,013.28 5,209.26 5,561.63 0.02 0.65 0.00
1 Note. Par = Parameters; LL = model log likelihood; BIC = Bayesian information criterion; aBIC = sample size adjusted BIC; CAIC = consistent Akaike information criterion; AWE = approximate weight of evidence criterion; BLRT = bootstrapped likelihood ratio test p-value; VLMR = Vuong-Lo-Mendell-Rubin adjusted likelihood ratio test p-value; cmPk = approximate correct model probability.

##Information Criteria Plot

#LPA

p3 <- plot_lpa(output_ress$c3_ress.out)
p3
ggsave(filename = here::here("figures", "plot_3ps.png"),plot = p3, dpi = 300,
  height = 6, width = 9, units = "in")


p4 <- plot_lpa(output_ress$c4_ress.out)
p4

ggsave(filename = here::here("figures", "plot_4ps.png"),plot = p4, dpi = 300,
  height = 6, width = 9, units = "in")



p5 <- plot_lpa(output_ress$c5_ress.out)
p5
ggsave(filename = here::here("figures", "plot_5ps.png"),plot = p5, dpi = 300,
  height = 6, width = 9, units = "in")



p6 <- plot_lpa(output_ress$c6_ress.out)
p6
ggsave(filename = here::here("figures", "plot_6ps.png"),plot = p6, dpi = 300,
  height = 6, width = 9, units = "in")

---
title: "LPA Classification-Mplus Atomation"
output:
  html_notebook: default
---
Tutorial:https://github.com/immerse-ucsb/lca_enum
Package:https://cran.r-project.org/web/packages/MplusAutomation/index.html
------------------------------------------------------------------------

#DATA 
##Load packages

```{r}
library(tidyverse)
library(haven)
library(glue)
library(MplusAutomation)
library(here)
library(janitor)
library(gt)
library(cowplot)
library(DiagrammeR)
library(readxl)
here::i_am("LPA_ress.Rmd")
```

##Variable LPA RESS = ress_rum, ress_eng, ress_reap, ress_sup, ress_rel, ress_dis average frequency of use of each strategy (average of 4 items per strategy)

##Prepare Data
```{r}
# Load your dataset
getwd()
setWindowTitle("C:/Users/Lenovo/Desktop")
base <- read_excel("C:/Users/Lenovo/Desktop/base.xlsx")
names(base)

# Set up data
df_ress <- readxl::read_excel(here::here("base.xlsx")) %>%
janitor::clean_names() %>%
dplyr::select(ress_rum, ress_eng, ress_reap, ress_sup, ress_rel, ress_dis)
```

#Descriptive Analysis
```{r}
# Compute descriptive statistics for continuous variables and format as gt table
# Compute descriptive statistics for continuous variables and format as gt table
descriptives_table <- purrr::map_dfr(
  c("ress_rum", "ress_eng", "ress_reap", "ress_sup", "ress_rel", "ress_dis"),
  ~ df_ress %>%
    summarise(
      variable = .x,
      n    = sum(!is.na(.data[[.x]])),
      mean = mean(.data[[.x]], na.rm = TRUE),
      sd   = sd(.data[[.x]], na.rm = TRUE),
      min  = min(.data[[.x]], na.rm = TRUE),
      max  = max(.data[[.x]], na.rm = TRUE),
      med  = median(.data[[.x]], na.rm = TRUE)
    )
) %>%
  dplyr::mutate(
    dplyr::across(
      c(mean, sd, min, max, med),
      ~ round(.x, 2)
    )
  ) %>%
  gt::gt(rowname_col = "variable") %>%
  gt::tab_stubhead(label = md("*Variable*")) %>%
  gt::tab_header(
    md("Descriptive Statistics for Continuous Variables")
  ) %>%
  gt::cols_label(
    n    = md("*N*"),
    mean = md("*Mean*"),
    sd   = md("*SD*"),
    min  = md("*Min*"),
    max  = md("*Max*"),
    med  = md("*Median*")
  )

# Display table
descriptives_table

# Save table as image
gtsave(descriptives_table, here::here("figures", "descriptives_table.png"))

```


#NUMERATION

```{r}
# Fit 1- through 6-class LPA models using Mplus and MplusAutomation
lca_6 <- lapply(1:6, function(k) {

  lca_enum <- mplusObject(
    TITLE = glue("{k}-Class"),

    VARIABLE = glue(
      "usevar = ress_rum ress_eng ress_reap ress_sup ress_rel ress_dis;
       classes = c({k}); "
    ),

    ANALYSIS =
      "estimator = mlr;
       type = mixture;
       starts = 200 100;
       processors = 10;",

    OUTPUT = "sampstat residual tech11 tech14;",

    PLOT =
      "type = plot3;
       series = ress_rum-ress_dis(*);",

    usevariables = colnames(df_ress),
    rdata = df_ress
  )

  lca_enum_fit <- mplusModeler(
    lca_enum,
    dataout  = glue::glue(here::here("enum", "ress.dat")),
    modelout = glue::glue(here::here("enum", "c{k}_ress.inp")),
    check = TRUE,
    run = TRUE,
    hashfilename = FALSE
  )

})

```

IMPORTANT: Before moving forward, make sure to open each output document to ensure models were estimated normally.
Review: files> data>enum los output (.out)
revisar que no salga error (warning esta bien), que el n muestral es correcto y que diga "THE MODEL ESTIMATION TERMINATED NORMALLY"


```{r}
# Extract Data
output_ress <- readModels(
  here::here("enum"),
  filefilter = "ress",
  quiet = TRUE
)

enum_extract <- LatexSummaryTable(
  output_ress,
  keepCols = c(
    "Title",
    "Parameters",
    "LL",
    "BIC",
    "aBIC",
    "BLRT_PValue",
    "T11_VLMR_PValue",
    "Observations"
  ),
  sortBy = "Title"
)

allFit <- enum_extract %>%
  mutate(CAIC = -2 * LL + Parameters * (log(Observations) + 1)) %>%
  mutate(AWE  = -2 * LL + 2 * Parameters * (log(Observations) + 1.5)) %>%
  mutate(SIC  = -.5 * BIC) %>%
  mutate(expSIC = exp(SIC - max(SIC))) %>%
  mutate(BF   = exp(SIC - lead(SIC))) %>%
  mutate(cmPk = expSIC / sum(expSIC)) %>%
  dplyr::select(1:5, 9:10, 6:7, 13, 14) %>% 
  arrange(Parameters)

#Table Fit
fit_table1 <- allFit %>%
  gt() %>%
  tab_header(title = md("**Model Fit Summary Table**")) %>%
  cols_label(
    Title       = "Classes",
    Parameters  = md("Par"),
    LL          = md("*LL*"),
    T11_VLMR_PValue = "VLMR",
    BLRT_PValue     = "BLRT",
    BF          = md("BF"),
    cmPk        = md("*cmPk*")
  ) %>%
  tab_footnote(
    footnote = md(
"*Note.* Par = Parameters; *LL* = model log likelihood;
BIC = Bayesian information criterion;
aBIC = sample size adjusted BIC; CAIC = consistent Akaike information criterion;
AWE = approximate weight of evidence criterion;
BLRT = bootstrapped likelihood ratio test p-value;
VLMR = Vuong-Lo-Mendell-Rubin adjusted likelihood ratio test p-value;
*cmPk* = approximate correct model probability."
    ),
    locations = cells_title()
  ) %>%
  tab_options(column_labels.font.weight = "bold") %>%
  fmt_number(c(3:7), decimals = 2) %>%
  sub_missing(1:11, missing_text = "--") %>%
  fmt(
    c(8:9, 11),
    fns = function(x)
      ifelse(x < 0.001, "<.001",
             scales::number(x, accuracy = .01))
  ) %>%
  fmt(
    10,
    fns = function (x)
      ifelse(x > 100, ">100",
             scales::number(x, accuracy = .01))
  ) %>%  
  tab_style(
    style = list(
      cell_text(weight = "bold")
    ),
    locations = list(
      cells_body(columns = BIC,  row = BIC  == min(BIC[1:6])),
      cells_body(columns = aBIC, row = aBIC == min(aBIC[1:6])),
      cells_body(columns = CAIC, row = CAIC == min(CAIC[1:6])),
      cells_body(columns = AWE,  row = AWE  == min(AWE[1:6])),
      cells_body(columns = cmPk, row = cmPk == max(cmPk[1:6])),
      cells_body(columns = BF,   row = BF > 10),
      cells_body(
        columns = T11_VLMR_PValue,
        row = ifelse(T11_VLMR_PValue < .05 & lead(T11_VLMR_PValue) > .05,
                     T11_VLMR_PValue < .05, NA)
      ),
      cells_body(
        columns = BLRT_PValue,
        row = ifelse(BLRT_PValue < .05 & lead(BLRT_PValue) > .05,
                     BLRT_PValue < .05, NA)
      )
    )
  )

fit_table1

#save table
gtsave(fit_table1, here::here("figures", "fit_table1.png"))


```

##Information Criteria Plot


```{r}
# Extract class-specific MEANS for each model (K = 1 to 6)
model_results <- data.frame()

for (i in 1:length(output_ress)) {
  
  temp <- output_ress[[i]]$parameters$unstandardized %>%
    # Keep only RESS indicators AND ONLY MEANS
    dplyr::filter(
      param %in% c(
        "RESS_RUM", "RESS_ENG", "RESS_REAP",
        "RESS_SUP", "RESS_REL", "RESS_DIS"
      ),
      paramHeader == "Means"     # ★ IMPORTANT FIX ★
    ) %>%
    mutate(model = paste(i, "-Class Model"))
  
  model_results <- rbind(model_results, temp)
}

rm(temp)

# Prepare data for comparison plot
compare_plot <- model_results %>%
  dplyr::select(est, model, LatentClass, param) %>%
  mutate(
    LatentClass = factor(LatentClass),     # better legend handling
    param = tolower(param),
    param = factor(
      param,
      levels = c(
        "ress_rum", "ress_eng", "ress_reap",
        "ress_sup", "ress_rel", "ress_dis"
      )
    )
  )

# Plot class means across models
compare_figure <- ggplot(
  compare_plot,
  aes(
    x = param,
    y = est,
    color = LatentClass,
    shape = LatentClass,
    group = LatentClass,
    lty = LatentClass
  )
) +
  geom_point(size = 2.5) +
  geom_line(linewidth = 0.8) +
  scale_colour_viridis_d() +
  facet_wrap(~ model, ncol = 2) +
  labs(
    title = "RESS Mean Profiles Across Class Solutions",
    x = "Indicator",
    y = "Class-specific Mean"
  ) +
  theme_minimal() +
  theme(
    panel.grid.major.y = element_blank(),
    axis.text.x = element_text(angle = -45, hjust = -.1)
  )

# Display figure
compare_figure

# Save figure
ggsave(
  filename = here::here("figures", "compare_class_solutions.png"),
  plot = compare_figure,
  dpi = 300,
  height = 6,
  width = 9,
  units = "in"
)

```


#LPA


```{r}
plot_lpa <- function(model_name) {
  
  #### 1. Extract ONLY means (continuous LPA)
  means_df <- model_name$parameters$unstandardized %>%
    dplyr::filter(
      param %in% c(
        "RESS_RUM","RESS_ENG","RESS_REAP",
        "RESS_SUP","RESS_REL","RESS_DIS"
      ),
      paramHeader == "Means"                 # ★ THIS FIXES DUPLICATES ★
    ) %>%
    dplyr::select(param, LatentClass, est) %>%
    dplyr::mutate(
      LatentClass = as.integer(LatentClass)
    )
  
  #### 2. Class proportions
  props_vec <- model_name$class_counts$modelEstimated$proportion
  
  props_df <- tibble::tibble(
    LatentClass = seq_along(props_vec),
    prop = round(props_vec * 100, 1)
  )
  
  #### 3. Join means + proportions
  plot_df <- means_df %>%
    dplyr::left_join(props_df, by = "LatentClass") %>%
    dplyr::mutate(
      param = tolower(param),
      param = factor(param,
        levels = c("ress_rum","ress_eng","ress_reap",
                   "ress_sup","ress_rel","ress_dis")
      ),
      ClassLabel = factor(
        paste0("Class ", LatentClass, " (", prop, "%)")
      )
    )
  
  #### 4. Title
  model_title <- model_name$input$title
  
  #### 5. Plot
  p <- ggplot(
    plot_df,
    aes(
      x = param,
      y = est,
      color = ClassLabel,
      shape = ClassLabel,
      group = ClassLabel,
      linetype = ClassLabel
    )
  ) +
    geom_point(size = 3) +
    geom_line(linewidth = 0.9) +
    scale_colour_viridis_d() +
    labs(
      title = paste0(model_title, " Mean Profile Plot"),
      x = "Indicator",
      y = "Class-specific Mean"
    ) +
    theme_minimal() +
    theme(
      text = element_text(family = "serif", size = 12),
      legend.position = "top",
      legend.title = element_blank(),
      axis.text.x = element_text(angle = -45, hjust = 0),
      panel.grid.major.y = element_blank()
    )
  
  return(p)
}

```



```{r}
p2 <- plot_lpa(output_ress$c2_ress.out)
p2
ggsave(filename = here::here("figures", "plot_2ps.png"),plot = p2, dpi = 300,
  height = 6, width = 9, units = "in")


p3 <- plot_lpa(output_ress$c3_ress.out)
p3
ggsave(filename = here::here("figures", "plot_3ps.png"),plot = p3, dpi = 300,
  height = 6, width = 9, units = "in")


p4 <- plot_lpa(output_ress$c4_ress.out)
p4
ggsave(filename = here::here("figures", "plot_4ps.png"),plot = p4, dpi = 300,
  height = 6, width = 9, units = "in")


p5 <- plot_lpa(output_ress$c5_ress.out)
p5
ggsave(filename = here::here("figures", "plot_5ps.png"),plot = p5, dpi = 300,
  height = 6, width = 9, units = "in")


p6 <- plot_lpa(output_ress$c6_ress.out)
p6
ggsave(filename = here::here("figures", "plot_6ps.png"),plot = p6, dpi = 300,
  height = 6, width = 9, units = "in")


```



