Condom Use Among Men at Mafeteng Hospital, Lesotho

Author

Lefosa Molefe, Mashea Amelia & Amstutz Alain

Department of Nursing, Faculty of Health Sciences, National University of Lesotho

Packages

Code

req_pkgs <- c("readxl",
              "dplyr",
              "tidyr",
              "here",
              "ggplot2",
              "gtsummary",
              "forcats",
              "broom"
)
install_if_missing <- function(pkgs){
  for(p in pkgs){
    if(!requireNamespace(p, quietly=TRUE)){
      install.packages(p, repos="https://cloud.r-project.org")
    }
    library(p, character.only=TRUE)
  }
}
install_if_missing(req_pkgs)

(1) Variable formatting and main outcome

Main outcome Condom use & Reasons for non-use

Code

# Import
df <- read_excel(here("df.xlsx"))

# Remove row with "#NULL!"
df <- df %>%
  filter(!if_any(everything(), ~ . == "#NULL!"))

# Numeric continuous variables
numeric_vars <- c("Age", "Duration", "Age_Difference", "Duration_Dating")

# Ordinal Likert-scale variables (1–5), others convert to factor for now
likert_vars <- c(
  "Lack_Trust", "Enhance_Pleasure", "Decrease_Pleasure", "Beautiful_Girls",
  "No_love", "Suggest_Use", "Morally_wrong", "Messy", "Unprotected_sex",
  "Heightened_excitement", "Responsible_sexual_behaviour", "Women_perception",
  "Embarrassed_Purchasing", "Confident_putting_on", "Regret_Later",
  "Religion_and_Culture", "Less_masculine", "Woman_Resposibility", "Promiscuity",
  "Taboo", "Personal_Choice", "Prevent_STIs", "Effective_Contraception", "Easy_Use",
  "Expensive", "Easily_Available", "Poor_Quality", "Comfortable", "Dry_out",
  "Breakage", "Bad_smell"
)

# Convert variables to appropriate types
df <- df %>%
  mutate(
    # Convert numeric vars to numeric
    across(all_of(numeric_vars), ~ as.numeric(.)),

    # Convert Likert vars to ordered factors
    across(all_of(likert_vars), ~ factor(as.numeric(.), 
                                         levels = 1:5, 
                                         ordered = TRUE)),

    # Everything else becomes unordered factor
    across(-c(all_of(numeric_vars), all_of(likert_vars)), as.factor)
  )

# Outcome variable and reasons for non-use
df <- df %>%
  mutate(
    Condom_use = as.numeric(Condom_use),
    Disuse = as.numeric(Disuse)
  ) %>%
  mutate(
    Condom_use = factor(
      Condom_use,
      levels = c(1, 2),
      labels = c("Used Condom", "Did Not Use Condom")
    ),
    Disuse = factor(
      Disuse,
      levels = 1:8,
      labels = c(
        "Alcohol",
        "Use condoms?",
        "Trust partner",
        "Uncomfortable",
        "Did not think much about",
        "Unavailable",
        "Decrease pleasure",
        "Never used a condom"
      )
    )
  )

# Prepare plot data incl. percentages
cds_use <- df %>%
  count(Condom_use) %>%
  mutate(percent = n / sum(n) * 100) %>%
  arrange(desc(n))
reason_counts <- df %>%
  filter(Condom_use == "Did Not Use Condom") %>%
  count(Disuse) %>%
  mutate(percent = n / sum(n) * 100) %>%
  arrange(desc(n))

# Plot: Condom use
ggplot(cds_use, aes(x = reorder(Condom_use, percent), y = percent)) +
  geom_col(fill = "steelblue") +
  geom_text(aes(label = n),           # counts inside bar
            hjust = 1.5, color = "white", size = 3.5) +  # moved left
  geom_text(aes(y = percent + 3,      # percentages outside bar
                label = paste0(round(percent, 1), "%")), 
            hjust = 0, size = 3.5) +
  coord_flip() +
  labs(
    title = "Condom Use",
    subtitle = "Among all respondents (n=93)",
    x = "",
    y = "Percentage displayed (count in white)"
  ) +
  theme_minimal(base_size = 13) +
  theme(
    plot.title = element_text(face = "bold"),
    plot.subtitle = element_text(color = "gray40")
  ) +
  expand_limits(y = max(cds_use$percent) * 1.2)

Code

# Plot: Reasons for not using condoms
ggplot(reason_counts, aes(x = reorder(Disuse, percent), y = percent)) +
  geom_col(fill = "steelblue") +
  geom_text(aes(label = n),           # counts inside bar
            hjust = 1.5, color = "white", size = 3.5) +  # moved left
  geom_text(aes(y = percent + 3,      # percentages outside bar
                label = paste0(round(percent, 1), "%")), 
            hjust = 0, size = 3.5) +
  coord_flip() +
  labs(
    title = "Reasons for Not Using Condoms",
    subtitle = "Among respondents who did not use condoms (n=53)",
    x = "",
    y = "Percentage displayed (count in white)"
  ) +
  theme_minimal(base_size = 13) +
  theme(
    plot.title = element_text(face = "bold"),
    plot.subtitle = element_text(color = "gray40")
  ) +
  expand_limits(y = max(reason_counts$percent) * 1.2)

(2) Baseline table

Code

# Baseline characteristics, keeping Condom_use for stratification
df <- df %>%
  mutate(
    Duration = na_if(Duration, 999),
    Age_Difference = na_if(Age_Difference, 177),
    Duration_Dating = na_if(Duration_Dating, 188)
  )
df <- df %>%
  mutate(
    Duration = case_when(Duration == 77 ~ 0.5,
                         TRUE ~ Duration),
    Duration_Dating = case_when(Duration == 77 ~ 0.5,
                         TRUE ~ Duration_Dating)
  )
df <- df %>%
  mutate(
    Qualification = factor(Qualification,
      levels = c("1.000000", "2.000000", "3.000000", "4.000000", "5.000000"),
      labels = c("Primary", "Secondary", "High School", "Tertiary", "Masters Degree")),
    Income = factor(Income,
      levels = c("1.000000", "2.000000", "3.000000", "4.000000"),
      labels = c("employed", "self-employed", "Piece jobs", "Parental Support")),
    Religion = factor(Religion,
      levels = c("1.000000", "2.000000", "3.000000", "4.000000", "5.000000", "6.000000", "7.000000", "8.000000", "9.000000", "10.000000", "11.000000"),
      labels = c("Lesotho Evangelical Church of Southern Africa", "Roman Catholic Church", 
                 "Anglican Church of Southern Africa", "Apostolic Church", "Buddism", 
                 "St. Johns", "Not Affiliated", "Born Again Christian Church", 
                 "Jehova's Witness", "Dutch Reformed Church", "Muslim")),
    Sex = factor(Sex,
      levels = c("1.000000", "2.000000", "3.000000", "4.000000"),
      labels = c("Hetero", "Gay", "Bisexual", "Rather not say"))
  )



baseline_vars <- df %>%
  select(Age, Marriage, Duration, Relationship, Age_Difference,
         Duration_Dating, Qualification, Income, Religion, Sex, Condom_use)

tbl_baseline <- tbl_summary(
  data = baseline_vars,
  by = Condom_use,
  label = list(
    Age ~ "Age (years)",
    Marriage ~ "Marital Status",
    Duration ~ "Relationship Duration (years)",
    Relationship ~ "Relationship Type",
    Age_Difference ~ "Age Difference (months)",
    Duration_Dating ~ "Dating Duration",
    Qualification ~ "Education Level",
    Income ~ "Source of Income",
    Religion ~ "Religion",
    Sex ~ "Sexual Orientation"
  ),
  type = list(
    Age ~ "continuous",
    Duration ~ "continuous",
    Age_Difference ~ "continuous",
    Duration_Dating ~ "continuous"
  ),
  statistic = list(
    all_continuous() ~ "{mean} ({sd})",
    all_categorical() ~ "{n} ({p}%)"
  ),
  missing = "no"
) %>%
  add_overall() %>%
  bold_labels() %>%
  modify_header(label = "**Variable**") %>%
  modify_caption("**Baseline Table Stratified by Condom Use**")

tbl_baseline

**Baseline Table Stratified by Condom Use**
Variable	Overall N = 93¹	Used Condom N = 40¹	Did Not Use Condom N = 53¹
Age (years)	27 (7)	28 (7)	26 (6)
Marital Status
1.000000	28 (30%)	13 (33%)	15 (28%)
2.000000	64 (69%)	26 (65%)	38 (72%)
22.000000	1 (1.1%)	1 (2.5%)	0 (0%)
Relationship Duration (years)	5.8 (6.0)	6.5 (6.3)	5.2 (5.8)
Relationship Type
111.000000	30 (32%)	14 (35%)	16 (30%)
2.000000	2 (2.2%)	0 (0%)	2 (3.8%)
3.000000	48 (52%)	20 (50%)	28 (53%)
4.000000	13 (14%)	6 (15%)	7 (13%)
Age Difference (months)	3.27 (2.86)	4.00 (3.28)	2.69 (2.36)
Dating Duration	13 (27)	18 (31)	10 (24)
Education Level
Primary	9 (9.7%)	6 (15%)	3 (5.7%)
Secondary	11 (12%)	5 (13%)	6 (11%)
High School	40 (43%)	17 (43%)	23 (43%)
Tertiary	31 (33%)	12 (30%)	19 (36%)
Masters Degree	2 (2.2%)	0 (0%)	2 (3.8%)
Source of Income
employed	23 (25%)	10 (25%)	13 (25%)
self-employed	23 (25%)	9 (23%)	14 (26%)
Piece jobs	23 (25%)	11 (28%)	12 (23%)
Parental Support	24 (26%)	10 (25%)	14 (26%)
Religion
Lesotho Evangelical Church of Southern Africa	20 (22%)	7 (18%)	13 (25%)
Roman Catholic Church	23 (25%)	9 (23%)	14 (26%)
Anglican Church of Southern Africa	9 (9.7%)	4 (10%)	5 (9.4%)
Apostolic Church	10 (11%)	5 (13%)	5 (9.4%)
Buddism	3 (3.2%)	3 (7.5%)	0 (0%)
St. Johns	3 (3.2%)	1 (2.5%)	2 (3.8%)
Not Affiliated	16 (17%)	6 (15%)	10 (19%)
Born Again Christian Church	6 (6.5%)	4 (10%)	2 (3.8%)
Jehova's Witness	1 (1.1%)	0 (0%)	1 (1.9%)
Dutch Reformed Church	1 (1.1%)	1 (2.5%)	0 (0%)
Muslim	1 (1.1%)	0 (0%)	1 (1.9%)
Sexual Orientation
Hetero	86 (92%)	36 (90%)	50 (94%)
Gay	0 (0%)	0 (0%)	0 (0%)
Bisexual	1 (1.1%)	1 (2.5%)	0 (0%)
Rather not say	6 (6.5%)	3 (7.5%)	3 (5.7%)
¹ Mean (SD); n (%)

Levels for Marital Status?
Levels for “Relationship Type”?
Is Relationship Duration (years) only for those married and Dating Duration more general?
Age Difference (years): Is this + or - or both?

(3) Personal Barriers re Condom Use

1 represents strongly disagree and 5 Strongly agree

Code

likert_vars <- c(
  "Lack_Trust", "Enhance_Pleasure", "Decrease_Pleasure", "Beautiful_Girls", "No_love", "Suggest_Use",
  "Morally_wrong", "Messy", "Unprotected_sex", "Heightened_excitement",
  "Responsible_sexual_behaviour", "Women_perception", "Embarrassed_Purchasing",
  "Confident_putting_on", "Regret_Later"
)

var_labels <- c(
  "Lack_Trust" = "Using condoms means lack of trust",
  "Enhance_Pleasure" = "Condoms enhance sexual pleasure",
  "Decrease_Pleasure" = "Condoms decrease sexual pleasure",
  "Beautiful_Girls" = "Beautiful girls are safe",
  "No_love" = "Using condoms means lack of love",
  "Suggest_Use" = "I feel comfortable suggesting use of condoms",
  "Morally_wrong" = "Morally wrong to use condoms",
  "Messy" = "Condoms are messy",
  "Unprotected_sex" = "Excitement of unprotected sex",
  "Heightened_excitement" = "Condom use heightens pleasure",
  "Responsible_sexual_behaviour" = "Using a condom is a woman’s responsibility",
  "Women_perception" = "Women think men who use condoms cheat",
  "Embarrassed_Purchasing" = "Embarrassed purchasing a condom",
  "Confident_putting_on" = "Confident in my ability to use a condom",
  "Regret_Later" = "I only need to worry later"
)

# Drop rows with NA
df_likert <- df %>%
  select(all_of(likert_vars)) %>%
  drop_na()

# Reshape data
likert_long <- df_likert %>%
  pivot_longer(cols = everything(), names_to = "Variable", values_to = "Response") %>%
  mutate(
    Variable = recode(Variable, !!!var_labels),
    Response = as.numeric(as.character(Response))
  ) %>%
  mutate(
    Direction = case_when(
      Response %in% c(1,2) ~ "Disagree",
      Response == 3 ~ "Neutral",
      Response %in% c(4,5) ~ "Agree"
    ),
    ResponseLabel = case_when(
      Response == 1 ~ "Strongly Disagree",
      Response == 2 ~ "Disagree",
      Response == 3 ~ "Neutral",
      Response == 4 ~ "Agree",
      Response == 5 ~ "Strongly Agree"
    )
  )

# Percentages
likert_perc <- likert_long %>%
  group_by(Variable, ResponseLabel, Direction) %>%
  summarise(n = n(), .groups = "drop") %>%
  group_by(Variable) %>%
  mutate(percent = n / sum(n) * 100) %>%
  ungroup()

# Diverging percentages
likert_perc <- likert_perc %>%
  mutate(percent_diverge = case_when(
    Direction == "Disagree" ~ -percent,
    Direction == "Agree" ~ percent,
    TRUE ~ 0
  ))

# Drop unused factor levels for plotting
likert_perc$ResponseLabel <- droplevels(factor(likert_perc$ResponseLabel))
likert_perc$Variable <- fct_rev(factor(likert_perc$Variable))

# Factor order for fill
likert_perc$ResponseLabel <- factor(
  likert_perc$ResponseLabel,
  levels = c("Strongly Disagree","Disagree","Agree","Strongly Agree")
)

# Max agree for neutral bar offset
max_agree <- max(likert_perc$percent_diverge[likert_perc$Direction=="Agree"])
neutral_offset <- max_agree + 26

# Dynamic x-axis limits
x_min <- floor(min(likert_perc$percent_diverge[likert_perc$Direction != "Neutral"]) / 10) * 10
neutral_max <- max(likert_perc$percent[likert_perc$Direction == "Neutral"])
x_max <- ceiling((neutral_offset + neutral_max) / 10) * 10

# Subset for diverging bars
likert_perc_div <- subset(likert_perc, Direction != "Neutral")
likert_perc_div$ResponseLabel <- factor(
  likert_perc_div$ResponseLabel,
  levels = c("Strongly Disagree","Disagree","Agree","Strongly Agree")
)
likert_perc_div$Variable <- droplevels(likert_perc_div$Variable)

# Subset for neutral bars with percent > 0
neutral_data <- subset(likert_perc, Direction == "Neutral" & percent > 0)
neutral_data$Variable <- droplevels(neutral_data$Variable)

# Plot
ggplot() +
  # Diverging bars
  geom_col(
    data = likert_perc_div,
    aes(x = percent_diverge, y = Variable, fill = ResponseLabel),
    width = 0.7
  ) +
  # Neutral bars as thin grey rectangles
  geom_rect(
    data = neutral_data,
    aes(
      xmin = neutral_offset,
      xmax = neutral_offset + percent,
      ymin = as.numeric(Variable) - 0.3,
      ymax = as.numeric(Variable) + 0.3
    ),
    fill = "#f0f0f0"
  ) +
  # Neutral labels
  geom_text(
    data = neutral_data,
    aes(
      x = neutral_offset + percent + 1,
      y = as.numeric(Variable),
      label = paste0(round(percent,1),"%")
    ),
    hjust = 0,
    size = 3
  ) +
  # Colors for diverging bars
  scale_fill_manual(
    values = c(
      "Strongly Disagree" = "#d73027",
      "Disagree" = "#fc8d59",
      "Agree" = "#91cf60",
      "Strongly Agree" = "#1a9850"
    )
  ) +
  # X-axis
  scale_x_continuous(
    labels = abs,
    breaks = seq(x_min, x_max, 10),
    limits = c(x_min, x_max)
  ) +
  labs(
    x = "Percentage",
    y = "",
    fill = "Response",
    title = "Personal Barriers to Condom Utilization",
    subtitle = "Neutrals displayed as separate grey bars"
  ) +
  theme_minimal(base_size = 13) +
  theme(
    axis.text.y = element_text(face = "bold"),
    legend.position = "bottom",
    panel.grid.major.x = element_line(color = "gray80", size = 0.3),
    panel.grid.minor.x = element_line(color = "gray90", size = 0.2),
    plot.subtitle = element_text(size = 11, color = "gray50") 
  )

In CSV file there are 15 questions (see Unprotected_sex and Heightened_excitement), but in the manuscript only 14 ?!? Please check

(4) Personal Barriers on Condom use

– Add variable levels ––

Code

# Convert Likert factors to numeric and calculate average barrier score
df_numeric <- df %>%
  mutate(across(all_of(likert_vars), ~ as.numeric(as.character(.)))) %>%
  rowwise() %>%
  mutate(
    Barrier_Score = mean(c_across(all_of(likert_vars)), na.rm = TRUE)
  ) %>%
  ungroup()

# Outcome
df_numeric$Condom_use <- factor(df_numeric$Condom_use,
                                levels = c("Used Condom", "Did Not Use Condom"))

# Logistic regression
model_total <- glm(
  Condom_use ~ Barrier_Score,
  data = df_numeric,
  family = binomial
)

# Output
tbl_1 <- model_total %>%
  tbl_regression(
    intercept = TRUE,
    estimate_fun = function(x) style_sigfig(x, digits = 4),
    label = list(Barrier_Score ~ "Average Barrier Score (1–5)"),
    tidy_fun = broom.helpers::tidy_parameters,
    exponentiate = TRUE   # show OR instead of log-odds
  ) %>%
  modify_caption("Association of Average Barrier Score with Condom Use") %>%
  modify_column_hide(columns = "p.value")
tbl_1

Association of Average Barrier Score with Condom Use
Characteristic	OR	95% CI
(Intercept)	0.0904	0.0032, 2.142
Average Barrier Score (1–5)	2.468	0.8591, 7.593
Abbreviations: CI = Confidence Interval, OR = Odds Ratio

Code

ggplot(df_numeric, aes(x = Condom_use, y = Barrier_Score, fill = Condom_use)) +
  geom_boxplot() +
  labs(x = "Condom Use", y = "Average Barrier Score") +
  theme_minimal()