Teknik Sampling and Survey

Pertemuan 11

Check Sheet

# Buat data check sheet
check_sheet <- data.frame(
  No = 1:20,
  Date = c("16/04/2025", "17/04/2025", "18/04/2025", "19/04/2025", "20/04/2025",
           "21/04/2025", "22/04/2025", "23/04/2025", "24/04/2025", "25/04/2025",
           "26/04/2025", "27/04/2025", "28/04/2025", "29/04/2025", "30/04/2025",
           "01/05/2025", "02/05/2025", "03/05/2025", "04/05/2025", "05/05/2025"),
  Jenis_Error = c("Login Failed", "Crash", "Crash", "Time", "UI Not Responding",
                  "Login Failed", "Time", "Crash", "Time", "UI Not Responding",
                  "Login Failed", "Time", "Crash", "Validation Error", "Login Failed",
                  "Login Failed", "Time", "Crash", "Validation Error", "UI Not Responding")
)

# Tampilkan tabel
datatable(check_sheet, options = list(pageLength = 5))
# Count frequency of each errors
library(dplyr)
library(DT)

error_summary <- check_sheet %>%
  count(Jenis_Error, sort = TRUE) %>%
  rename(Frequency = n)

# Display summary table
datatable(
  error_summary,
  options = list(
    scrollCollapse = TRUE,
    searching = FALSE,   # Remove search box
    paging = FALSE       # Remove pagination
  ),
  rownames = FALSE,
  caption = htmltools::tags$caption(
    style = 'caption-side: top; text-align: left; 
             font-size: 18px; font-weight: bold;',
    'Check Sheet: Summary of Error'
  ),
  class = 'stripe hover compact'
)
library(plotly)

# Interactive bar chart using plotly
plot_ly(error_summary,
        x = ~Frequency,
        y = ~reorder(Jenis_Error, Frequency),
        type = 'bar',
        orientation = 'h',
        marker = list(
          color = ~Frequency,
          colorscale = 'Cividis',  # Can also try: 'Bluered', '', 'YlOrRd'
          showscale = TRUE
        )
) %>%
  layout(
    title = list(text = "Check Sheet: Frequency of Erros", font = list(size = 18)),
    xaxis = list(title = "Frequency"),
    yaxis = list(title = "Error"),
    margin = list(l = 120)
  )

Control Flow

# Load libraries
library(plotly)
library(dplyr)

# Buat data waktu loading aplikasi
loading_data <- data.frame(
  Date = 1:30,
  Loading_Time = c(
    2.1, 2.0, 2.3, 1.9, 2.2, 2.0, 2.4, 2.1, 2.0, 2.5,
    1.8, 2.3, 2.1, 2.0, 2.2, 2.6, 1.9, 2.1, 2.2, 2.0,
    2.7, 2.3, 2.0, 2.1, 2.2, 2.0, 2.3, 1.8, 2.4, 2.1
  )
)

# Tentukan batas kendali
CL <- 2.1
UCL <- 2.4
LCL <- 1.8

# Tandai outliers
loading_data <- loading_data %>%
  mutate(Outlier = ifelse(Loading_Time > UCL | Loading_Time < LCL, "Ya", "Tidak"))

# Buat plot
plot_ly(loading_data, x = ~Date, y = ~Loading_Time, type = 'scatter', mode = 'lines+markers',
        line = list(color = 'blue'), 
        marker = list(size = 8, color = ifelse(loading_data$Outlier == "Ya", "red", "blue")),
        hoverinfo = 'text',
        text = ~paste("Hari:", Date, "<br>Waktu Loading:", Loading_Time, "detik")) %>%
  add_lines(y = rep(CL, 30), name = "CL", line = list(color = 'green', dash = 'dot')) %>%
  add_lines(y = rep(UCL, 30), name = "UCL", line = list(color = 'red', dash = 'dot')) %>%
  add_lines(y = rep(LCL, 30), name = "LCL", line = list(color = 'red', dash = 'dot')) %>%
  layout(title = "Control Chart – Periodic Application Loading Time",
         xaxis = list(title = "Hari"),
         yaxis = list(title = "Waktu Loading (detik)"),
         legend = list(orientation = 'h', x = 0.3, y = -0.2))

Fishbone Diagram

# Load library
library(DiagrammeR)

# Create fishbone diagram
graph <- grViz("
digraph fishbone {
  graph [layout = dot, rankdir = LR]

  # Default node styles
  node [fontname=Helvetica, fontsize=25, style=filled]

  # Central problem
  Problem [label='Main Causes of \\n System Crashes', shape=ellipse, fillcolor=lightcoral, width=5.0, height=1.2]

  # Category nodes (shared style)
  node [shape=diamond, width=2.5, height=1.0, fillcolor='#FFD700']
  A1 [label='Man']
  A2 [label='Method']
  A3 [label='Machine']
  A4 [label='Material']
  A5 [label='Environment']
  A6 [label='Measurement']

  # Reset node style for sub-categories
  node [shape=ellipse, width=2.5, height=0.6, fillcolor='#90EE90']
  A1a [label='Human error']
  A1b [label='Inadequate training']
  A1c [label='Overloaded staff']

  A2a [label='Poor coding practices']
  A2b [label='Lack of testing']

  A3a [label='Hardware failure']
  A3b [label='Overheating']

  A4a [label='Corrupted files']
  A4b [label='Incompatible software']

  A5a [label='Network instability']
  A5b [label='Power outages']

  A6a [label='Inaccurate logs']
  A6b [label='Faulty monitoring tools']

  # Relationships
  A1 -> Problem
  A2 -> Problem
  A3 -> Problem
  A4 -> Problem
  A5 -> Problem
  A6 -> Problem

  A1a -> A1
  A1b -> A1
  A1c -> A1

  A2a -> A2
  A2b -> A2

  A3a -> A3
  A3b -> A3

  A4a -> A4
  A4b -> A4

  A5a -> A5
  A5b -> A5

  A6a -> A6
  A6b -> A6
}
")

# Tampilkan diagram langsung
graph
# Opsional: Simpan sebagai file HTML interaktif
# htmlwidgets::saveWidget(graph, "fishbone_system_crashes.html")

Flowchart

# Load library
library(DiagrammeR)

# Create flowchart
graph <- grViz("
digraph development_flow {
  graph [layout = dot, rankdir = TB]

  # Default node styles
  node [fontname=Helvetica, fontsize=12, style=filled]

  # Start node
  Start [label='Start', shape=circle, fillcolor=lightblue]

  # Process nodes
  Idea [label='Idea', shape=parallelogram, fillcolor=Blue, width=2.5]
  Coding [label='Coding', shape=box, fillcolor=orange, width=2.5]
  Testing [label='Testing', shape=box, fillcolor=orange, width=2.5]
  Deploy [label='Deploy', shape=box, fillcolor=orange, width=2.5]

  # Decision node
  Decision1 [label='Code Passes Tests?', shape=diamond, fillcolor=lightcoral, width=2.5]
  Decision2 [label='Deployment Successful?', shape=diamond, fillcolor=lightcoral, width=2.5]

  # End node
  Finish [label='Finish', shape=circle, fillcolor=lightgray]

  # Relationships
  Start -> Idea
  Idea -> Coding
  Coding -> Testing
  Testing -> Decision1
  Decision1 -> Deploy [label='Yes']
  Decision1 -> Coding [label='No']
  Deploy -> Decision2
  Decision2 -> Finish [label='Yes']
  Decision2 -> Testing [label='No']

  # Optional note
  Note [label='Note: Confirmed by QA Team', shape=note, fillcolor=lightyellow]
  Decision2 -> Note
}
")

# Tampilkan diagram langsung
graph

Histogram

# Load required library
library(plotly)

# Simulate Chrome-only error data
set.seed(123)
chrome_data <- data.frame(
  Errors = rnorm(200, mean = 8, sd = 2)
)

# Plot interactive histogram using Plotly
plot_ly(
  data = chrome_data,
  x = ~Errors,
  type = 'histogram',
  nbinsx = 20,
  marker = list(color = '#1f77b4', line = list(color = 'black', width = 1)),
  opacity = 0.75
) %>%
  layout(
    title = "Histogram of Errors – Chrome Browser",
    xaxis = list(title = "Number of Errors"),
    yaxis = list(title = "Frequency"),
    bargap = 0.1,
    plot_bgcolor = 'white',
    paper_bgcolor = 'white'
  )

Pareto Chart

# Load libraries
library(dplyr)
library(plotly)

# Create simulated data for bugs causing system disruptions
check_sheet <- data.frame(
  Bug_Type = c(
    rep("Memory Leak", 40), rep("Null Pointer", 30), 
    rep("API Failure", 15), rep("UI Freeze", 10), 
    rep("Database Error", 5)
  )
)

# Summarize the number of disruptions by bug type
pareto_data <- check_sheet %>%
  count(Bug_Type, sort = TRUE) %>%
  mutate(
    cum_freq = cumsum(n) / sum(n) * 100  # cumulative percentage
  )

# Create different colors for each Bug Type
colors <- RColorBrewer::brewer.pal(n = length(pareto_data$Bug_Type), name = "Set3")

# Create Plotly Pareto Chart
fig <- plot_ly()

# Add Bar Chart (Count) - with different colors
fig <- fig %>% add_bars(
  x = ~reorder(pareto_data$Bug_Type, -pareto_data$n),
  y = ~pareto_data$n,
  name = 'Number of Disruptions',
  marker = list(color = colors),
  yaxis = "y1"
)

# Add Cumulative Line
fig <- fig %>% add_lines(
  x = ~reorder(pareto_data$Bug_Type, -pareto_data$n),
  y = ~pareto_data$cum_freq,
  name = 'Cumulative (%)',
  yaxis = "y2",
  line = list(color = 'red', dash = 'dash')
)

# Add Cut-off Line at 80%
fig <- fig %>% add_lines(
  x = ~reorder(pareto_data$Bug_Type, -pareto_data$n),
  y = rep(80, length(pareto_data$Bug_Type)),
  name = 'Cut-off 80%',
  yaxis = "y2",
  line = list(color = 'green', dash = 'dot')
)

# Adjust layout
fig <- fig %>% layout(
  title = "Pareto Chart - Bugs Causing System Disruptions",
  xaxis = list(
    title = "Bug Types",
    tickangle = -45   # tilt 45 degrees
  ),
  yaxis = list(title = "Number of Disruptions"),
  yaxis2 = list(
    title = "Cumulative (%)",
    overlaying = "y",
    side = "right",
    range = c(0, 100)
  ),
  legend = list(x = 0.8, y = 0.75),
  shapes = list(
    list(
      type = "line",
      x0 = -0.5,
      x1 = length(pareto_data$Bug_Type) - 0.5,
      y0 = 80,
      y1 = 80,
      yref = "y2",
      line = list(color = "green", width = 2, dash = "dot")
    )
  )
)

# Show chart
fig

Scatter Diagram

# Load the required library
library(plotly)

# Set seed for reproducibility
set.seed(123)

# Create data with strong positive correlation
data <- data.frame(
  Active_Users = seq(100, 1000, by = 50),
  Response_Time = seq(100, 300, length.out = 19) + rnorm(19, mean = 0, sd = 10)
)

# Calculate the correlation coefficient
correlation_value <- cor(data$Active_Users, data$Response_Time)

# Create scatter plot with regression line
fig <- plot_ly(data, 
               x = ~Active_Users, 
               y = ~Response_Time, 
               type = 'scatter', 
               mode = 'markers',
               marker = list(color = 'darkblue', size = 10)) %>%
  add_lines(x = data$Active_Users, 
            y = predict(lm(Response_Time ~ Active_Users, data = data)), 
            line = list(color = 'red', dash = 'solid', width = 2)) %>%
  layout(title = paste("Scatter Diagram: Active Users vs Server Response Time\nCorrelation: ", round(correlation_value, 2)),
         xaxis = list(title = "Number of Active Users"),
         yaxis = list(title = "Server Response Time (ms)"))

# Show the plot
fig
---
title: "Teknik Sampling and Survey"
subtitle: "Pertemuan 11"
author: 
  - "Zain Iqbal Saputra_52240018"
  - "Chello Frhino Mike M_52240031"
date:  "Senin, 05/05/2025"
output:
  rmdformats::readthedown:   
    self_contained: true
    thumbnails: true
    lightbox: true
    gallery: true
    number_sections: false
    lib_dir: libs
    3df_print: "paged"
    code_folding: "show"
    code_download: yes
---

```{r, echo=FALSE, warning=FALSE, message=FALSE}
library(dplyr)
library(DT)
library(plotly)
library(stringi)
library(lubridate)
library(knitr)
library(readr)
```

# Check Sheet

```{r,message=FALSE,warning=FALSE}
# Buat data check sheet
check_sheet <- data.frame(
  No = 1:20,
  Date = c("16/04/2025", "17/04/2025", "18/04/2025", "19/04/2025", "20/04/2025",
           "21/04/2025", "22/04/2025", "23/04/2025", "24/04/2025", "25/04/2025",
           "26/04/2025", "27/04/2025", "28/04/2025", "29/04/2025", "30/04/2025",
           "01/05/2025", "02/05/2025", "03/05/2025", "04/05/2025", "05/05/2025"),
  Jenis_Error = c("Login Failed", "Crash", "Crash", "Time", "UI Not Responding",
                  "Login Failed", "Time", "Crash", "Time", "UI Not Responding",
                  "Login Failed", "Time", "Crash", "Validation Error", "Login Failed",
                  "Login Failed", "Time", "Crash", "Validation Error", "UI Not Responding")
)

# Tampilkan tabel
datatable(check_sheet, options = list(pageLength = 5))
```


```{r,message=FALSE,warning=FALSE}
# Count frequency of each errors
library(dplyr)
library(DT)

error_summary <- check_sheet %>%
  count(Jenis_Error, sort = TRUE) %>%
  rename(Frequency = n)

# Display summary table
datatable(
  error_summary,
  options = list(
    scrollCollapse = TRUE,
    searching = FALSE,   # Remove search box
    paging = FALSE       # Remove pagination
  ),
  rownames = FALSE,
  caption = htmltools::tags$caption(
    style = 'caption-side: top; text-align: left; 
             font-size: 18px; font-weight: bold;',
    'Check Sheet: Summary of Error'
  ),
  class = 'stripe hover compact'
)
```

```{r,message=FALSE,warning=FALSE}
library(plotly)

# Interactive bar chart using plotly
plot_ly(error_summary,
        x = ~Frequency,
        y = ~reorder(Jenis_Error, Frequency),
        type = 'bar',
        orientation = 'h',
        marker = list(
          color = ~Frequency,
          colorscale = 'Cividis',  # Can also try: 'Bluered', '', 'YlOrRd'
          showscale = TRUE
        )
) %>%
  layout(
    title = list(text = "Check Sheet: Frequency of Erros", font = list(size = 18)),
    xaxis = list(title = "Frequency"),
    yaxis = list(title = "Error"),
    margin = list(l = 120)
  )
```

# Control Flow

```{r,message=FALSE,warning=FALSE}
# Load libraries
library(plotly)
library(dplyr)

# Buat data waktu loading aplikasi
loading_data <- data.frame(
  Date = 1:30,
  Loading_Time = c(
    2.1, 2.0, 2.3, 1.9, 2.2, 2.0, 2.4, 2.1, 2.0, 2.5,
    1.8, 2.3, 2.1, 2.0, 2.2, 2.6, 1.9, 2.1, 2.2, 2.0,
    2.7, 2.3, 2.0, 2.1, 2.2, 2.0, 2.3, 1.8, 2.4, 2.1
  )
)

# Tentukan batas kendali
CL <- 2.1
UCL <- 2.4
LCL <- 1.8

# Tandai outliers
loading_data <- loading_data %>%
  mutate(Outlier = ifelse(Loading_Time > UCL | Loading_Time < LCL, "Ya", "Tidak"))

# Buat plot
plot_ly(loading_data, x = ~Date, y = ~Loading_Time, type = 'scatter', mode = 'lines+markers',
        line = list(color = 'blue'), 
        marker = list(size = 8, color = ifelse(loading_data$Outlier == "Ya", "red", "blue")),
        hoverinfo = 'text',
        text = ~paste("Hari:", Date, "<br>Waktu Loading:", Loading_Time, "detik")) %>%
  add_lines(y = rep(CL, 30), name = "CL", line = list(color = 'green', dash = 'dot')) %>%
  add_lines(y = rep(UCL, 30), name = "UCL", line = list(color = 'red', dash = 'dot')) %>%
  add_lines(y = rep(LCL, 30), name = "LCL", line = list(color = 'red', dash = 'dot')) %>%
  layout(title = "Control Chart – Periodic Application Loading Time",
         xaxis = list(title = "Hari"),
         yaxis = list(title = "Waktu Loading (detik)"),
         legend = list(orientation = 'h', x = 0.3, y = -0.2))
```

# Fishbone Diagram

```{r,message=FALSE,warning=FALSE}
# Load library
library(DiagrammeR)

# Create fishbone diagram
graph <- grViz("
digraph fishbone {
  graph [layout = dot, rankdir = LR]

  # Default node styles
  node [fontname=Helvetica, fontsize=25, style=filled]

  # Central problem
  Problem [label='Main Causes of \\n System Crashes', shape=ellipse, fillcolor=lightcoral, width=5.0, height=1.2]

  # Category nodes (shared style)
  node [shape=diamond, width=2.5, height=1.0, fillcolor='#FFD700']
  A1 [label='Man']
  A2 [label='Method']
  A3 [label='Machine']
  A4 [label='Material']
  A5 [label='Environment']
  A6 [label='Measurement']

  # Reset node style for sub-categories
  node [shape=ellipse, width=2.5, height=0.6, fillcolor='#90EE90']
  A1a [label='Human error']
  A1b [label='Inadequate training']
  A1c [label='Overloaded staff']

  A2a [label='Poor coding practices']
  A2b [label='Lack of testing']

  A3a [label='Hardware failure']
  A3b [label='Overheating']

  A4a [label='Corrupted files']
  A4b [label='Incompatible software']

  A5a [label='Network instability']
  A5b [label='Power outages']

  A6a [label='Inaccurate logs']
  A6b [label='Faulty monitoring tools']

  # Relationships
  A1 -> Problem
  A2 -> Problem
  A3 -> Problem
  A4 -> Problem
  A5 -> Problem
  A6 -> Problem

  A1a -> A1
  A1b -> A1
  A1c -> A1

  A2a -> A2
  A2b -> A2

  A3a -> A3
  A3b -> A3

  A4a -> A4
  A4b -> A4

  A5a -> A5
  A5b -> A5

  A6a -> A6
  A6b -> A6
}
")

# Tampilkan diagram langsung
graph

# Opsional: Simpan sebagai file HTML interaktif
# htmlwidgets::saveWidget(graph, "fishbone_system_crashes.html")
```

# Flowchart

```{r,message=FALSE,warning=FALSE}
# Load library
library(DiagrammeR)

# Create flowchart
graph <- grViz("
digraph development_flow {
  graph [layout = dot, rankdir = TB]

  # Default node styles
  node [fontname=Helvetica, fontsize=12, style=filled]

  # Start node
  Start [label='Start', shape=circle, fillcolor=lightblue]

  # Process nodes
  Idea [label='Idea', shape=parallelogram, fillcolor=Blue, width=2.5]
  Coding [label='Coding', shape=box, fillcolor=orange, width=2.5]
  Testing [label='Testing', shape=box, fillcolor=orange, width=2.5]
  Deploy [label='Deploy', shape=box, fillcolor=orange, width=2.5]

  # Decision node
  Decision1 [label='Code Passes Tests?', shape=diamond, fillcolor=lightcoral, width=2.5]
  Decision2 [label='Deployment Successful?', shape=diamond, fillcolor=lightcoral, width=2.5]

  # End node
  Finish [label='Finish', shape=circle, fillcolor=lightgray]

  # Relationships
  Start -> Idea
  Idea -> Coding
  Coding -> Testing
  Testing -> Decision1
  Decision1 -> Deploy [label='Yes']
  Decision1 -> Coding [label='No']
  Deploy -> Decision2
  Decision2 -> Finish [label='Yes']
  Decision2 -> Testing [label='No']

  # Optional note
  Note [label='Note: Confirmed by QA Team', shape=note, fillcolor=lightyellow]
  Decision2 -> Note
}
")

# Tampilkan diagram langsung
graph
```

# Histogram

```{r,message=FALSE,warning=FALSE}
# Load required library
library(plotly)

# Simulate Chrome-only error data
set.seed(123)
chrome_data <- data.frame(
  Errors = rnorm(200, mean = 8, sd = 2)
)

# Plot interactive histogram using Plotly
plot_ly(
  data = chrome_data,
  x = ~Errors,
  type = 'histogram',
  nbinsx = 20,
  marker = list(color = '#1f77b4', line = list(color = 'black', width = 1)),
  opacity = 0.75
) %>%
  layout(
    title = "Histogram of Errors – Chrome Browser",
    xaxis = list(title = "Number of Errors"),
    yaxis = list(title = "Frequency"),
    bargap = 0.1,
    plot_bgcolor = 'white',
    paper_bgcolor = 'white'
  )
```

# Pareto Chart

```{r,message=FALSE,warning=FALSE}
# Load libraries
library(dplyr)
library(plotly)

# Create simulated data for bugs causing system disruptions
check_sheet <- data.frame(
  Bug_Type = c(
    rep("Memory Leak", 40), rep("Null Pointer", 30), 
    rep("API Failure", 15), rep("UI Freeze", 10), 
    rep("Database Error", 5)
  )
)

# Summarize the number of disruptions by bug type
pareto_data <- check_sheet %>%
  count(Bug_Type, sort = TRUE) %>%
  mutate(
    cum_freq = cumsum(n) / sum(n) * 100  # cumulative percentage
  )

# Create different colors for each Bug Type
colors <- RColorBrewer::brewer.pal(n = length(pareto_data$Bug_Type), name = "Set3")

# Create Plotly Pareto Chart
fig <- plot_ly()

# Add Bar Chart (Count) - with different colors
fig <- fig %>% add_bars(
  x = ~reorder(pareto_data$Bug_Type, -pareto_data$n),
  y = ~pareto_data$n,
  name = 'Number of Disruptions',
  marker = list(color = colors),
  yaxis = "y1"
)

# Add Cumulative Line
fig <- fig %>% add_lines(
  x = ~reorder(pareto_data$Bug_Type, -pareto_data$n),
  y = ~pareto_data$cum_freq,
  name = 'Cumulative (%)',
  yaxis = "y2",
  line = list(color = 'red', dash = 'dash')
)

# Add Cut-off Line at 80%
fig <- fig %>% add_lines(
  x = ~reorder(pareto_data$Bug_Type, -pareto_data$n),
  y = rep(80, length(pareto_data$Bug_Type)),
  name = 'Cut-off 80%',
  yaxis = "y2",
  line = list(color = 'green', dash = 'dot')
)

# Adjust layout
fig <- fig %>% layout(
  title = "Pareto Chart - Bugs Causing System Disruptions",
  xaxis = list(
    title = "Bug Types",
    tickangle = -45   # tilt 45 degrees
  ),
  yaxis = list(title = "Number of Disruptions"),
  yaxis2 = list(
    title = "Cumulative (%)",
    overlaying = "y",
    side = "right",
    range = c(0, 100)
  ),
  legend = list(x = 0.8, y = 0.75),
  shapes = list(
    list(
      type = "line",
      x0 = -0.5,
      x1 = length(pareto_data$Bug_Type) - 0.5,
      y0 = 80,
      y1 = 80,
      yref = "y2",
      line = list(color = "green", width = 2, dash = "dot")
    )
  )
)

# Show chart
fig
```

# Scatter Diagram

```{r,message=FALSE,warning=FALSE}
# Load the required library
library(plotly)

# Set seed for reproducibility
set.seed(123)

# Create data with strong positive correlation
data <- data.frame(
  Active_Users = seq(100, 1000, by = 50),
  Response_Time = seq(100, 300, length.out = 19) + rnorm(19, mean = 0, sd = 10)
)

# Calculate the correlation coefficient
correlation_value <- cor(data$Active_Users, data$Response_Time)

# Create scatter plot with regression line
fig <- plot_ly(data, 
               x = ~Active_Users, 
               y = ~Response_Time, 
               type = 'scatter', 
               mode = 'markers',
               marker = list(color = 'darkblue', size = 10)) %>%
  add_lines(x = data$Active_Users, 
            y = predict(lm(Response_Time ~ Active_Users, data = data)), 
            line = list(color = 'red', dash = 'solid', width = 2)) %>%
  layout(title = paste("Scatter Diagram: Active Users vs Server Response Time\nCorrelation: ", round(correlation_value, 2)),
         xaxis = list(title = "Number of Active Users"),
         yaxis = list(title = "Server Response Time (ms)"))

# Show the plot
fig
```