This is a demo exploratory analysis report using example data created inside R. It demonstrates the basic steps for data exploration and reporting in preparation for building a prediction algorithm and Shiny app.
set.seed(123)
# Create a simple example training dataset with 100 rows
train <- data.frame(
feature_1 = rnorm(100, mean = 50, sd = 10),
feature_2 = sample(c("A", "B", "C"), 100, replace = TRUE),
target_variable = sample(c(0, 1), 100, replace = TRUE)
)
# Show the first 6 rows of the data
head(train)
## feature_1 feature_2 target_variable
## 1 44.39524 B 1
## 2 47.69823 B 1
## 3 65.58708 A 1
## 4 50.70508 B 0
## 5 51.29288 C 0
## 6 67.15065 C 0
# Histogram of feature_1
hist(train$feature_1, main = "Distribution of Feature 1", xlab = "Feature 1")
# Barplot of feature_2 categories
barplot(table(train$feature_2), main = "Count of Feature 2 Categories", xlab = "Category")