# Normality diagnostics for iris$Sepal.Length: histogram with a density
# overlay, Q-Q plot, Shapiro-Wilk and Kolmogorov-Smirnov tests, and the
# sample skewness and kurtosis.
# NOTE(review): ggplot(), qqPlot(), skewness() and kurtosis() are not base R.
# This assumes the providing packages (presumably ggplot2, car, and moments
# or e1071) are attached elsewhere in the file -- confirm.
data(iris)

# The histogram is drawn on the density scale so that the kernel density
# curve shares the same y axis.
ggplot(iris, aes(x = Sepal.Length)) +
  geom_histogram(
    aes(y = after_stat(density)),
    bins = 30, fill = "blue", alpha = 0.7
  ) +
  geom_density(color = "red") +
  ggtitle("Гистограмма и плотность Sepal.Length")

qqPlot(iris$Sepal.Length, main = "Q-Q график Sepal.Length")

shapiro_test <- shapiro.test(iris$Sepal.Length)
shapiro_test

# ks.test() expects the reference distribution's parameters to be fixed in
# advance. Here mean and sd are estimated from the same sample, so the
# reported p-value should be read as approximate only.
ks_test <- ks.test(
  iris$Sepal.Length, "pnorm",
  mean = mean(iris$Sepal.Length),
  sd = sd(iris$Sepal.Length)
)
ks_test

skewness(iris$Sepal.Length)
kurtosis(iris$Sepal.Length)
# Reproducible synthetic data set (100 rows) used by the analysis helpers:
# three standard-normal numeric columns, a four-level region, an integer age
# in 18..70, and two three-level categorical answer columns.
# The columns are drawn in the order listed; reordering them would change the
# values generated from the seed.
# NOTE(review): the name `data` masks utils::data() for function-free lookups
# only; it is kept because the calls to the analysis helpers refer to it.
set.seed(0)
data <- data.frame(
  V12 = rnorm(100),
  V13 = rnorm(100),
  V15 = rnorm(100),
  region = sample(c("North", "South", "East", "West"), 100, replace = TRUE),
  age = sample(18:70, 100, replace = TRUE),
  V14 = sample(c("Option1", "Option2", "Option3"), 100, replace = TRUE),
  V16 = sample(c("OptionA", "OptionB", "OptionC"), 100, replace = TRUE)
)
#' Plot and summarise variables one at a time
#'
#' For each name in `variables`, prints a 30-bin histogram on the density
#' scale with a kernel density overlay, then prints `summary()` of that
#' column.
#'
#' @param data A data frame containing the columns named in `variables`.
#' @param variables Character vector of column names in `data`. Plain column
#'   names only (expressions such as `"log(x)"` are not supported).
#' @return `NULL`, invisibly. Called for its printing side effects.
#' @details NOTE(review): assumes ggplot2 (>= 3.3.0, for `after_stat()`) is
#'   attached by the surrounding script -- confirm.
univariate_analysis <- function(data, variables) {
  # Fail early with a readable message instead of a deferred plotting error.
  missing_cols <- setdiff(variables, names(data))
  if (length(missing_cols) > 0) {
    stop(
      "Columns not found in `data`: ",
      paste(missing_cols, collapse = ", "),
      call. = FALSE
    )
  }

  for (variable in variables) {
    # `.data[[variable]]` replaces the deprecated aes_string(); the x label
    # is set explicitly so the axis still shows the column name.
    hist_plot <- ggplot(data, aes(x = .data[[variable]])) +
      geom_histogram(
        aes(y = after_stat(density)),
        bins = 30, fill = "blue", alpha = 0.7
      ) +
      geom_density(color = "red") +
      xlab(variable) +
      ggtitle(paste("Гистограмма и плотность", variable))
    print(hist_plot)

    print(summary(data[[variable]]))
  }

  invisible(NULL)
}
# Histogram, density and summary for each of the three numeric columns.
univariate_analysis(data, c("V12", "V13", "V15"))
#' Box plot of one variable grouped by another
#'
#' Prints a box plot with `variable1` on the x axis and `variable2` on the
#' y axis.
#'
#' @param data A data frame containing both columns.
#' @param variable1 Name of the column mapped to x (a single string).
#' @param variable2 Name of the column mapped to y (a single string).
#' @return The plot object, invisibly (the value of `print()`).
#' @details NOTE(review): assumes ggplot2 is attached by the surrounding
#'   script -- confirm.
bivariate_analysis <- function(data, variable1, variable2) {
  # Fail early with a readable message instead of a deferred plotting error.
  missing_cols <- setdiff(c(variable1, variable2), names(data))
  if (length(missing_cols) > 0) {
    stop(
      "Columns not found in `data`: ",
      paste(missing_cols, collapse = ", "),
      call. = FALSE
    )
  }

  # `.data[[name]]` replaces the deprecated aes_string(); axis labels are set
  # explicitly so they still show the column names.
  box_plot <- ggplot(
    data,
    aes(x = .data[[variable1]], y = .data[[variable2]])
  ) +
    geom_boxplot() +
    labs(x = variable1, y = variable2) +
    ggtitle(paste("Боксплот", variable2, "по", variable1))

  print(box_plot)
}
# Distribution of age within each region.
bivariate_analysis(data, "region", "age")
#' Dodged bar charts of categorical variables split by a grouping variable
#'
#' For each name in `variables`, prints a bar chart of row counts with
#' `by_variable` on the x axis and bars filled (and dodged) by that variable.
#'
#' @param data A data frame containing all referenced columns.
#' @param variables Character vector of column names used for the fill.
#' @param by_variable Name of the column mapped to x (a single string).
#' @return `NULL`, invisibly. Called for its printing side effects.
#' @details NOTE(review): assumes ggplot2 is attached by the surrounding
#'   script -- confirm.
multiple_choice_analysis <- function(data, variables, by_variable) {
  # Fail early with a readable message instead of a deferred plotting error.
  missing_cols <- setdiff(c(by_variable, variables), names(data))
  if (length(missing_cols) > 0) {
    stop(
      "Columns not found in `data`: ",
      paste(missing_cols, collapse = ", "),
      call. = FALSE
    )
  }

  for (variable in variables) {
    # `.data[[name]]` replaces the deprecated aes_string(); the axis and
    # legend titles are set explicitly so they still show the column names.
    bar_plot <- ggplot(
      data,
      aes(x = .data[[by_variable]], fill = .data[[variable]])
    ) +
      geom_bar(position = "dodge") +
      labs(x = by_variable, fill = variable) +
      ggtitle(paste("Гистограмма", variable, "по", by_variable))
    print(bar_plot)
  }

  invisible(NULL)
}
# Answer counts for both multiple-choice columns, split by region.
multiple_choice_analysis(data, c("V14", "V16"), "region")