# Load the semicolon-delimited red-wine table into `Red_Wine`.
# NOTE(review): quoting is disabled (quote = ""), so any quote characters in
# the header row stay part of the field text -- presumably why the columns end
# up with names such as `X..pH..` and `X..quality...`. The rest of the script
# refers to the columns by those names, so do not change this in isolation.
Red_Wine <- read.csv(
  file = "~/Data Science Master Program/Spring 2022/Data Analytics I/red_wine.csv",
  sep = ";",
  quote = ""
)

# Print the positions of missing cells; an empty result means none are missing.
which(is.na(Red_Wine))
## integer(0)
##  X.fixed.acidity X..volatile.acidity.. X..citric.acid.. X..residual.sugar..
##  Min.   : 4.60   Min.   :0.1200        Min.   :0.000    Min.   : 0.900     
##  1st Qu.: 7.10   1st Qu.:0.3900        1st Qu.:0.090    1st Qu.: 1.900     
##  Median : 7.90   Median :0.5200        Median :0.260    Median : 2.200     
##  Mean   : 8.32   Mean   :0.5278        Mean   :0.271    Mean   : 2.539     
##  3rd Qu.: 9.20   3rd Qu.:0.6400        3rd Qu.:0.420    3rd Qu.: 2.600     
##  Max.   :15.90   Max.   :1.5800        Max.   :1.000    Max.   :15.500     
##  X..chlorides..    X..free.sulfur.dioxide.. X..total.sulfur.dioxide..
##  Min.   :0.01200   Min.   : 1.00            Min.   :  6.00           
##  1st Qu.:0.07000   1st Qu.: 7.00            1st Qu.: 22.00           
##  Median :0.07900   Median :14.00            Median : 38.00           
##  Mean   :0.08747   Mean   :15.87            Mean   : 46.47           
##  3rd Qu.:0.09000   3rd Qu.:21.00            3rd Qu.: 62.00           
##  Max.   :0.61100   Max.   :72.00            Max.   :289.00           
##   X..density..       X..pH..      X..sulphates..    X..alcohol..  
##  Min.   :0.9901   Min.   :2.740   Min.   :0.3300   Min.   : 8.40  
##  1st Qu.:0.9956   1st Qu.:3.210   1st Qu.:0.5500   1st Qu.: 9.50  
##  Median :0.9968   Median :3.310   Median :0.6200   Median :10.20  
##  Mean   :0.9967   Mean   :3.311   Mean   :0.6581   Mean   :10.42  
##  3rd Qu.:0.9978   3rd Qu.:3.400   3rd Qu.:0.7300   3rd Qu.:11.10  
##  Max.   :1.0037   Max.   :4.010   Max.   :2.0000   Max.   :14.90  
##  X..quality...  
##  Min.   :3.000  
##  1st Qu.:5.000  
##  Median :6.000  
##  Mean   :5.636  
##  3rd Qu.:6.000  
##  Max.   :8.000
library(Hmisc)
## Warning: package 'Hmisc' was built under R version 4.0.5
## Loading required package: lattice
## Loading required package: survival
## Loading required package: Formula
## Warning: package 'Formula' was built under R version 4.0.3
## Loading required package: ggplot2
## Warning: package 'ggplot2' was built under R version 4.0.5
## 
## Attaching package: 'Hmisc'
## The following objects are masked from 'package:base':
## 
##     format.pval, units
# Draw one histogram per column of the wine data on a single page, using the
# data-frame histogram routine from Hmisc (called with its defaults).
Hmisc::hist.data.frame(Red_Wine)

# Boxplots for the first four measurements, arranged on a 2 x 2 panel grid.
# The x-axis label is the only annotation on each panel, so it has to name the
# variable correctly ("Volatile Acidity" was previously misspelled).
par(mfrow = c(2, 2))
boxplot(Red_Wine$X.fixed.acidity, xlab = "Fixed Acidity")
boxplot(Red_Wine$X..volatile.acidity.., xlab = "Volatile Acidity")
boxplot(Red_Wine$X..citric.acid.., xlab = "Citric Acid")
boxplot(Red_Wine$X..residual.sugar.., xlab = "Residual Sugar")

# Boxplots for chlorides, the two sulfur-dioxide measurements and density,
# arranged on a fresh 2 x 2 panel grid.
# The x-axis label is the only annotation on each panel, so it has to name the
# variable correctly ("Total Sulfur Dioxide" was previously misspelled).
par(mfrow = c(2, 2))
boxplot(Red_Wine$X..chlorides.., xlab = "Chlorides")
boxplot(Red_Wine$X..free.sulfur.dioxide.., xlab = "Free Sulfur Dioxide")
boxplot(Red_Wine$X..total.sulfur.dioxide.., xlab = "Total Sulfur Dioxide")
boxplot(Red_Wine$X..density.., xlab = "Density")

# Boxplots for the last four columns on a fresh 2 x 2 panel grid.
# Columns and their axis labels are paired positionally; Map() walks both in
# step and draws one panel per pair, in the listed order.
par(mfrow = c(2, 2))
invisible(Map(
  function(values, label) boxplot(values, xlab = label),
  Red_Wine[c("X..pH..", "X..sulphates..", "X..alcohol..", "X..quality...")],
  c("pH", "Sulphates", "Alcohol", "Quality")
))

# Scatter plot of quality against pH.
# The boxplot sections earlier in the script leave the device in a 2 x 2
# layout; switch back to a single panel first so this plot fills the page
# instead of being squeezed into one quarter of it.
par(mfrow = c(1, 1))
plot(Red_Wine$X..pH.., Red_Wine$X..quality..., xlab = "pH", ylab = "Quality")