library(ggplot2)
## Warning: package 'ggplot2' was built under R version 3.3.3
library(dplyr)
## Warning: package 'dplyr' was built under R version 3.3.3
## 
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(readr)
## Warning: package 'readr' was built under R version 3.3.3
library(gridExtra)
## Warning: package 'gridExtra' was built under R version 3.3.3
## 
## Attaching package: 'gridExtra'
## The following object is masked from 'package:dplyr':
## 
##     combine
library(plotly)
## Warning: package 'plotly' was built under R version 3.3.3
## 
## Attaching package: 'plotly'
## The following object is masked from 'package:ggplot2':
## 
##     last_plot
## The following object is masked from 'package:stats':
## 
##     filter
## The following object is masked from 'package:graphics':
## 
##     layout
library(ggrepel)
## Warning: package 'ggrepel' was built under R version 3.3.3
# Load the raw diamonds data set from CSV; column types are guessed by readr.
Diamonds <- read_csv(
  file = "C:/RMIT/Data-Visualisation/R/Diamonds.csv"
)
## Parsed with column specification:
## cols(
##   carat = col_double(),
##   cut = col_character(),
##   color = col_character(),
##   clarity = col_character(),
##   depth = col_double(),
##   table = col_double(),
##   price = col_integer(),
##   x = col_double(),
##   y = col_double(),
##   z = col_double()
## )
# Encode the categorical columns as ordered factors, each running from the
# lowest grade to the highest, so legends, facets and axes sort by quality
# rather than alphabetically.
Diamonds$cut <- factor(
  Diamonds$cut,
  levels = c("Fair", "Good", "Very Good", "Premium", "Ideal"),
  ordered = TRUE
)
# Colour grades: J (worst) up to D (best).
Diamonds$color <- factor(
  Diamonds$color,
  levels = c("J", "I", "H", "G", "F", "E", "D"),
  ordered = TRUE
)
# Clarity grades, worst to best. Within each pair the "2" grade is the lower
# one (SI2 < SI1, VS2 < VS1, VVS2 < VVS1), so the levels are not in
# alphanumeric order.
Diamonds$clarity <- factor(
  Diamonds$clarity,
  levels = c("I1", "SI2", "SI1", "VS2", "VS1", "VVS2", "VVS1", "IF"),
  ordered = TRUE
)
# Scatter plot of carat against price, coloured by diamond colour grade, with
# one linear-regression line per colour grade (geom_smooth inherits the colour
# mapping). Written with ggplot() rather than qplot(), which is deprecated as
# of ggplot2 3.4.0.
ggplot(data = Diamonds, mapping = aes(x = price, y = carat, colour = color)) +
  # Constant alpha on the point layer only, to reduce overplotting.
  geom_point(alpha = 0.1) +
  geom_smooth(method = "lm") +
  ggtitle("Diamond price VS carat across diamond colour(S3613572)")

# Base plot: price by cut, filled by clarity. Kept in `p4` so it can be reused.
p4 <- ggplot(Diamonds, aes(x = cut, y = price, fill = clarity))

# One panel per clarity grade: box plots with the raw observations jittered
# faintly on top and the per-cut mean price marked by a red triangle.
# NOTE(review): `fun.y` is deprecated in ggplot2 >= 3.3.0 in favour of `fun`;
# kept as-is so the script still runs on the older ggplot2 it was written for.
p4 +
  geom_boxplot() +
  geom_jitter(alpha = 0.01) +
  stat_summary(fun.y = mean, geom = "point", shape = 17, colour = "red") +
  facet_wrap(~clarity) +
  labs(
    y = "Price",
    title = "Diamond price vs cut quality by clarity (S3613572) "
  ) +
  theme_minimal()