# ---- Load sheet 3 and reshape it to one row per run ----
# NOTE(review): the hard-coded setwd() ties this script to one machine; it is
# kept because the relative workbook path below depends on it. Prefer running
# the script from the project directory and deleting this line.
setwd("C:/Users/stg43/Charleston Data Analytics")

# Attaching xlsx also loads its required packages rJava and xlsxjars.
library(xlsx)
library(reshape)

# Third worksheet of the workbook; the first row holds the column names.
sheet3 <- read.xlsx("MeetupDataChallenge-1.xlsx", sheetIndex = 3, header = TRUE)
sheet3 <- transform(sheet3, Run.Number = as.integer(Run.Number))

# Long form keyed by run and component, then one column per Run.Number.
sheet3m <- melt(sheet3, id.vars = c("Run.Number", "Component"))
sheet3c <- cast(sheet3m, ... ~ Run.Number)
sheet3c <- as.data.frame(sheet3c)

# Transpose so that each run becomes a row (this yields a matrix).
sheet3f <- t(sheet3c)
# Drop the second row -- presumably the melted `variable` labels; TODO confirm.
sheet3f <- sheet3f[-2, , drop = FALSE]
# The first row carries the values used as column names; promote it to the
# header and then remove it from the data.
storenames <- sheet3f[1, ]
colnames(sheet3f) <- storenames
sheet3f <- sheet3f[-1, , drop = FALSE]
sheet3f <- as.data.frame(sheet3f)

# Number the runs 1..n by row position. Derived from the data instead of a
# fixed 1:548 so the script does not fail when the sheet has a different
# number of runs.
# NOTE(review): this assumes rows are ordered by run number with no gaps.
x <- seq_len(nrow(sheet3f))
sheet3f$run <- x
# ---- Load sheet 1, join it to the per-run table, and clean ----
# First worksheet; its first column is renamed to "run" to act as the join key.
sheet1 <- read.xlsx("MeetupDataChallenge-1.xlsx", sheetIndex = 1, header = TRUE)
names(sheet1)[1] <- "run"
sheet1_3 <- merge(sheet1, sheet3f, by = "run")

# Drop rows whose Final.Yield.2 exceeds 150. which() ignores NA comparisons,
# so rows with a missing yield are kept.
# Guard the empty case: x[-integer(0), ] selects *no* rows, so negative
# indexing with an empty `toremove` would silently wipe the whole table.
toremove <- which(sheet1_3$Final.Yield.2 > 150)
if (length(toremove) > 0) {
  sap_clean <- sheet1_3[-toremove, ]
} else {
  sap_clean <- sheet1_3
}

# Convert columns 5..35 to factors and keep columns 1..4 as they are; any
# column beyond 35 is dropped by the cbind() below.
# NOTE(review): the 1:4 / 5:35 split is positional -- confirm it still matches
# the merged layout if either worksheet changes.
factorColumns <- lapply(sap_clean[, 5:35], as.factor)
# as.data.frame() on a list passes the names through make.names(); later code
# may rely on these sanitised (dotted) column names, so keep this step.
factorColumns <- as.data.frame(factorColumns)
sap_clean <- cbind(sap_clean[1:4], factorColumns)
library(ggplot2)

# Final.Yield.2 against run: size-3 points with geom_smooth()'s default
# smoother layered on top.
ggplot(data = sap_clean, mapping = aes(x = run, y = Final.Yield.2)) +
  geom_point(size = 3) +
  geom_smooth()

library(gridExtra)

# Boxplots of Final.Yield.2 for four factors, arranged in two columns.
# Outliers are drawn with point shape 3.
a <- ggplot(data = sap_clean, mapping = aes(x = Cassette.3, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3)
b <- ggplot(data = sap_clean, mapping = aes(x = Detergent, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3)
c <- ggplot(data = sap_clean, mapping = aes(x = Stabilizer.A, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3)
d <- ggplot(data = sap_clean, mapping = aes(x = WFI.Source, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3)
grid.arrange(a, b, c, d, ncol = 2)

# Second panel: boxplots of Final.Yield.2 for five more factors, again in two
# columns. The plot variables a..d are reassigned here and e is introduced.
a <- ggplot(data = sap_clean, mapping = aes(x = Salt.A, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3)
b <- ggplot(data = sap_clean, mapping = aes(x = Salt.B, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3)
c <- ggplot(data = sap_clean, mapping = aes(x = Cassette.1, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3)
d <- ggplot(data = sap_clean, mapping = aes(x = Buffer.Salt.4, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3)
e <- ggplot(data = sap_clean, mapping = aes(x = Buffer.Salt.5, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3)
grid.arrange(a, b, c, d, e, ncol = 2)

# One full-size boxplot per factor with the individual observations overlaid.
# The points are jittered horizontally (width 0.2); the jitter is random, so
# point positions differ between runs of the script.
ggplot(data = sap_clean, mapping = aes(x = Salt.A, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3) +
  geom_point(position = position_jitter(width = 0.2))

ggplot(data = sap_clean, mapping = aes(x = Salt.B, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3) +
  geom_point(position = position_jitter(width = 0.2))

ggplot(data = sap_clean, mapping = aes(x = Cassette.1, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3) +
  geom_point(position = position_jitter(width = 0.2))

ggplot(data = sap_clean, mapping = aes(x = Buffer.Salt.4, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3) +
  geom_point(position = position_jitter(width = 0.2))

ggplot(data = sap_clean, mapping = aes(x = Buffer.Salt.5, y = Final.Yield.2)) +
  geom_boxplot(outlier.shape = 3) +
  geom_point(position = position_jitter(width = 0.2))

# Final.Yield.2 against run, with points coloured by a factor level:
# first by Cassette.1, then by Buffer.Salt.5.
ggplot(
  data = sap_clean,
  mapping = aes(x = run, y = Final.Yield.2, colour = Cassette.1)
) +
  geom_point(size = 3.5)

ggplot(
  data = sap_clean,
  mapping = aes(x = run, y = Final.Yield.2, colour = Buffer.Salt.5)
) +
  geom_point(size = 3.5)
