This is an R Markdown Notebook. When you execute code within the notebook, the results appear beneath the code.
Try executing this chunk by clicking the Run button within the chunk or by placing your cursor inside it and pressing Ctrl+Shift+Enter.
#PLot 1
library(ggplot2)
setwd("C:/Users/vhtran/Google Drive/these/diver_selection")
#png(file = "7.png", width = 800, height = 800)
library(readr)
mydata <- read.csv("C:/Users/vhtran/Google Drive/these/diver_selection/dataplot3.csv", sep=";")
ggplot(mydata, aes(x=generations, y=value, colour=group, group=group)) +
geom_line(aes(linetype=as.factor(group1),color=as.factor(unit)),size=2) +
geom_point(aes(fill = group,shape = group))+
labs(list(y="value", x="generation"),size=20) +
theme_bw() +
theme(panel.border = element_blank(), panel.grid.major = element_blank(),
panel.grid.minor = element_blank(), axis.line = element_line(colour = "black"))+
theme(axis.text.x=element_text(angle=0, hjust=1,size=16),axis.text.y=element_text(angle=0, hjust=1,size=16)) +
scale_fill_brewer(type="qual", palette=2) +
scale_color_brewer(type="qual", palette=2) +
theme(axis.title.x = element_text( size=18))+
theme(axis.title.y = element_text(size=18))+
#ggtitle("Heritability over time")+
theme(legend.title=element_blank())+
guides(color = guide_legend(nrow=3))+
theme(legend.text = element_text(colour="blue", size = 16))+
theme(legend.key.size = unit(2, 'lines'))+
theme(plot.title = element_text(lineheight=5, face="bold", color="black", size=20))

#dev.off()
#Plot with EBV per week for each line-generation
library(reshape2)
library(plyr)
mydata_1 <- read.table("C:/Users/vhtran/Google Drive/these/diver_selection/FULL4.dat",quote="\"")
names(mydata_1)[1]<-"animal"
names(mydata_1)[2]<-"identif"
names(mydata_1)[3]<-"bande"
names(mydata_1)[4]<-"sexe"
names(mydata_1)[5]<-"lignee"
names(mydata_1)[6]<-"gener"
names(mydata_1)[7]<-"loge"
names(mydata_1)[8]<-"eleve"
names(mydata_1)[9]<- "pds_dc"
names(mydata_1)[10]<-"pds_fc"
names(mydata_1)[11]<-"age"
names(mydata_1)[12]<-"poidsheb"
names(mydata_1)[13]<-"poidpre2"
names(mydata_1)[14]<-"age_dc"
names(mydata_1)[15]<-"temps"
names(mydata_1)[16]<-"consoheb"
names(mydata_1)[17]<-"ADGv"
names(mydata_1)[18]<-"FCRv"
names(mydata_1)[19]<-"ADGg"
names(mydata_1)[20]<-"FCRg"
names(mydata_1)[21]<-"semaine"
names(mydata_1)[22]<-"period"
#mydata$temps=as.numeric(levels(mydata$temps))[mydata$temps]
#number animal
my1=mydata_1[,1:8]
my2=aggregate(my1, list(my1$animal), FUN=head, 1)
my2=arrange(my2,animal)
########################################################################################
# EBV for one records (mean of record)/ 3986 animals
EBV_all <- read.table("EBV_all1309.txt", quote="\"")
test<-melt(EBV_all,id.vars = 'animal')
test1=arrange(test,animal)
test1$EBV=test1$value
EBV_all1=test1[,c("animal","EBV")]
N_animal=length(unique(EBV_all1$animal))
EBV_all1$temps=c(rep(4:13,N_animal))
critere = c("animal")
mydata_EBV=merge(EBV_all1,my2,by=c(critere))
#class the animal
mydata_EBV1=arrange(mydata_EBV,animal,temps)
#results from k-mean trajectory classification
#group A (generation G0-G2)
#group B (generation G3-G7 line HRFI)
#group C (generation G3-G7 line HRFI)
mydata_EBV1$gr=paste(mydata_EBV1$gener,mydata_EBV1$lignee,collapse =NULL)
mydata_EBV1$group =ifelse(mydata_EBV1$gener=="G0"|mydata_EBV1$gener=="G1"|mydata_EBV1$gener=="G2","C",
ifelse(mydata_EBV1$gr=="G3 +"|mydata_EBV1$gr=="G4 +"|mydata_EBV1$gr=="G5 +"|mydata_EBV1$gr=="G6 +"|
mydata_EBV1$gr=="G7 +","B","A"))
#
# library(dplyr)
#
# gd <- mydata_EBV1 %>%
# group_by(group,temps) %>%
# summarise(
# EBV.mean = mean(EBV),
#
# )
#
# fix(gd)
#
#
#
# gd$group1=ifelse(gd$group=="A","G0-G2",ifelse(gd$group=="B","G3-G7/HRFI","G3 to G7/LRFI"))
gd <- read.csv("C:/Users/vhtran/Google Drive/these/diver_selection/gd1.csv", sep=";")
gd$temps=gd$temps-3
library(ggplot2)
setwd("C:/Users/vhtran/Google Drive/these/diver_selection")
#png(file = "7.png", width = 800, height = 800)
diver_selec <- read.table("C:/Users/vhtran/Google Drive/these/Sujet2/out.txt", quote="\"")
mydata=diver_selec
mydata$min=(mydata$EBV.mean-mydata$EBV.sd)
mydata$max=(mydata$EBV.mean+mydata$EBV.sd)
mydata$group1=paste(mydata$gener,mydata$lignee,collapse =NULL)
group=c(rep("C",50),rep("A",10),rep("B",10),rep("A",10),rep("B",10),rep("A",10),rep("B",10),
rep("A",10),rep("B",10),rep("A",10),rep("B",10))
mydata=cbind(mydata,group)
mydata$temps=mydata$temps-3
mydata_plot=mydata[,c("group","temps","EBV.mean","group1")]
mydata_plot1 = rbind(mydata_plot,gd)
library(ggplot2)
#???pp=ggplot(mydata, aes(x=generations, y=value, colour=group, group=group)) +
pp1= ggplot(mydata_plot1, aes(x=temps, y=EBV.mean, colour=group, group=group1)) +
geom_line(aes(linetype=group1, size = group1)) +
scale_linetype_manual(values=c("solid","solid","solid","solid",rep(c("solid","solid"),2),
rep(c("dotted","twodash"),5))) +
scale_size_manual(values=c(3,3,3,rep(0.5,15)))+
# geom_line(data = gd) +
geom_point(aes(fill = group1,shape = group1), # Shape depends on cond
size = 4) + # Large points
scale_shape_manual(values=c(1,1,1,1,5,6,7,8,rep(c(9,9,10,10,11,11,12,12,13,13),1))) +
scale_x_continuous(breaks=1:10) +
labs(list(y="EBV (kg feed/kg gain)", x="Week"),size=24) +
theme_bw() +
theme(panel.border = element_blank(), panel.grid.major = element_blank(),
panel.grid.minor = element_blank(), axis.line = element_line(colour = "black"))+
theme(axis.text.x=element_text(angle=0, hjust=1,size=24),axis.text.y=element_text(angle=0, hjust=1,size=24)) +
scale_fill_brewer(type="qual", palette=2) +
scale_color_brewer(type="qual", palette=2) +
theme(axis.title.x = element_text( size=24))+
theme(axis.title.y = element_text(size=24))+
#ggtitle("Heritability over time")+
theme(legend.title=element_blank())+
guides(color = guide_legend(nrow=3))+
theme(legend.text = element_text(colour="blue", size = 20))+
theme(legend.key.size = unit(2, 'lines'))+
theme(plot.title = element_text(lineheight=5, face="bold", color="black", size=20))
library(RColorBrewer)
myColors <- c("blue","red","green")
names(myColors) <- levels(mydata$group)
# myline=c("dotdash","solid", "dotted","dotdash","solid", "dotted")
# names(myline) <- levels(mydata$group)
#
colScale <- scale_colour_manual(name = "group",values = myColors)
# lineScale <- scale_colour_manual(name = "group",values = myline)
#png(file="EBV_gene_week1.png",width=1800,height=1200,res=100)
pp1+colScale
Scale for 'colour' is already present. Adding another scale for 'colour', which will replace the existing
scale.

#dev.off()
# CUREVES SBV FOR GENERATIONS
library(ggplot2)
mydata<- read.csv("C:/Users/vhtran/Google Drive/these/diver_selection/dataplot3.csv", sep=";")
mydata=mydata[1:32,]
pp1= ggplot(mydata, aes(x=generations, y=value, colour=group, group=group)) +
geom_line(aes(linetype=group), # Line type depends on cond
size = 1) +
#geom_point(aes(fill = group,shape = group1),
geom_point(aes(fill = group,shape = group),size = 3) +
# Shape depends on cond
# Large points
scale_linetype_manual(values=c("dotted","dotted","solid", "solid")) +
scale_shape_manual(values=c(8,8,1,1)) +
#geom_line(data=dataplot, aes(x=generations, y=value, group=group,col=as.factor(group1),linetype=as.factor(group), scale_fill_manual(values=c("blue","red"))))
#geom_line(aes(linetype=as.factor(group),color=as.factor(group)),size=2) +
#geom_errorbar(aes(ymin=min, ymax=max, colour=group,linetype=group), width=.4,
# position=position_dodge(0.05))+
# scale_colour_manual(name="Error Bars",values=cols, guide = guide_legend(fill = NULL,colour = NULL)) +
# scale_fill_manual(values=cols, guide="none") +
#scale_x_continuous(breaks=1:10) +
labs(list(y=" kg feed/kg gain ", x="Week"),size=18) +
theme_bw() +
theme(panel.border = element_blank(), panel.grid.major = element_blank(),
panel.grid.minor = element_blank(), axis.line = element_line(colour = "black"))+
theme(axis.text.x=element_text(angle=0, hjust=1,size=18),axis.text.y=element_text(angle=0, hjust=1,size=18)) +
scale_fill_brewer(type="qual", palette=2) +
scale_color_brewer(type="qual", palette=2) +
theme(axis.title.x = element_text( size=18))+
theme(axis.title.y = element_text(size=18))+
#ggtitle("Heritability over time")+
theme(legend.title=element_blank())+
guides(color = guide_legend(nrow=3))+
theme(legend.text = element_text(colour="blue", size = 16))+
theme(legend.key.size = unit(2,'lines'))+
theme(plot.title = element_text(lineheight=5, face="bold", color="black", size=16))
library(RColorBrewer)
myColors <- c("red","blue","red","blue","red","blue")
names(myColors) <- levels(mydata$group)
myline=c("dotdash","solid", "dotted","dotdash","solid", "dotted")
names(myline) <- levels(mydata$group)
colScale <- scale_colour_manual(name = "group",values = myColors)
lineScale <- scale_colour_manual(name = "group",values = myline)
#png(file="EBV_genkk.png",width=1000,height=800,res=100)
pp1+colScale
Scale for 'colour' is already present. Adding another scale for 'colour', which will replace the existing
scale.

#dev.off()
#+lineScale
---
title: "R Notebook"
output: html_notebook
---

This is an [R Markdown](http://rmarkdown.rstudio.com) Notebook. When you execute code within the notebook, the results appear beneath the code. 

Try executing this chunk by clicking the *Run* button within the chunk or by placing your cursor inside it and pressing *Ctrl+Shift+Enter*. 


```{r, echo=TRUE}




#PLot 1

library(ggplot2)

setwd("C:/Users/vhtran/Google Drive/these/diver_selection")
#png(file = "7.png", width = 800, height = 800)

library(readr)
mydata <- read.csv("C:/Users/vhtran/Google Drive/these/diver_selection/dataplot3.csv", sep=";")

ggplot(mydata, aes(x=generations, y=value, colour=group, group=group)) +
  
 
  geom_line(aes(linetype=as.factor(group1),color=as.factor(unit)),size=2) +
  
 
  
  geom_point(aes(fill = group,shape = group))+
  
  
  labs(list(y="value", x="generation"),size=20) +
  theme_bw() + 
  theme(panel.border = element_blank(), panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(), axis.line = element_line(colour = "black"))+
  
  theme(axis.text.x=element_text(angle=0, hjust=1,size=16),axis.text.y=element_text(angle=0, hjust=1,size=16)) +
  scale_fill_brewer(type="qual", palette=2) +
  scale_color_brewer(type="qual", palette=2) +
  theme(axis.title.x = element_text( size=18))+
  theme(axis.title.y = element_text(size=18))+
  
  #ggtitle("Heritability over time")+
  theme(legend.title=element_blank())+
  guides(color = guide_legend(nrow=3))+
  theme(legend.text = element_text(colour="blue", size = 16))+  
  theme(legend.key.size = unit(2, 'lines'))+
  theme(plot.title = element_text(lineheight=5, face="bold", color="black", size=20))

#dev.off()


```






```{r}
#Plot with EBV per week for each line-generation




 library(reshape2)
library(plyr)





mydata_1 <- read.table("C:/Users/vhtran/Google Drive/these/diver_selection/FULL4.dat",quote="\"") 
names(mydata_1)[1]<-"animal"  
names(mydata_1)[2]<-"identif" 
names(mydata_1)[3]<-"bande"  
names(mydata_1)[4]<-"sexe"  
names(mydata_1)[5]<-"lignee"  
names(mydata_1)[6]<-"gener"  
names(mydata_1)[7]<-"loge"  
names(mydata_1)[8]<-"eleve"  
names(mydata_1)[9]<- "pds_dc"  
names(mydata_1)[10]<-"pds_fc"  
names(mydata_1)[11]<-"age"  
names(mydata_1)[12]<-"poidsheb"  
names(mydata_1)[13]<-"poidpre2"  
names(mydata_1)[14]<-"age_dc"  
names(mydata_1)[15]<-"temps"  
names(mydata_1)[16]<-"consoheb"     
names(mydata_1)[17]<-"ADGv"  
names(mydata_1)[18]<-"FCRv"  
names(mydata_1)[19]<-"ADGg"  
names(mydata_1)[20]<-"FCRg"  
names(mydata_1)[21]<-"semaine"  
names(mydata_1)[22]<-"period"  




#mydata$temps=as.numeric(levels(mydata$temps))[mydata$temps]
#number animal

my1=mydata_1[,1:8]
my2=aggregate(my1, list(my1$animal), FUN=head, 1)
my2=arrange(my2,animal)










########################################################################################
# EBV for one records (mean of record)/ 3986 animals

EBV_all <- read.table("EBV_all1309.txt", quote="\"")



test<-melt(EBV_all,id.vars = 'animal')

test1=arrange(test,animal)
test1$EBV=test1$value

EBV_all1=test1[,c("animal","EBV")]

N_animal=length(unique(EBV_all1$animal))

EBV_all1$temps=c(rep(4:13,N_animal))


critere = c("animal")  


mydata_EBV=merge(EBV_all1,my2,by=c(critere))  
#class the animal
mydata_EBV1=arrange(mydata_EBV,animal,temps)  




#results from k-mean trajectory classification


#group A (generation G0-G2)
#group B (generation G3-G7 line HRFI)
#group C (generation G3-G7 line HRFI)

mydata_EBV1$gr=paste(mydata_EBV1$gener,mydata_EBV1$lignee,collapse =NULL)


mydata_EBV1$group =ifelse(mydata_EBV1$gener=="G0"|mydata_EBV1$gener=="G1"|mydata_EBV1$gener=="G2","C",
ifelse(mydata_EBV1$gr=="G3 +"|mydata_EBV1$gr=="G4 +"|mydata_EBV1$gr=="G5 +"|mydata_EBV1$gr=="G6 +"|
         mydata_EBV1$gr=="G7 +","B","A"))

# 
# library(dplyr)
# 
# gd <- mydata_EBV1 %>% 
#         group_by(group,temps) %>% 
#         summarise(
#           EBV.mean = mean(EBV),
#         
#         )
# 
# fix(gd)
# 
# 
# 
# gd$group1=ifelse(gd$group=="A","G0-G2",ifelse(gd$group=="B","G3-G7/HRFI","G3 to G7/LRFI"))


gd <- read.csv("C:/Users/vhtran/Google Drive/these/diver_selection/gd1.csv", sep=";")

gd$temps=gd$temps-3


library(ggplot2)

setwd("C:/Users/vhtran/Google Drive/these/diver_selection")
#png(file = "7.png", width = 800, height = 800)


diver_selec <- read.table("C:/Users/vhtran/Google Drive/these/Sujet2/out.txt", quote="\"")

mydata=diver_selec 
mydata$min=(mydata$EBV.mean-mydata$EBV.sd)
mydata$max=(mydata$EBV.mean+mydata$EBV.sd)

mydata$group1=paste(mydata$gener,mydata$lignee,collapse =NULL)

group=c(rep("C",50),rep("A",10),rep("B",10),rep("A",10),rep("B",10),rep("A",10),rep("B",10),
        rep("A",10),rep("B",10),rep("A",10),rep("B",10))
mydata=cbind(mydata,group)


mydata$temps=mydata$temps-3


mydata_plot=mydata[,c("group","temps","EBV.mean","group1")]

mydata_plot1 = rbind(mydata_plot,gd)

library(ggplot2)


#???pp=ggplot(mydata, aes(x=generations, y=value, colour=group, group=group)) +
  
pp1=  ggplot(mydata_plot1, aes(x=temps, y=EBV.mean, colour=group, group=group1)) +
  
  
 
geom_line(aes(linetype=group1, size = group1)) +  
  
   scale_linetype_manual(values=c("solid","solid","solid","solid",rep(c("solid","solid"),2),
                                  rep(c("dotted","twodash"),5))) +
   scale_size_manual(values=c(3,3,3,rep(0.5,15)))+
  
  
 # geom_line(data = gd) +
  
  geom_point(aes(fill = group1,shape = group1),   # Shape depends on cond
             size = 4) +        # Large points
  
  scale_shape_manual(values=c(1,1,1,1,5,6,7,8,rep(c(9,9,10,10,11,11,12,12,13,13),1))) +
 
  
 
 scale_x_continuous(breaks=1:10) +

labs(list(y="EBV (kg feed/kg gain)", x="Week"),size=24) +
  theme_bw() + 
  theme(panel.border = element_blank(), panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(), axis.line = element_line(colour = "black"))+
  
  theme(axis.text.x=element_text(angle=0, hjust=1,size=24),axis.text.y=element_text(angle=0, hjust=1,size=24)) +
  scale_fill_brewer(type="qual", palette=2) +
  scale_color_brewer(type="qual", palette=2) +
  theme(axis.title.x = element_text( size=24))+
  theme(axis.title.y = element_text(size=24))+
  
  #ggtitle("Heritability over time")+
  theme(legend.title=element_blank())+
  guides(color = guide_legend(nrow=3))+
  theme(legend.text = element_text(colour="blue", size = 20))+  
  theme(legend.key.size = unit(2, 'lines'))+
  theme(plot.title = element_text(lineheight=5, face="bold", color="black", size=20))


library(RColorBrewer)

myColors <- c("blue","red","green")
names(myColors) <- levels(mydata$group)

# myline=c("dotdash","solid", "dotted","dotdash","solid", "dotted")
# names(myline) <- levels(mydata$group)
# 

colScale <- scale_colour_manual(name = "group",values = myColors)
# lineScale <- scale_colour_manual(name = "group",values = myline)



#png(file="EBV_gene_week1.png",width=1800,height=1200,res=100)

pp1+colScale 


#dev.off()




















```

```{r}
# CUREVES SBV FOR GENERATIONS

library(ggplot2)

mydata<- read.csv("C:/Users/vhtran/Google Drive/these/diver_selection/dataplot3.csv", sep=";")
mydata=mydata[1:32,]

pp1=  ggplot(mydata, aes(x=generations, y=value, colour=group, group=group)) + 
  
  
  

geom_line(aes(linetype=group), # Line type depends on cond
          size = 1) +
  
  #geom_point(aes(fill = group,shape = group1),  
             geom_point(aes(fill = group,shape = group),size = 3) +
             
             # Shape depends on cond
                     # Large points
  
  
  
  scale_linetype_manual(values=c("dotted","dotted","solid", "solid")) +
  scale_shape_manual(values=c(8,8,1,1)) +
  
  #geom_line(data=dataplot, aes(x=generations, y=value, group=group,col=as.factor(group1),linetype=as.factor(group), scale_fill_manual(values=c("blue","red"))))
  
  #geom_line(aes(linetype=as.factor(group),color=as.factor(group)),size=2) +
  
  #geom_errorbar(aes(ymin=min, ymax=max, colour=group,linetype=group), width=.4,
  #  position=position_dodge(0.05))+
  
  
  
  



# scale_colour_manual(name="Error Bars",values=cols, guide = guide_legend(fill = NULL,colour = NULL)) + 
# scale_fill_manual(values=cols, guide="none") +


 #scale_x_continuous(breaks=1:10) +
  
  labs(list(y=" kg feed/kg gain ", x="Week"),size=18) +
  theme_bw() + 
  theme(panel.border = element_blank(), panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(), axis.line = element_line(colour = "black"))+
  
  theme(axis.text.x=element_text(angle=0, hjust=1,size=18),axis.text.y=element_text(angle=0, hjust=1,size=18)) +
  scale_fill_brewer(type="qual", palette=2) +
  scale_color_brewer(type="qual", palette=2) +
  theme(axis.title.x = element_text( size=18))+
  theme(axis.title.y = element_text(size=18))+
  
  #ggtitle("Heritability over time")+
  theme(legend.title=element_blank())+
  guides(color = guide_legend(nrow=3))+
  theme(legend.text = element_text(colour="blue", size = 16))+  
  theme(legend.key.size = unit(2,'lines'))+
  theme(plot.title = element_text(lineheight=5, face="bold", color="black", size=16))












library(RColorBrewer)

myColors <- c("red","blue","red","blue","red","blue")
names(myColors) <- levels(mydata$group)

myline=c("dotdash","solid", "dotted","dotdash","solid", "dotted")
names(myline) <- levels(mydata$group)


colScale <- scale_colour_manual(name = "group",values = myColors)

lineScale <- scale_colour_manual(name = "group",values = myline)



#png(file="EBV_genkk.png",width=1000,height=800,res=100)

pp1+colScale 

#dev.off()
#+lineScale


```

```{r, eval=FALSE, include=FALSE}

#TRAJECTORY CLASSIFICATION


#set wd
setwd("C:/Users/vhtran/Google Drive/these/diver_selection")
#save data
#save.image(file="18012017.RData")
#remove object
#rm(list=ls())
######################################################################################
#required packages
library(corrplot)
library(psych)
library(plyr)
library(stringr)
library(kml)
library(kml3d)
library(reshape)
library(SDMTools)
library(fmsb)
library(dplyr)
library(lsa)
library(readr)

# repet2 <- read.table("C:/Users/vhtran/Google Drive/these/data/repet2.dat")
#                     
# 
# 
# 
# 
# repet3=repet2[,c(1,6)]
# repet3=arrange(repet3,X1)

########################################################################

mydata <- read.table("C:/Users/vhtran/Google Drive/these/diver_selection/FULL4.dat",quote="\"") 
names(mydata)[1]<-"animal"  
names(mydata)[2]<-"identif" 
names(mydata)[3]<-"bande"  
names(mydata)[4]<-"sexe"  
names(mydata)[5]<-"lignee"  
names(mydata)[6]<-"gener"  
names(mydata)[7]<-"loge"  
names(mydata)[8]<-"eleve"  
names(mydata)[9]<- "pds_dc"  
names(mydata)[10]<-"pds_fc"  
names(mydata)[11]<-"age"  
names(mydata)[12]<-"poidsheb"  
names(mydata)[13]<-"poidpre2"  
names(mydata)[14]<-"age_dc"  
names(mydata)[15]<-"temps"  
names(mydata)[16]<-"consoheb"     
names(mydata)[17]<-"ADGv"  
names(mydata)[18]<-"FCRv"  
names(mydata)[19]<-"ADGg"  
names(mydata)[20]<-"FCRg"  
names(mydata)[21]<-"semaine"  
names(mydata)[22]<-"period"  




#mydata$temps=as.numeric(levels(mydata$temps))[mydata$temps]
#number animal

my1=mydata[,1:8]
my2=aggregate(my1, list(my1$animal), FUN=head, 1)
my2=arrange(my2,animal)



my2=arrange(my2,animal)






########################################################################################
# EBV for one records (mean of record)/ 3986 animals

EBV_all <- read.table("EBV_all1309.txt", quote="\"")



test<-melt(EBV_all,id.vars = 'animal')

test1=arrange(test,animal)
test1$EBV=test1$value

EBV_all1=test1[,c("animal","EBV")]

N_animal=length(unique(EBV_all1$animal))

EBV_all1$temps=c(rep(4:13,N_animal))






EBV_to <- read.table("C:/Users/vhtran/Google Drive/these/sujet2/total", quote="\"")



EBV_to1=EBV_to[2:4] # delete the first col


names(EBV_to1)[1]<-"animal"  
names(EBV_to1)[2]<-"EBVto" 
names(EBV_to1)[3]<-"SE_EBVto" 

EBV_to2=arrange(EBV_to1,animal)










###############################
#G <- read.table("C:/Users/vhtran/Desktop/G.txt",quote="\"")
#matrix G of RROP
G <- read.table("G_RROP1309",quote="\"") # old is G1
G=as.matrix(G)
#G=cov2cor(G) # transform Cov matrix to correlation matrix
###############################
#matrix G of SAD
G1 <- read.table("G_sad1309.txt",quote="\"") #old is G
G1=as.matrix(G1)
#G1=cov2cor(G1) # transform Cov matrix to correlation matrix
R=eigen(G, only.values = FALSE, EISPACK = FALSE)
R1=eigen(G1, only.values = FALSE, EISPACK = FALSE)
R$values



A=as.matrix(R1$values)
B=as.matrix(R1$vectors)



V=(R$vectors)
V1=(R1$vectors)
###############################

# Ka=matrix(c(0.1627E-01,  0.2445E-02 ,  0.2489E-03,
#             0.2445E-02,  0.2303E-01, -0.1748E-03,
#             0.2489E-03, -0.1748E-03 ,  0.3318E-02),3,3)

Ka=matrix(c(0.1652E-01, 0.1905E-02, -0.6185E-03,
0.1905E-02,  0.2197E-01, -0.2209E-02  ,
-0.6185E-03 ,-0.2209E-02 , 0.3119E-02),3,3)

Ka=t(Ka)
#Ka=cov2cor(Ka)
Kaei=eigen(Ka, only.values = F, EISPACK = FALSE)
Kaei

#eigence vector explain 54,38 % of the variation


G_RROP <- read.table("RROP_sln1309", quote="\"") # old G_RROP
a=as.character(G_RROP$V2)
G_RROP$tPhi = substring(a,1,1) 
G_RROP$animal=substring(a,3)
GOP=G_RROP[,c("animal","V3","tPhi")]
GOP=arrange(GOP,animal,tPhi)
GOP$ei1=rep(Kaei$vectors[,1],3986)
GOP$ei2=rep(Kaei$vectors[,2],3986) # add -
GOP$ei3=rep(Kaei$vectors[,3],3986)
mydata5=GOP
mydata6=arrange(mydata5,animal,tPhi)  
mydata7=ddply(mydata6, "animal", head, 3)
mydata7=arrange(mydata7,animal,tPhi)  


mydata7$E1=mydata7$V3*mydata7$ei1
mydata7$E2=mydata7$V3*mydata7$ei2
mydata7$E3=mydata7$V3*mydata7$ei3







#write.table(mydata7, "eigenK.xls", col=NA, sep="\t",dec=".")  #write data to a file
mydata8=ddply(mydata7,~animal,summarise,sum=sum(E1),mean=mean(E1),sd=sd(E1))
mydata9=ddply(mydata7,~animal,summarise,sum=sum(E2),mean=mean(E2),sd=sd(E2))
mydata10=ddply(mydata7,~animal,summarise,sum=sum(E3),mean=mean(E3),sd=sd(E3))

cor(mydata8$sum,mydata10$sum)





###############################

#file sln SAD
#read data SAD.sln , !!!attention drive
G_sad <- read.table("sln_sad1309", quote="\"") #old is G_sad
View(G_sad)
names(G_sad)<-c("V1","code","value","SE")
a = G_sad$code
elems <- unlist( strsplit(as.character(a)  , "\\." ) )
m <- as.data.frame(matrix( elems , ncol = 2 , byrow = TRUE ))
Gsad=cbind(G_sad,m)
names(Gsad)<-c("V1","code","value","SE","temps","animal")
Gsad$temps=as.numeric(levels(Gsad$temps))[Gsad$temps]
Gsad=arrange(Gsad,animal,temps)
N_animal=length(unique(Gsad$animal))  #number animal from SAD.sln


cor(Gsad$value,EBV_all1$EBV,method="spearman")


Gsad$e1=-rep(V1[,1],N_animal) # added -
Gsad$e2=-rep(V1[,2],N_animal)   #eigen G RROP/breeding values # added -
Gsad$e3=rep(V1[,3],N_animal)
Gsad$e4=rep(V1[,4],N_animal)

Gsad$E1=(Gsad$e1)*(Gsad$value) 
Gsad$E2=(Gsad$e2)*(Gsad$value) 
Gsad$E3=(Gsad$e3)*(Gsad$value)
Gsad$E4=(Gsad$e4)*(Gsad$value)


EBV_Gsad=ddply(Gsad,~animal,summarise,sum=sum(value),mean=mean(value),sd=sd(value))
EBV_Gsad1=ddply(Gsad,~animal,summarise,sum=sum(E1),mean=mean(E1),sd=sd(E1))
EBV_Gsad2=ddply(Gsad,~animal,summarise,sum=sum(E2),mean=mean(E2),sd=sd(E2))
EBV_Gsad3=ddply(Gsad,~animal,summarise,sum=sum(E3),mean=mean(E3),sd=sd(E3))
EBV_Gsad4=ddply(Gsad,~animal,summarise,sum=sum(E4),mean=mean(E4),sd=sd(E4))


################################################################################




EBV_all1$e1=-rep(V[,1],N_animal) 
EBV_all1$e2=-rep(V[,2],N_animal)   #eigen G RROP/breeding values
EBV_all1$e3=rep(V[,3],N_animal)
EBV_all1$e9=rep(V[,9],N_animal)
EBV_all1$e10=rep(V[,10],N_animal)


EBV_all1$in1_all=(EBV_all1$e1)*(EBV_all1$EBV)
EBV_all1$in2_all=(EBV_all1$e2)*(EBV_all1$EBV)
EBV_all1$in3_all=(EBV_all1$e3)*(EBV_all1$EBV)
EBV_all1$in9_all=(EBV_all1$e9)*(EBV_all1$EBV)
EBV_all1$in10_all=(EBV_all1$e10)*(EBV_all1$EBV)



Gsad_take=Gsad[,c("value","E1","E2","E3","E4")]


DF=data.frame(EBV_all1,Gsad_take)


EBV_all_single1=ddply(EBV_all1,~animal,summarise,sum=sum(EBV),mean=mean(EBV),sd=sd(EBV))
EBV_all_single2=ddply(EBV_all1,~animal,summarise,sum=sum(in1_all),mean=mean(in1_all),sd=sd(in1_all))
EBV_all_single3=ddply(EBV_all1,~animal,summarise,sum=sum(in2_all),mean=mean(in2_all),sd=sd(in2_all))
EBV_all_single4=ddply(EBV_all1,~animal,summarise,sum=sum(in3_all),mean=mean(in3_all),sd=sd(in3_all))
#EBV_all_single5=ddply(EBV_all1,~animal,summarise,sum=sum(in4_all),mean=mean(in4_all),sd=sd(in4_all))
EBV_all_single5=ddply(EBV_all1,~animal,summarise,sum=sum(in9_all),mean=mean(in9_all),sd=sd(in9_all))
EBV_all_single6=ddply(EBV_all1,~animal,summarise,sum=sum(in10_all),mean=mean(in10_all),sd=sd(in10_all))



EBV_to2$EBV_OP=EBV_all_single1$sum
EBV_to2$in1_all=EBV_all_single2$sum
EBV_to2$in2_all=EBV_all_single3$sum
EBV_to2$in3_all=EBV_all_single4$sum
EBV_to2$in9_all=EBV_all_single5$sum
EBV_to2$in10_all=EBV_all_single6$sum


EBV_to2$EBV_SAD=EBV_Gsad$sum
EBV_to2$E1=EBV_Gsad1$sum
EBV_to2$E2=EBV_Gsad2$sum
EBV_to2$E3=EBV_Gsad3$sum
EBV_to2$E4=EBV_Gsad4$sum
EBV_to2$e1_all=mydata8$sum
EBV_to2$e2_all=mydata9$sum
EBV_to2$e3_all=mydata10$sum

names(EBV_to2)



#write.table(EBV_to2, "EBVperiod.txt", col=NA, sep="\t",dec=".")  #write data to a file

critere = c(names(my2),names(EBV_to2))  
critere=critere[duplicated(critere)]     #critere pour merge 2 tableaux#  
mydata0=arrange(my2,animal,identif)  
#merge data to obtain 1 line/animal for SAD
mydata1=merge(mydata0,EBV_to2,by=c(critere))  
#class the animal
mydata1=arrange(mydata1,animal)  


animal=(rep(mydata1$animal,10))
identif=(rep(mydata1$animal,10))
DF_1=data.frame(animal,identif)
DF_2=arrange(DF_1,animal)


DF_2$temps=c(rep(4:13,1186))
DF_2=arrange(DF_2,animal,temps)



DF_3=merge(DF_2,DF,by=c("animal","temps"))  

DF0=arrange(DF_3,animal,temps)




EBV_to3=mydata1[,c("animal", "E1",      "E2"  , "EBV_SAD","e1_all","e2_all","EBV_OP",
                   "in1_all",  "in2_all","EBVto")]        

names(EBV_to3) <- c("animal", "SBV_SAD1", "SBV_SAD2", "sEBV_SAD","SBV_RRK1","SBV_RRK2","sEBV_RR","SBV_RR1","SBV_RR2","cEBV")
# 



corr.test(EBV_to3[,2:10])








######################################################################################

#classification DF

DF1=DF0[,c("animal","temps","EBV")]
DF2=reshape(DF1, varying = NULL, timevar = "temps", idvar = "animal", direction="wide", sep = "")



#predict the missing data using Linear interpolation/matrix
DF3=imputation(as.matrix(DF2[, 2:11]), method = "linearInterpol")

#prepared data for kml

cldDF3 <- cld(DF3, timeInData = 1:10)
#cld1

#kml with 3 groups, show only trajectories

kml(cldDF3, nbRedraw = 20,nbClusters=3, toPlot = "both")

kml(cldDF3)

kml(cldDF3, 3, parAlgo = parALGO(distance = function(x, y)
  cor(x, y), saveFreq = 10))

choice(cldDF3)

DF2$grEBV <- getClusters(cldDF3, 3)


#######################################################

DF4=DF0[,c("animal","temps","value")]
DF5=reshape(DF4, varying = NULL, timevar = "temps", idvar = "animal", direction="wide", sep = "")



#predict the missing data using Linear interpolation/matrix
DF6=imputation(as.matrix(DF5[, 2:11]), method = "linearInterpol")

#prepared data for kml

cldDF6 <- cld(DF6, timeInData = 1:10)
#cld1

#kml with 3 groups, show only trajectories

kml(cldDF6, nbRedraw = 20,nbClusters=3, toPlot = "traj")






kml(cldDF6)

kml(cldDF6, 3, parAlgo = parALGO(distance = function(x, y)
  cor(x, y), saveFreq = 10))

choice(cldDF6)

DF2$grEBV_SAD <- getClusters(cldDF6, 3)


###############################################################################


data_class=cbind(DF2,EBV_to3)
data_class$EBV=with(data_class,EBV4+EBV5+EBV6+EBV7+EBV8+EBV9+EBV10+EBV11+EBV12+EBV13)



data_class1 =cbind(my2,data_class)



```










