if(!require(tidyverse)){
install.packages("tidyverse")
}
## Loading required package: tidyverse
## ── Attaching packages ────────────────────────────────── tidyverse 1.2.1 ──
## ✔ ggplot2 2.2.1 ✔ purrr 0.2.4
## ✔ tibble 1.4.2 ✔ dplyr 0.7.4
## ✔ tidyr 0.8.0 ✔ stringr 1.3.0
## ✔ readr 1.1.1 ✔ forcats 0.3.0
## ── Conflicts ───────────────────────────────────── tidyverse_conflicts() ──
## ✖ dplyr::filter() masks stats::filter()
## ✖ dplyr::lag() masks stats::lag()
if(!require(SNPRelate)){
source("https://bioconductor.org/biocLite.R")
biocLite("SNPRelate")
}
## Loading required package: SNPRelate
## Loading required package: gdsfmt
## SNPRelate -- supported by Streaming SIMD Extensions 2 (SSE2)
set.seed(1680) # for reproducibility
if(!require(ISLR)) {
install.packages("ISLR")
}
## Loading required package: ISLR
if(!require(cluster)) {
install.packages("cluster")
}
## Loading required package: cluster
if(!require(Rtsne)) {
install.packages("Rtsne")
}
## Loading required package: Rtsne
library(cluster) # for gower similarity and pam
library(Rtsne) # for t-SNE plot
library(tidyverse)
library(SNPRelate)
library(reshape2)
##
## Attaching package: 'reshape2'
## The following object is masked from 'package:tidyr':
##
## smiths
set.seed(1680) # for reproducibility
first_analysis/populations.snps.vcf.filtered.for.non-presence.presumed.0.samplesOnly.txt is a modified populations.snps.vcf file
# cat first info columns
# get rid of "single" in the col names (sample names)
cat populations.snps.vcf | sed 's/.single//g' | tail -n +16 | cut -f10- | tr ":" "\t" | sed 's#0/1#0.5#g' | sed 's#0/0#0#g' | sed 's#1/1#1#g' > genotypes_and_coverage.01.txt # # convert genotypes from 0/1 format to 0.5 format
cat populations.snps.vcf | sed 's/.single//g' | tail -n +15 | cut -f10- | head -1 > sampleNames.txt
# read in bash-splitted file
genotypes_and_coverage<-read.delim("genotypes_and_coverage.01.txt", header = F, sep = '\t')
sample_names<-read.delim("sampleNames.txt", sep = "\t", header = TRUE, nrows=2)
names<-names(sample_names)
genotype_names_in_split <- paste(names, ".1.geno", sep="") # genotype names in split
coverage_names_in_split <- paste(names, ".2.cover", sep="") # coverage names in split
support_reads_names<- paste(names, ".3.support", sep="") # coverage supporting reads names in split
#bind 3 vectors
names_split <- sort(as.vector(rbind(genotype_names_in_split,coverage_names_in_split,support_reads_names))) # collate
names(genotypes_and_coverage)<-names_split
coverage_cols<-grepl("2.cover", names(genotypes_and_coverage))
genotype_cols<-grepl("1.geno", names(genotypes_and_coverage))
coverage<-genotypes_and_coverage[coverage_cols]
genotype<-genotypes_and_coverage[genotype_cols]
#genotype<- read.delim("genotype.01.txt", sep = "\t", header = TRUE)
t.coverage<-t(as.matrix(coverage))
t.genotype<-t(as.matrix(genotype))
Clustering - - coverage and genotype
# Applying Ward Hierarchical Clustering
d_coverage <- dist(t.coverage, method="euclidean")
ward_fit_coverage <- hclust(d_coverage, method="ward")
## The "ward" method has been renamed to "ward.D"; note new "ward.D2"
g4_ward_coverage <- cutree(ward_fit_coverage, k = c(4))
g8_ward_coverage <- cutree(ward_fit_coverage, k = c(8))
#using Gower via daisy
gower_dist_genotype <- daisy(t.genotype,
metric = "gower",
type = list(logratio = 3))
## Warning in daisy(t.genotype, metric = "gower", type = list(logratio = 3)):
## binary variable(s) 2, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19,
## 20, 21, 22, 23, 24, 25, 26 treated as interval scaled
gower_mat_genotype <- as.matrix(gower_dist_genotype)
tsne_obj_genotype <- Rtsne(gower_dist_genotype, is_distance = TRUE)
pam_fit_genotype <- pam(gower_dist_genotype, diss = TRUE, k = 3)
tsne_data_genotype <- tsne_obj_genotype$Y %>%
data.frame() %>%
setNames(c("X", "Y")) %>%
mutate(cluster = factor(pam_fit_genotype$clustering),
name = row.names(t.genotype))
# Gower clusters for coverage:
gower_dist_coverage <- daisy(t.coverage,
metric = "gower",
type = list(logratio = 3))
gower_mat_coverage <- as.matrix(gower_dist_coverage)
tsne_obj_coverage <- Rtsne(gower_dist_coverage, is_distance = TRUE)
pam_fit_coverage <- pam(gower_dist_coverage, diss = TRUE, k = 3)
tsne_data_coverage <- tsne_obj_coverage$Y %>%
data.frame() %>%
setNames(c("X", "Y")) %>%
mutate(cluster = factor(pam_fit_coverage$clustering),
name = row.names(t.coverage))
Writing data out
write.table(tsne_data_genotype, file="genotype_clusters.csv", quote = FALSE, sep = ",")
write.table(g8_ward_coverage, file="coverage_groups.csv", quote = FALSE, sep = ",")
#write.table()
Plots: Ward clustered dendrogram for coverage:
plot(ward_fit_coverage)
Genotype clusters:
ggplot(aes(x = X, y = Y), data = tsne_data_genotype) +
geom_point(aes(color = cluster))
Samples in genotype clusters:
tsne_data_genotype
## X Y cluster name
## 1 -9.0275969 -6.24022771 1 P1_A01.1.geno
## 2 -8.5733970 -4.96771651 1 P1_A02.1.geno
## 3 2.9268395 -0.15391249 2 P1_A03.1.geno
## 4 3.6549049 2.75365209 2 P1_A04.1.geno
## 5 2.5982498 -0.83326148 2 P1_A05.1.geno
## 6 4.8746777 2.46090491 2 P1_A06.1.geno
## 7 4.1394616 1.04698684 2 P1_A07.1.geno
## 8 -3.6982637 -0.84295930 3 P1_A08.1.geno
## 9 -3.6982637 -0.84295930 3 P1_A09.1.geno
## 10 -8.5804480 -4.79813955 1 P1_A10.1.geno
## 11 3.1491796 3.92601472 2 P1_A11.1.geno
## 12 -3.6905131 -1.06522763 3 P1_A12.1.geno
## 13 -9.0256390 -6.23994384 1 P1_B01.1.geno
## 14 0.9942077 2.20661849 2 P1_B02.1.geno
## 15 1.3313714 -0.58053000 2 P1_B03.1.geno
## 16 -3.6905887 -1.06546154 3 P1_B04.1.geno
## 17 4.1349555 1.54191831 2 P1_B05.1.geno
## 18 1.2295602 2.70242443 2 P1_B06.1.geno
## 19 4.0070159 2.19271063 2 P1_B07.1.geno
## 20 1.5648114 0.37355042 2 P1_B08.1.geno
## 21 3.7217895 3.82947266 2 P1_B09.1.geno
## 22 3.7217895 3.82947266 2 P1_B10.1.geno
## 23 3.3431274 3.07648052 2 P1_B11.1.geno
## 24 3.9702056 2.27716388 2 P1_B12.1.geno
## 25 3.1376562 -0.95601103 2 P1_C01.1.geno
## 26 -9.0266415 -6.24052710 1 P1_C02.1.geno
## 27 0.7649760 3.37527338 2 P1_C03.1.geno
## 28 0.9872588 2.17177043 2 P1_C04.1.geno
## 29 2.8293319 -1.01990655 2 P1_C05.1.geno
## 30 -9.0260767 -6.24097859 1 P1_C06.1.geno
## 31 3.9788116 2.26280689 2 P1_C07.1.geno
## 32 -3.6660938 -0.89296383 3 P1_C08.1.geno
## 33 -9.0280735 -6.24084313 1 P1_C09.1.geno
## 34 2.3685632 1.91336634 2 P1_C10.1.geno
## 35 1.2263342 3.69217034 2 P1_C11.1.geno
## 36 1.3373933 2.80618602 2 P1_C12.1.geno
## 37 -9.0273296 -6.24062574 1 P1_D01.1.geno
## 38 -9.0275712 -6.24024982 1 P1_D02.1.geno
## 39 3.1114720 -0.16090742 2 P1_D03.1.geno
## 40 2.7847014 3.16177606 2 P1_D04.1.geno
## 41 2.5525417 3.98594002 2 P1_D05.1.geno
## 42 0.8795029 1.35354054 2 P1_D06.1.geno
## 43 2.1650138 3.96485462 2 P1_D07.1.geno
## 44 -9.3112805 -6.53371156 1 P1_D08.1.geno
## 45 0.9232555 -0.07103359 2 P1_D09.1.geno
## 46 -9.0273519 -6.24033613 1 P1_D11.1.geno
## 47 -8.5801521 -4.79810013 1 P1_D12.1.geno
## 48 4.6184305 -0.08891616 2 P1_E01.1.geno
## 49 2.2158735 -1.09501306 2 P1_E02.1.geno
## 50 1.5689882 2.95338811 2 P1_E03.1.geno
## 51 4.2704512 2.87709581 2 P1_E04.1.geno
## 52 1.7296677 -0.88897380 2 P1_E05.1.geno
## 53 -8.5762420 -4.96768769 1 P1_E06.1.geno
## 54 3.3055005 -0.12261126 2 P1_E07.1.geno
## 55 0.7499287 0.55361308 2 P1_E08.1.geno
## 56 -8.5735173 -4.96691769 1 P1_E09.1.geno
## 57 3.7310858 -0.76954903 2 P1_E11.1.geno
## 58 1.0489636 -0.16696390 2 P1_E12.1.geno
## 59 1.8737307 3.18954825 2 P1_F01.1.geno
## 60 -8.0880411 -6.24614431 1 P1_F02.1.geno
## 61 1.3146887 -0.40600607 2 P1_F03.1.geno
## 62 2.3346109 -0.07658695 2 P1_F04.1.geno
## 63 0.4630021 2.87624960 2 P1_F05.1.geno
## 64 2.1188688 3.14858559 2 P1_F06.1.geno
## 65 2.5579782 -0.14518007 2 P1_F07.1.geno
## 66 -7.8278075 -5.54217765 1 P1_F08.1.geno
## 67 2.0677735 1.58309762 2 P1_F09.1.geno
## 68 4.1397925 1.55229791 2 P1_F10.1.geno
## 69 2.7224988 -0.26913181 2 P1_F11.1.geno
## 70 0.3131316 1.94944681 2 P1_F12.1.geno
## 71 -8.9373169 -6.42994699 1 P1_G02.1.geno
## 72 4.3219183 3.47435494 2 P1_G03.1.geno
## 73 4.0429056 2.10404789 2 P1_G04.1.geno
## 74 -9.0247932 -6.23955247 1 P1_G05.1.geno
## 75 -3.9515518 -1.89563858 3 P1_G06.1.geno
## 76 4.3575570 3.48407411 2 P1_G07.1.geno
## 77 3.7314779 -0.76938854 2 P1_G08.1.geno
## 78 1.8774086 0.10978213 2 P1_G09.1.geno
## 79 4.3300604 0.87076909 2 P1_G10.1.geno
## 80 -9.0277630 -6.24046365 1 P1_G11.1.geno
## 81 4.3154816 -0.38037783 2 P1_G12.1.geno
## 82 1.6369589 0.33722983 2 P1_H01.1.geno
## 83 4.0202323 2.15109055 2 P1_H02.1.geno
## 84 2.0255979 0.01666963 2 P1_H03.1.geno
## 85 4.1487730 1.51988551 2 P1_H04.1.geno
## 86 4.6797385 2.59496588 2 P1_H05.1.geno
## 87 5.0076614 2.33669893 2 P1_H06.1.geno
## 88 -9.0270988 -6.24036010 1 P1_H07.1.geno
## 89 2.5639875 1.95336536 2 P1_H08.1.geno
## 90 3.6552628 2.75425953 2 P1_H09.1.geno
## 91 4.1497818 1.53310848 2 P1_H10.1.geno
## 92 3.2088069 -0.14482005 2 P1_H11.1.geno
## 93 2.7217290 3.17275003 2 P1_H12.1.geno
## 94 4.7029228 0.09445591 2 P2_A01.1.geno
## 95 2.6144339 3.12398529 2 P2_A02.1.geno
## 96 3.7762785 -0.01382083 2 P2_A03.1.geno
## 97 2.7475669 3.12306632 2 P2_A04.1.geno
## 98 -8.6287420 -4.76269251 1 P2_A05.1.geno
## 99 1.4802740 3.85705300 2 P2_A07.1.geno
## 100 0.7416349 1.77484588 2 P2_A08.1.geno
## 101 5.0896634 1.55863219 2 P2_A09.1.geno
## 102 2.0079887 3.15781604 2 P2_A10.1.geno
## 103 1.2648344 0.66580522 2 P2_A11.1.geno
## 104 2.5279215 -0.09189322 2 P2_A12.1.geno
## 105 -8.5728273 -4.96809034 1 P2_B01.1.geno
## 106 1.4263310 2.79706384 2 P2_B02.1.geno
## 107 0.8375271 1.49463950 2 P2_B06.1.geno
## 108 -3.6905474 -1.06551905 3 P2_B07.1.geno
## 109 1.0686268 2.30991037 2 P2_B08.1.geno
## 110 5.1579755 0.91296430 2 P2_B09.1.geno
## 111 2.9717290 1.44468930 2 P2_B10.1.geno
## 112 2.9240073 1.80293333 2 P2_B11.1.geno
## 113 3.1477670 1.52029401 2 P2_B12.1.geno
## 114 1.4096462 0.51150246 2 P2_C02.1.geno
## 115 -0.7491210 0.37500260 2 P2_C03.1.geno
## 116 -1.0776133 0.24301716 3 P2_C05.1.geno
## 117 -0.8751639 0.32482837 2 P2_C07.1.geno
## 118 2.9696054 1.74972021 2 P2_C08.1.geno
## 119 2.8801045 1.85067619 2 P2_C09.1.geno
## 120 3.1079887 1.57243056 2 P2_C12.1.geno
## 121 3.0500855 1.61074713 2 P2_D03.1.geno
## 122 3.0240369 1.67103113 2 P2_D04.1.geno
## 123 2.8801044 1.85067633 2 P2_D05.1.geno
## 124 -9.0270405 -6.24018859 1 P2_D06.1.geno
## 125 -9.0281172 -6.24009170 1 P2_D07.1.geno
## 126 -9.0274075 -6.23958213 1 P2_D08.1.geno
## 127 3.0500855 1.61074713 2 P2_D09.1.geno
## 128 -9.0264096 -6.24011622 1 P2_E01.1.geno
## 129 2.2744632 1.83348594 2 P2_E02.1.geno
## 130 2.8801044 1.85067633 2 P2_E03.1.geno
## 131 -3.6905787 -1.06555795 3 P2_E05.1.geno
## 132 0.3703816 1.41633192 2 P2_E06.1.geno
## 133 -9.3140770 -6.57432986 1 P2_E09.1.geno
## 134 2.8586769 1.62368343 2 P2_E11.1.geno
## 135 2.7507631 1.91377530 2 P2_E12.1.geno
## 136 -9.0282985 -6.24013499 1 P2_F02.1.geno
## 137 2.8083848 1.89093691 2 P2_F03.1.geno
## 138 -3.6905787 -1.06555798 3 P2_F04.1.geno
## 139 2.5510461 1.95719568 2 P2_F05.1.geno
## 140 2.8759021 1.28507992 2 P2_F06.1.geno
## 141 2.5239082 1.94794736 2 P2_F08.1.geno
## 142 2.8069071 1.22124777 2 P2_F09.1.geno
## 143 2.8759021 1.28507992 2 P2_G03.1.geno
## 144 4.1341917 2.96918304 2 P2_G05.1.geno
## 145 2.3072956 1.65591711 2 P2_G06.1.geno
## 146 -9.0279052 -6.23964932 1 P2_G09.1.geno
## 147 2.4155908 1.15556826 2 P2_H01.1.geno
## 148 2.4097797 1.15128897 2 P2_H02.1.geno
## 149 2.3056422 1.65361846 2 P2_H04.1.geno
## 150 2.3225646 1.52098758 2 P2_H05.1.geno
## 151 2.5658402 1.94999778 2 P2_H06.1.geno
## 152 2.3685634 1.91336642 2 P2_H07.1.geno
## 153 2.7899187 1.20341811 2 P2_H08.1.geno
## 154 2.0691820 1.57483365 2 P2_H09.1.geno
## 155 -8.5735094 -4.96780277 1 P3_A01.1.geno
## 156 -7.9330737 -4.25241156 3 P3_A02.1.geno
## 157 2.8016030 1.21507996 2 P3_A03.1.geno
## 158 -9.0277258 -6.24036628 1 P3_A04.1.geno
## 159 2.7916814 1.20607991 2 P3_A05.1.geno
## 160 2.0611301 1.53768271 2 P3_A06.1.geno
## 161 2.0617646 1.57769428 2 P3_A07.1.geno
## 162 2.7963708 1.21031253 2 P3_A08.1.geno
## 163 2.5196929 1.94290661 2 P3_A09.1.geno
## 164 -9.0327126 -6.24055727 1 P3_A10.1.geno
## 165 2.4872640 1.93737460 2 P3_A11.1.geno
## 166 2.0604123 1.51662385 2 P3_A12.1.geno
## 167 2.7900810 1.20355151 2 P3_B01.1.geno
## 168 2.7912845 1.20574883 2 P3_B02.1.geno
## 169 -9.0279131 -6.24066640 1 P3_B03.1.geno
## 170 2.3780718 1.18039530 2 P3_B04.1.geno
## 171 2.3802405 1.17681375 2 P3_B05.1.geno
## 172 2.3011277 1.65867205 2 P3_B06.1.geno
## 173 2.3940047 1.16786437 2 P3_B07.1.geno
## 174 2.3041390 1.67022258 2 P3_B08.1.geno
## 175 2.3828779 1.17491536 2 P3_B09.1.geno
## 176 2.7911646 1.20579015 2 P3_B10.1.geno
## 177 2.3984600 1.16567284 2 P3_B11.1.geno
## 178 2.1028964 1.58480396 2 P3_B12.1.geno
## 179 -8.5746671 -4.96724385 1 P3_C01.1.geno
## 180 -8.5736302 -4.96765507 1 P3_C02.1.geno
## 181 2.3778296 1.17853690 2 P3_C03.1.geno
## 182 2.7897206 1.20324511 2 P3_C04.1.geno
## 183 2.3726923 1.18570770 2 P3_C05.1.geno
## 184 -9.0273011 -6.24008951 1 P3_C06.1.geno
## 185 2.3110630 1.70095964 2 P3_C07.1.geno
## 186 2.4934746 1.93886644 2 P3_C08.1.geno
## 187 2.7885075 1.20212452 2 P3_C09.1.geno
## 188 2.5017396 1.93889452 2 P3_C10.1.geno
## 189 2.4025124 1.16264517 2 P3_D01.1.geno
## 190 2.3752404 1.18019721 2 P3_D02.1.geno
## 191 2.7883642 1.20219369 2 P3_D03.1.geno
## 192 2.4101002 1.15785168 2 P3_D05.1.geno
## 193 2.3044205 1.64603358 2 P3_D06.1.geno
## 194 2.7881881 1.20193354 2 P3_D07.1.geno
## 195 2.3750859 1.90939091 2 P3_D08.1.geno
## 196 2.0677735 1.58309763 2 P3_D09.1.geno
## 197 2.3788172 1.17765871 2 P3_D11.1.geno
## 198 2.0605935 1.51482458 2 P3_D12.1.geno
## 199 0.4989277 0.88597621 2 P3_E02.1.geno
## 200 2.0677735 1.58309763 2 P3_E03.1.geno
## 201 -8.4019993 -6.27575317 1 P3_E04.1.geno
## 202 2.0558517 1.49582135 2 P3_E05.1.geno
## 203 2.3773102 1.17891834 2 P3_E06.1.geno
## 204 2.7904144 1.20513854 2 P3_E07.1.geno
## 205 -7.6445891 -5.43026810 1 P3_F01.1.geno
## 206 -9.0278578 -6.24037685 1 P3_F04.1.geno
## 207 2.7900810 1.20355151 2 P3_F05.1.geno
## 208 2.7921867 1.20792339 2 P3_F08.1.geno
## 209 2.3072956 1.65591711 2 P3_F12.1.geno
## 210 2.7967705 1.21113663 2 P3_G02.1.geno
## 211 2.7938769 1.20784580 2 P3_G03.1.geno
## 212 2.3685412 1.91335675 2 P3_G04.1.geno
## 213 2.8202966 1.88060830 2 P3_G05.1.geno
## 214 2.3782135 1.18147777 2 P3_G06.1.geno
## 215 2.9057950 1.82422912 2 P3_H05.1.geno
## 216 -8.5743118 -4.96743109 1 P4_A01.1.geno
## 217 -3.6906417 -1.06553534 3 P4_A02.1.geno
## 218 3.0500855 1.61074713 2 P4_A03.1.geno
## 219 -8.5745503 -4.96773118 1 P4_A07.1.geno
## 220 -0.6263837 1.62647795 1 P4_A08.1.geno
## 221 -8.5745524 -4.96785098 1 P4_A09.1.geno
## 222 2.9626916 1.75981460 2 P4_A10.1.geno
## 223 -3.9513876 -1.89613851 3 P4_A11.1.geno
## 224 2.8415762 1.86822298 2 P4_A12.1.geno
## 225 -3.6905950 -1.06553352 3 P4_B01.1.geno
## 226 -8.5739543 -4.96756009 1 P4_B02.1.geno
## 227 -8.5734954 -4.96735406 1 P4_B03.1.geno
## 228 -3.6905765 -1.06559958 3 P4_B05.1.geno
## 229 3.0500855 1.61074713 2 P4_B06.1.geno
## 230 2.8586769 1.62368343 2 P4_B07.1.geno
## 231 3.0500855 1.61074713 2 P4_B08.1.geno
## 232 2.9595015 1.76359907 2 P4_B09.1.geno
## 233 2.3056435 1.65362293 2 P4_B11.1.geno
## 234 4.9702665 1.10859804 2 P4_B12.1.geno
## 235 1.7749188 0.17313048 2 P4_C03.1.geno
## 236 -9.0275579 -6.24041697 1 P4_C04.1.geno
## 237 0.8787586 1.35096512 2 P4_C05.1.geno
## 238 -0.7491210 0.37500260 2 P4_C06.1.geno
## 239 -3.6904313 -1.06555768 3 P4_C07.1.geno
## 240 0.7552745 0.64838149 2 P4_C08.1.geno
## 241 5.0236349 0.64998647 2 P4_C10.1.geno
## 242 -3.6904160 -1.06571476 3 P4_C11.1.geno
## 243 3.5771857 -0.08810084 2 P4_D01.1.geno
## 244 1.9019138 -0.66659642 2 P4_D02.1.geno
## 245 1.2091785 0.83097429 2 P4_D03.1.geno
## 246 -8.5751149 -4.96763257 1 P4_D04.1.geno
## 247 2.8020909 3.16361634 2 P4_D05.1.geno
## 248 -3.6660946 -0.89296444 3 P4_D06.1.geno
## 249 2.0569492 0.01530520 2 P4_D07.1.geno
## 250 -3.6905787 -1.06555795 3 P4_D08.1.geno
## 251 4.2385135 0.87073660 2 P4_D09.1.geno
## 252 -3.6905787 -1.06555795 3 P4_D11.1.geno
## 253 -9.0269296 -6.24022086 1 P4_D12.1.geno
## 254 4.2385175 0.87084449 2 P4_E01.1.geno
## 255 -8.5735148 -4.96710751 1 P4_E02.1.geno
## 256 -3.6906666 -1.06556599 3 P4_E03.1.geno
## 257 -3.5817761 -1.67893252 3 P4_E04.1.geno
## 258 1.8618528 3.09287285 2 P4_E05.1.geno
## 259 -3.8635711 -1.98807280 3 P4_E06.1.geno
## 260 -3.6906665 -1.06556600 3 P4_E07.1.geno
## 261 1.0247974 2.43430961 2 P4_E08.1.geno
## 262 -3.6886429 -1.06615687 3 P4_E09.1.geno
## 263 1.3668937 2.75336571 2 P4_E11.1.geno
## 264 1.8162512 3.18445138 2 P4_E12.1.geno
## 265 1.2054666 0.80991627 2 P4_F01.1.geno
## 266 -3.6905787 -1.06555798 3 P4_F02.1.geno
## 267 -3.9513908 -1.89646382 3 P4_F03.1.geno
## 268 5.1095536 1.72668421 2 P4_F04.1.geno
## 269 0.3165625 2.43321308 2 P4_F05.1.geno
## 270 -8.5740386 -4.96785630 1 P4_F06.1.geno
## 271 -3.5817834 -1.67893295 3 P4_F07.1.geno
## 272 0.8090803 0.48165025 2 P4_F08.1.geno
## 273 2.2746997 3.91637675 2 P4_F09.1.geno
## 274 0.9803535 1.39106430 2 P4_F10.1.geno
## 275 4.4735213 1.72886380 2 P4_F12.1.geno
## 276 3.9009319 0.41285273 2 P4_G01.1.geno
## 277 0.9462675 2.07131684 2 P4_G07.1.geno
## 278 3.0255228 3.98400414 2 P4_G09.1.geno
## 279 0.8333512 1.49901766 2 P4_G11.1.geno
## 280 3.6503445 2.79681279 2 P4_H01.1.geno
## 281 3.3376689 3.07181055 2 P4_H06.1.geno
## 282 3.3376689 3.07181055 2 P4_H07.1.geno
## 283 3.9008000 0.41264478 2 P4_H09.1.geno
## 284 3.9007959 0.41263820 2 P4_H10.1.geno
## 285 3.9007959 0.41263820 2 P4_H11.1.geno
## 286 2.3768538 1.91415786 2 P4_H12.1.geno
Coverage Gower clusters:
ggplot(aes(x = X, y = Y), data = tsne_data_coverage) +
geom_point(aes(color = cluster))
Samples and coverage clusters:
tsne_data_coverage
## X Y cluster name
## 1 2.321135808 -2.7608904 1 P1_A01.2.cover
## 2 3.526319455 -3.6701296 1 P1_A02.2.cover
## 3 -0.304493267 8.0936922 2 P1_A03.2.cover
## 4 1.906156900 5.5102565 2 P1_A04.2.cover
## 5 2.204881296 6.4435140 2 P1_A05.2.cover
## 6 1.823113474 7.0934428 2 P1_A06.2.cover
## 7 0.906990417 -1.1471230 2 P1_A07.2.cover
## 8 3.501086312 -0.6044907 2 P1_A08.2.cover
## 9 -1.372189768 -7.2863522 2 P1_A09.2.cover
## 10 3.970247812 -2.4124510 2 P1_A10.2.cover
## 11 -0.511700897 -7.0082746 2 P1_A11.2.cover
## 12 3.157686623 -0.7141103 2 P1_A12.2.cover
## 13 0.678915099 -6.4289555 3 P1_B01.2.cover
## 14 -1.647758862 1.9869954 2 P1_B02.2.cover
## 15 -1.064203919 -7.0420491 2 P1_B03.2.cover
## 16 0.666344473 -8.0640674 3 P1_B04.2.cover
## 17 -2.636081774 -0.4598821 2 P1_B05.2.cover
## 18 1.099813180 6.6060573 2 P1_B06.2.cover
## 19 -1.085868884 6.9687945 2 P1_B07.2.cover
## 20 -1.189898668 7.5906013 2 P1_B08.2.cover
## 21 0.345613796 1.8874242 2 P1_B09.2.cover
## 22 -7.758437585 -1.1134272 2 P1_B10.2.cover
## 23 -1.112694860 1.7951857 2 P1_B11.2.cover
## 24 0.860834285 2.1879836 2 P1_B12.2.cover
## 25 -0.684918926 4.7954035 2 P1_C01.2.cover
## 26 0.803717781 -6.4293236 1 P1_C02.2.cover
## 27 1.954666864 0.2104642 2 P1_C03.2.cover
## 28 -1.905704210 7.4314508 2 P1_C04.2.cover
## 29 -0.841211762 -7.1821594 2 P1_C05.2.cover
## 30 3.027152973 -6.0494523 1 P1_C06.2.cover
## 31 -2.613197469 -0.4682609 2 P1_C07.2.cover
## 32 2.161462284 -8.2635364 3 P1_C08.2.cover
## 33 0.688867832 -2.7057058 2 P1_C09.2.cover
## 34 -1.754615187 6.6926100 2 P1_C10.2.cover
## 35 1.323288290 2.5018145 2 P1_C11.2.cover
## 36 1.947532133 0.2111850 2 P1_C12.2.cover
## 37 2.765247062 -6.6289434 1 P1_D01.2.cover
## 38 1.890069002 -2.8121306 2 P1_D02.2.cover
## 39 -2.621614422 -0.4681622 2 P1_D03.2.cover
## 40 1.859462967 2.8269876 2 P1_D04.2.cover
## 41 -2.162372636 2.2923544 2 P1_D05.2.cover
## 42 0.789700931 -5.9769077 2 P1_D06.2.cover
## 43 -0.813057620 -6.2270641 2 P1_D07.2.cover
## 44 0.688899961 -2.7057331 2 P1_D08.2.cover
## 45 -1.299532410 -6.9379705 2 P1_D09.2.cover
## 46 0.599022729 -2.6036229 2 P1_D11.2.cover
## 47 1.797900303 -6.5485186 1 P1_D12.2.cover
## 48 -0.320646172 3.0565131 2 P1_E01.2.cover
## 49 -1.111558461 4.5327546 2 P1_E02.2.cover
## 50 0.854715380 -2.8478152 2 P1_E03.2.cover
## 51 0.599022729 -2.6036229 2 P1_E04.2.cover
## 52 -0.338006653 5.7762591 2 P1_E05.2.cover
## 53 4.311341910 -3.9429290 1 P1_E06.2.cover
## 54 4.526726526 -0.7538916 2 P1_E07.2.cover
## 55 4.865761003 -1.0268600 2 P1_E08.2.cover
## 56 3.597382874 -2.5319809 2 P1_E09.2.cover
## 57 -1.308150440 5.1810599 2 P1_E11.2.cover
## 58 0.863284223 4.8814355 2 P1_E12.2.cover
## 59 -1.006530100 5.5466317 2 P1_F01.2.cover
## 60 3.141676748 -6.4841634 1 P1_F02.2.cover
## 61 1.795794781 -9.1072089 3 P1_F03.2.cover
## 62 0.563255522 -2.5399608 2 P1_F04.2.cover
## 63 -0.056163904 5.6481575 2 P1_F05.2.cover
## 64 -1.389072780 5.1080784 2 P1_F06.2.cover
## 65 0.925757684 4.4894900 2 P1_F07.2.cover
## 66 3.769908747 -3.7954007 1 P1_F08.2.cover
## 67 -1.215468523 5.2520286 2 P1_F09.2.cover
## 68 4.531526866 -0.7067873 2 P1_F10.2.cover
## 69 -1.255071615 4.5983421 2 P1_F11.2.cover
## 70 2.037420041 0.0821602 2 P1_F12.2.cover
## 71 3.968131305 -3.3494962 1 P1_G02.2.cover
## 72 -0.347948225 -8.3738984 3 P1_G03.2.cover
## 73 0.549447213 4.3421509 2 P1_G04.2.cover
## 74 0.751212210 -6.4843162 3 P1_G05.2.cover
## 75 3.267288067 -3.4840352 1 P1_G06.2.cover
## 76 -7.571272298 -1.2803511 2 P1_G07.2.cover
## 77 0.951168239 -1.5347746 2 P1_G08.2.cover
## 78 1.406855043 -8.8355559 3 P1_G09.2.cover
## 79 -1.641001597 4.4388198 2 P1_G10.2.cover
## 80 0.627137759 -6.5477911 3 P1_G11.2.cover
## 81 0.401116174 5.3317578 2 P1_G12.2.cover
## 82 -1.680189184 3.8088080 2 P1_H01.2.cover
## 83 0.009611071 4.5765861 2 P1_H02.2.cover
## 84 4.517078707 -1.7442236 2 P1_H03.2.cover
## 85 0.282804513 4.0629617 2 P1_H04.2.cover
## 86 0.730885544 3.6037739 2 P1_H05.2.cover
## 87 -0.769916005 4.0922723 2 P1_H06.2.cover
## 88 0.782921799 -6.0694511 1 P1_H07.2.cover
## 89 -0.841211762 -7.1821594 2 P1_H08.2.cover
## 90 -0.836597798 4.5839672 2 P1_H09.2.cover
## 91 -2.640185111 -0.4674640 2 P1_H10.2.cover
## 92 -2.638516129 -0.4641206 2 P1_H11.2.cover
## 93 -1.643830100 3.8821907 2 P1_H12.2.cover
## 94 0.395565499 3.4065407 2 P2_A01.2.cover
## 95 -0.274238889 1.5541598 2 P2_A02.2.cover
## 96 -1.443627030 3.6075169 2 P2_A03.2.cover
## 97 1.958488106 0.2131681 2 P2_A04.2.cover
## 98 4.258177623 -3.9274588 1 P2_A05.2.cover
## 99 -0.904909633 3.1199899 2 P2_A07.2.cover
## 100 -2.638439516 -0.4641671 2 P2_A08.2.cover
## 101 -1.067269315 3.9479990 2 P2_A09.2.cover
## 102 -0.531273646 4.0355613 2 P2_A10.2.cover
## 103 -0.466861931 4.0096596 2 P2_A11.2.cover
## 104 -0.928262608 3.1582377 2 P2_A12.2.cover
## 105 1.713819332 -6.8217929 3 P2_B01.2.cover
## 106 -2.633156532 -0.4678006 2 P2_B02.2.cover
## 107 -0.553028293 4.8060244 2 P2_B06.2.cover
## 108 4.696143570 -1.8131258 2 P2_B07.2.cover
## 109 0.424948184 3.3810940 2 P2_B08.2.cover
## 110 0.645120691 -2.6572138 2 P2_B09.2.cover
## 111 -0.180675524 2.9331727 2 P2_B10.2.cover
## 112 -1.405984658 3.4936793 2 P2_B11.2.cover
## 113 -0.290145711 4.2041360 2 P2_B12.2.cover
## 114 0.262470099 4.3386082 2 P2_C02.2.cover
## 115 -7.831665261 -1.0381231 2 P2_C03.2.cover
## 116 1.985013665 -8.8241810 3 P2_C05.2.cover
## 117 -1.510251722 -7.0383614 2 P2_C07.2.cover
## 118 -0.418120283 5.0318927 2 P2_C08.2.cover
## 119 -0.861785800 4.1586807 2 P2_C09.2.cover
## 120 -0.071228167 3.9549265 2 P2_C12.2.cover
## 121 -0.984305143 3.5743174 2 P2_D03.2.cover
## 122 -0.923532813 3.1631168 2 P2_D04.2.cover
## 123 -7.353633241 -1.4551700 2 P2_D05.2.cover
## 124 2.385058560 -2.7933243 1 P2_D06.2.cover
## 125 0.599022729 -2.6036229 2 P2_D07.2.cover
## 126 0.429068346 -4.9558022 2 P2_D08.2.cover
## 127 0.688899961 -2.7057331 2 P2_D09.2.cover
## 128 1.624938010 -5.9992277 1 P2_E01.2.cover
## 129 2.190286469 -0.6455248 2 P2_E02.2.cover
## 130 -1.212810685 3.3163018 2 P2_E03.2.cover
## 131 2.287028719 -8.5256313 3 P2_E05.2.cover
## 132 1.858864847 -7.8871059 3 P2_E06.2.cover
## 133 2.231152193 -2.8305272 1 P2_E09.2.cover
## 134 -0.024322061 3.1997285 2 P2_E11.2.cover
## 135 -0.467146826 3.9896287 2 P2_E12.2.cover
## 136 0.974504623 -3.0736739 2 P2_F02.2.cover
## 137 -0.626300210 4.8431420 2 P2_F03.2.cover
## 138 1.925243845 -8.7449478 3 P2_F04.2.cover
## 139 0.674440278 -5.3289569 1 P2_F05.2.cover
## 140 1.954666864 0.2104642 2 P2_F06.2.cover
## 141 4.922750245 -0.9981700 2 P2_F08.2.cover
## 142 -7.831665261 -1.0381231 2 P2_F09.2.cover
## 143 0.055651882 4.5230883 2 P2_G03.2.cover
## 144 -0.001337382 7.4985241 2 P2_G05.2.cover
## 145 -7.311041041 -1.5349120 2 P2_G06.2.cover
## 146 3.243965434 -7.3871159 1 P2_G09.2.cover
## 147 -2.815071366 5.2049257 2 P2_H01.2.cover
## 148 2.591801727 5.8561331 2 P2_H02.2.cover
## 149 -7.831665261 -1.0381231 2 P2_H04.2.cover
## 150 2.788524043 3.6115980 2 P2_H05.2.cover
## 151 -3.242815073 3.7269274 2 P2_H06.2.cover
## 152 -0.443080587 7.0071192 2 P2_H07.2.cover
## 153 -7.673750469 -1.1956287 2 P2_H08.2.cover
## 154 2.054299503 3.3381049 2 P2_H09.2.cover
## 155 4.188255864 -4.6404490 1 P3_A01.2.cover
## 156 1.097574108 -7.7443875 1 P3_A02.2.cover
## 157 0.582485988 3.6184525 2 P3_A03.2.cover
## 158 1.923555626 -2.8471908 2 P3_A04.2.cover
## 159 1.079120265 7.6590678 2 P3_A05.2.cover
## 160 -2.682481769 3.0396274 2 P3_A06.2.cover
## 161 -0.326614384 5.7443451 2 P3_A07.2.cover
## 162 -0.470047085 5.7329112 2 P3_A08.2.cover
## 163 -1.536276662 4.4757395 2 P3_A09.2.cover
## 164 0.705595980 -6.5146896 1 P3_A10.2.cover
## 165 -1.679072818 4.7114490 2 P3_A11.2.cover
## 166 1.928882681 0.2149269 2 P3_A12.2.cover
## 167 -7.353633241 -1.4551700 2 P3_B01.2.cover
## 168 -0.901134087 3.3552713 2 P3_B02.2.cover
## 169 0.688911167 -2.7057523 2 P3_B03.2.cover
## 170 0.066848246 4.6171414 2 P3_B04.2.cover
## 171 0.346672978 3.3463484 2 P3_B05.2.cover
## 172 0.649171840 3.5112414 2 P3_B06.2.cover
## 173 -0.470191680 2.9650357 2 P3_B07.2.cover
## 174 -0.564388379 3.8795569 2 P3_B08.2.cover
## 175 0.137727727 3.4008502 2 P3_B09.2.cover
## 176 0.731692476 5.0692159 2 P3_B10.2.cover
## 177 -0.035920744 3.1683376 2 P3_B11.2.cover
## 178 -0.299011225 2.9620135 2 P3_B12.2.cover
## 179 3.547737471 -8.0549063 3 P3_C01.2.cover
## 180 1.605601242 -6.5511072 3 P3_C02.2.cover
## 181 0.264852879 3.5809131 2 P3_C03.2.cover
## 182 0.685692394 4.3575913 2 P3_C04.2.cover
## 183 -0.210367888 4.9918243 2 P3_C05.2.cover
## 184 0.688833462 -2.7056786 2 P3_C06.2.cover
## 185 0.109955006 5.1606346 2 P3_C07.2.cover
## 186 0.014605621 5.0865860 2 P3_C08.2.cover
## 187 -1.031198346 4.0944428 2 P3_C09.2.cover
## 188 -0.282669830 4.1308575 2 P3_C10.2.cover
## 189 0.531598230 5.2069516 2 P3_D01.2.cover
## 190 -2.633336417 -0.4525126 2 P3_D02.2.cover
## 191 0.921017769 4.1543390 2 P3_D03.2.cover
## 192 0.936519824 4.1501419 2 P3_D05.2.cover
## 193 -0.515832940 3.4743553 2 P3_D06.2.cover
## 194 -1.455625440 3.6453424 2 P3_D07.2.cover
## 195 0.871357682 4.0372284 2 P3_D08.2.cover
## 196 0.329323287 4.6152519 2 P3_D09.2.cover
## 197 -7.831665261 -1.0381231 2 P3_D11.2.cover
## 198 -0.767422705 4.9075337 2 P3_D12.2.cover
## 199 -1.628579356 4.1166996 2 P3_E02.2.cover
## 200 -0.856592428 -7.3956066 2 P3_E03.2.cover
## 201 2.096626485 -1.5593516 1 P3_E04.2.cover
## 202 -0.409480898 4.9519151 2 P3_E05.2.cover
## 203 0.862031589 4.8505265 2 P3_E06.2.cover
## 204 -1.530643637 4.4260906 2 P3_E07.2.cover
## 205 3.749094680 -3.7561043 1 P3_F01.2.cover
## 206 4.091527824 -4.0699451 1 P3_F04.2.cover
## 207 -1.384804513 5.1243791 2 P3_F05.2.cover
## 208 -1.553696453 4.4819464 2 P3_F08.2.cover
## 209 0.372206663 5.3990392 2 P3_F12.2.cover
## 210 -1.374158898 5.1766933 2 P3_G02.2.cover
## 211 -0.873864903 5.5188804 2 P3_G03.2.cover
## 212 -0.347268689 5.0703958 2 P3_G04.2.cover
## 213 -0.065879072 5.7151065 2 P3_G05.2.cover
## 214 0.363568669 5.4536998 2 P3_G06.2.cover
## 215 -1.050752064 5.5314945 2 P3_H05.2.cover
## 216 2.934752660 -6.3495238 1 P4_A01.2.cover
## 217 2.779643915 -8.5190919 3 P4_A02.2.cover
## 218 -7.353588577 -1.4552001 2 P4_A03.2.cover
## 219 3.475660469 -2.7349111 2 P4_A07.2.cover
## 220 0.481398838 -5.9874971 2 P4_A08.2.cover
## 221 3.261447852 -7.9954863 3 P4_A09.2.cover
## 222 -0.751644788 -7.6434117 2 P4_A10.2.cover
## 223 2.696902202 -7.3736888 1 P4_A11.2.cover
## 224 -1.071825560 5.5494477 2 P4_A12.2.cover
## 225 1.523443813 -8.6422740 3 P4_B01.2.cover
## 226 1.807229060 -6.8760777 3 P4_B02.2.cover
## 227 3.359792972 -7.7880820 3 P4_B03.2.cover
## 228 3.237507800 -0.8532339 1 P4_B05.2.cover
## 229 -3.308167810 6.0443123 2 P4_B06.2.cover
## 230 4.529133141 -0.8119465 2 P4_B07.2.cover
## 231 3.068487552 5.0148975 2 P4_B08.2.cover
## 232 -1.276504671 -6.7962811 2 P4_B09.2.cover
## 233 0.066875519 -7.1589750 3 P4_B11.2.cover
## 234 -3.435611757 3.0014339 2 P4_B12.2.cover
## 235 2.160247581 5.1054682 2 P4_C03.2.cover
## 236 3.218808885 -3.4240702 1 P4_C04.2.cover
## 237 -2.478900770 2.5632862 2 P4_C05.2.cover
## 238 -7.831665261 -1.0381231 2 P4_C06.2.cover
## 239 3.229347993 -0.6244680 2 P4_C07.2.cover
## 240 -7.572952941 -1.2888724 2 P4_C08.2.cover
## 241 0.709854379 6.7656756 2 P4_C10.2.cover
## 242 2.201811407 -8.7351986 3 P4_C11.2.cover
## 243 0.736151315 -8.0357950 3 P4_D01.2.cover
## 244 -0.467769875 5.7811579 2 P4_D02.2.cover
## 245 3.628650525 -3.5623973 1 P4_D03.2.cover
## 246 2.604063891 -5.0100582 1 P4_D04.2.cover
## 247 0.497986405 -2.5039683 2 P4_D05.2.cover
## 248 4.384333615 -1.9646056 2 P4_D06.2.cover
## 249 -1.166713517 -6.9643958 2 P4_D07.2.cover
## 250 2.292279194 -9.2400300 3 P4_D08.2.cover
## 251 1.523576617 6.1050974 2 P4_D09.2.cover
## 252 5.144619343 -1.9097402 1 P4_D11.2.cover
## 253 1.878818948 -2.8360334 2 P4_D12.2.cover
## 254 -3.018590683 6.9117389 2 P4_E01.2.cover
## 255 3.886388645 -4.1104979 1 P4_E02.2.cover
## 256 0.359360272 -8.0283572 3 P4_E03.2.cover
## 257 1.433038767 -7.1440362 3 P4_E04.2.cover
## 258 0.588713831 -6.6319443 3 P4_E05.2.cover
## 259 5.286880485 -1.5161597 2 P4_E06.2.cover
## 260 1.195286101 -8.3403477 3 P4_E07.2.cover
## 261 -6.454246287 -1.4974640 2 P4_E08.2.cover
## 262 4.572338929 -0.8873005 2 P4_E09.2.cover
## 263 -0.607556171 -7.5064632 2 P4_E11.2.cover
## 264 -3.017364549 3.8142714 2 P4_E12.2.cover
## 265 0.412426378 7.1260637 2 P4_F01.2.cover
## 266 2.234044014 -8.6175908 3 P4_F02.2.cover
## 267 3.975856508 -3.1020318 1 P4_F03.2.cover
## 268 -7.758516096 -1.1133699 2 P4_F04.2.cover
## 269 -7.179736795 -1.9521758 2 P4_F05.2.cover
## 270 1.247096828 -6.8129322 3 P4_F06.2.cover
## 271 -0.113909003 -7.7541552 2 P4_F07.2.cover
## 272 2.192815584 -8.7418282 3 P4_F08.2.cover
## 273 1.815132681 -8.9922606 3 P4_F09.2.cover
## 274 -7.673490950 -1.1954763 2 P4_F10.2.cover
## 275 -2.395258493 6.9915644 2 P4_F12.2.cover
## 276 -2.382633033 6.1683224 2 P4_G01.2.cover
## 277 -2.571127253 5.8769224 2 P4_G07.2.cover
## 278 -3.817388578 5.4309519 2 P4_G09.2.cover
## 279 -7.670582044 -1.1956385 2 P4_G11.2.cover
## 280 2.318958141 4.2928427 2 P4_H01.2.cover
## 281 2.318958141 4.2928427 2 P4_H06.2.cover
## 282 -3.864879563 4.3702219 2 P4_H07.2.cover
## 283 -7.758361718 -1.1134740 2 P4_H09.2.cover
## 284 -2.967260483 4.7425440 2 P4_H10.2.cover
## 285 -2.967260483 4.7425440 2 P4_H11.2.cover
## 286 -7.353633241 -1.4551700 2 P4_H12.2.cover