library(dplyr)
library(readr)
# Path to the tab-separated map file read by the pipeline below.
megamap <- "/pita/pub/data/16S_DBs/maps/DB1-31_premap_v3.txt"

# Pedbank ----

# Summarise the distribution of `reads_number` for the "pedbank" cohort:
#   1. read the map file as a tibble,
#   2. keep rows whose `Cohort` is "pedbank",
#   3. keep rows whose `reads_number` exceeds 4000,
#   4. keep one row per `sample_ID` (the first encountered), retaining all
#      other columns,
#   5. print the six-number summary of `reads_number`.
megamap |>
  read_tsv() |>
  filter(Cohort == "pedbank") |>
  filter(reads_number > 4000) |>
  distinct(sample_ID, .keep_all = TRUE) |>
  pull(reads_number) |>
  summary()
# Output pasted alongside the original code (presumably from an earlier run;
# re-run to confirm against the current file):
#>  Min. 1st Qu.  Median    Mean 3rd Qu.    Max.
#>  4003    7296   12208   15109   19567   85763