shRNA design to target circRNAs

#install library
#devtools::install_github("ipatop/circRNAshRNAdesign")
library(circRNAshRNAdesign)

Description

This package contains a single function, OligoDesigner, which generates either a DataFrame or a tab-separated file containing the original input table with the shRNA oligo designs appended.

The input should be a tab-separated table with the circRNA back-splicing junction coordinates and gene names, in the format:

Name Chr Start End

The table can also include an optional Strand column.

So far the following species are available:

Fly: dm3, dm6; Human: hg19, hg38; Mouse: mm10; Rat: rn4

Required packages

The following packages are required; here is how to install them:

install.packages("dplyr")
install.packages("tidyr")
BiocManager::install("Rsubread")
BiocManager::install("GenomicFeatures")
BiocManager::install("Biostrings")
BiocManager::install("TxDb.Dmelanogaster.UCSC.dm6.ensGene")
BiocManager::install("BSgenome.Dmelanogaster.UCSC.dm6")
BiocManager::install("TxDb.Dmelanogaster.UCSC.dm3.ensGene")
BiocManager::install("BSgenome.Dmelanogaster.UCSC.dm3")
BiocManager::install("TxDb.Hsapiens.UCSC.hg19.knownGene")
BiocManager::install("BSgenome.Hsapiens.UCSC.hg19")
BiocManager::install("TxDb.Hsapiens.UCSC.hg38.knownGene")
BiocManager::install("BSgenome.Hsapiens.UCSC.hg38")
BiocManager::install("TxDb.Mmusculus.UCSC.mm10.knownGene")
BiocManager::install("BSgenome.Mmusculus.UCSC.mm10")
BiocManager::install("TxDb.Rnorvegicus.UCSC.rn4.ensGene")
BiocManager::install("BSgenome.Rnorvegicus.UCSC.rn4")

Run example

Input should look like this

head(read.delim("../test/circs_totest.txt"))
#>                       dm6                       circ_name  SYMBOL   Chr
#> 1 chr2R:17275410-17276063     mbl_chr2R:17275410-17276063     mbl chr2R
#> 2 chr3L:24725824-24726292    scro_chr3L:24725824-24726292    scro chr3L
#> 3   chr2R:5423750-5424239        NA_chr2R:5423750-5424239    <NA> chr2R
#> 4   chr3R:4626973-4628349    5-HT2A_chr3R:4626973-4628349  5-HT2A chr3R
#> 5 chr3L:12851309-12852277    Wbp2_chr3L:12851309-12852277    Wbp2 chr3L
#> 6 chr2R:15735091-15737060 CG30089_chr2R:15735091-15737060 CG30089 chr2R
#>      Start      End
#> 1 17275410 17276063
#> 2 24725824 24726292
#> 3  5423750  5424239
#> 4  4626973  4628349
#> 5 12851309 12852277
#> 6 15735091 15737060

Run to create an output table

OligoDesigner(input_coordinates = "../test/circs_totest.txt",output = "../test/New_out.tsv")
#> Loading required package: TxDb.Dmelanogaster.UCSC.dm6.ensGene
#> Loading required package: GenomicFeatures
#> Loading required package: BiocGenerics
#> 
#> Attaching package: 'BiocGenerics'
#> The following objects are masked from 'package:stats':
#> 
#>     IQR, mad, sd, var, xtabs
#> The following objects are masked from 'package:base':
#> 
#>     anyDuplicated, append, as.data.frame, basename, cbind, colnames,
#>     dirname, do.call, duplicated, eval, evalq, Filter, Find, get, grep,
#>     grepl, intersect, is.unsorted, lapply, Map, mapply, match, mget,
#>     order, paste, pmax, pmax.int, pmin, pmin.int, Position, rank,
#>     rbind, Reduce, rownames, sapply, setdiff, sort, table, tapply,
#>     union, unique, unsplit, which.max, which.min
#> Loading required package: S4Vectors
#> Loading required package: stats4
#> 
#> Attaching package: 'S4Vectors'
#> The following objects are masked from 'package:base':
#> 
#>     expand.grid, I, unname
#> Loading required package: IRanges
#> Loading required package: GenomeInfoDb
#> Loading required package: GenomicRanges
#> Loading required package: AnnotationDbi
#> Loading required package: Biobase
#> Welcome to Bioconductor
#> 
#>     Vignettes contain introductory material; view with
#>     'browseVignettes()'. To cite Bioconductor, see
#>     'citation("Biobase")', and for packages 'citation("pkgname")'.
#> Loading required package: BSgenome.Dmelanogaster.UCSC.dm6
#> Loading required package: BSgenome
#> Loading required package: Biostrings
#> Loading required package: XVector
#> 
#> Attaching package: 'Biostrings'
#> The following object is masked from 'package:base':
#> 
#>     strsplit
#> Loading required package: rtracklayer
#> [1] "Generating sequence for circ 1"
#> [1] "Generating sequence for circ 2"
#> [1] "Generating sequence for circ 3"
#> [1] "Generating sequence for circ 4"
#> [1] "Generating sequence for circ 5"
#> [1] "Generating sequence for circ 6"
#> [1] "Generating sequence for circ 7"

To get the result as a DataFrame, run with writetab = F

oligos<-OligoDesigner(input_coordinates = "../test/circs_totest.txt",output = "../test/New_out.tsv",writetab = F)
#> [1] "Generating sequence for circ 1"
#> [1] "Generating sequence for circ 2"
#> [1] "Generating sequence for circ 3"
#> [1] "Generating sequence for circ 4"
#> [1] "Generating sequence for circ 5"
#> [1] "Generating sequence for circ 6"
#> [1] "Generating sequence for circ 7"

Output

head(oligos)
#>                       dm6                       circ_name  SYMBOL   Chr
#> 1 chr2R:17275410-17276063     mbl_chr2R:17275410-17276063     mbl chr2R
#> 2 chr3L:24725824-24726292    scro_chr3L:24725824-24726292    scro chr3L
#> 3   chr2R:5423750-5424239        NA_chr2R:5423750-5424239    <NA> chr2R
#> 4   chr3R:4626973-4628349    5-HT2A_chr3R:4626973-4628349  5-HT2A chr3R
#> 5 chr3L:12851309-12852277    Wbp2_chr3L:12851309-12852277    Wbp2 chr3L
#> 6 chr2R:15735091-15737060 CG30089_chr2R:15735091-15737060 CG30089 chr2R
#>      Start      End     exon_start       exon_end length
#> 1 17275410 17276063 chr2R:17275410 chr2R:17276063    653
#> 2 24725824 24726292 chr3L:24725824 chr3L:24726292    468
#> 3  5423750  5424239  chr2R:5423750  chr2R:5424239    489
#> 4  4626973  4628349  chr3R:4626973  chr3R:4628349   1376
#> 5 12851309 12852277 chr3L:12851309 chr3L:12852277    968
#> 6 15735091 15737060 chr2R:15735091 chr2R:15737060   1969
#>                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                  seq
#> 1                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                     ATAATGTAAACTCAGCTTACACACAAAAAAGCAGTAAAATATAAAATACAAAAATTAACAGCTGCGTTTATCTATAGATATATATATACACATCTATATATTTGAATAAGCGTTCGATTTGAATCAAAATTATAGCCCAAGCTATCAGCTACCCCCACAAGCTTTGTACTCCACAAAAACGCTAACGAGCAAAATCGATAAAGACCAGATAGCAAATGAAATCATACCATCTGCCATAGATCTATGCTATAAACATATATAGGTGCTGATCTGTGCTCTTGAATTTAGTGTTTTTTGTGTGTGCGTGTCGCGAGAGGAGCACTCAAAACCAAAAAAAAAAAAAAAAACGTATAGTAAAACAAAAAACTATCTCTAGTCGCTAGGCTATAACTATACAAACTCCAGCTATCCCAGATCCAGATCCGTAAACAGCAAATAGTTATATATCTATAACCCCAAAATACGATGGCCAACGTTGTCAATATGAACAGCCTGCTCAACGGCAAGGATTCGCGCTGGCTGCAATTGGAGGTCTGTCGCGAGTTCCAGCGCAACAAATGCTCGCGCCAGGACACCGAATGCAAGTTCGCCCATCCCCCGGCCAACGTGGAGGTCCAGAACGGCAAGGTCACCGCCTGCTACGACAGCATCAAG
#> 2                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                              CGATAAAAGCCTACTACCAACTTGTAAAACAATTGTTACGCATGTCATCGCACGGCCTTGCTTACACAACAAGAATTGAAAGAAAGTCTTATAGAGAACTACAAATCAATAGAGATCAATACTTTGTAACTGCGCCAAATGAAGAAGATTTGGTTATGAGTTTATCTCCAAAGGACACACTTATACATACTGCCATTTCCCAGCACCATCAAGTGGATACTTCTACTAAATTAAATACAAACGAAACATCGACACAAAATACCGTATCTACAGCAGCCGCGGCAGCGGTTGCACATCACCACCACAACCTTTCTAGTATTCACCACCTCCAAAACCTGCATAGTCAGCATCAAAGTACTTTATTTAATAGTAATCACTCAACACCCTTTAGCGTGACCGATATCTTAAGTCCAATTGAAGAATCGTATCGCAAACTGGAACTGAACGGAAATCCACCATCTCCGTTTCG
#> 3                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                         AAAATCAACCAGATCTTACACCAATGGGGTCCTTCTGGCAGCAACATGTGGCCACTCCTAGTAGTTCAACTCCATTCGATTCACCATTTTTTTCGGCAACACACGGCCTTGTGCAGACTCACCCGTCTATAGGTGGAAGCCACTCTGGGCCCGCTCCATTAAATGGCAATAGCCTTGGGTCTGGAGCTCCATCCTCAATCCTAGCTGGTACTAAGCCAGCCCTAACCGCTGGAAGCGGTTACCTAAACTCACGCGGGAGTCTACCGACCTCTGCACGTTATCCAGCTAATAAGATCACAGGAACCGTCGTGGAACCCAACCCAAAATCTCCATTCCGCCACTTAGATTTCTCTACTAGTGCAACTGCCGAGCTGCGGCGCAATCCTGCGCTATCTGCTCCTGATGAATGTGCACGCGCTTGTCGCGAAGGCGAGCCTCCGAGAATTTGCTACTATCATTTTACGTTGGAATACTACACAGTATTGGGAGC
#> 4                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                               GGTATTGGCCACTTGGCTTTACCTGGTGCAACATTTATGTGACGTGTGACGTACTGGCCTGCTCATCCAGTATATTGCACATGTGCTTCATCAGTTTGGGACGCTATATGGGAATAAGAAATCCATTGGGCTCGAGGCATCGATCTACGAAACGATTGACTGGTATAAAGATAGCCATTGTTTGGGTAATGGCCATGATGGTATCCAGTTCAATAACCGTTCTTGGTCTGGTCAATGAGAAGAACATAATGCCCGAGCCTAACATATGCGTTATCAACAATCGCGCCTTTTTCGTGTTTGGATCTCTGGTAGCTTTTTATATACCCATGCTGATGATGGTTACCACATACGCATTGACGATTCCCCTCCTCCGGAAGAAAGCGCGATTTGCCGCCGAGCACCCGGAAAGTGAACTTTTTCGCAGGTTGGGTGGACGCTTCACCCTAAGGCCGCAGCACAGCCAGCAGCAGTTGCAGATGTTCAGTAGCTTTTCTGGCAGCAATAACAAATTCCTATCAATGGGCGACGGCAATCGCAACTTCAACACTGAAGGAGAGATGGAGGAGGGTGGAGCTCCTAGCAGAAGGAGTGGCGTAGAGCCCGCCGAACGACCTTTGATGCAACAGCGAACGGCGAGCAGCAGGAGCATGGGCACGGTTAGTTTCCGTAATGTCGTGAACGGGACTAGCGGAGCCGCAGGAAGTGGGCGCAGGACGACTGGCACTGCCCACAGCAGCTTCCGGTTCTCTGGCGCCGGCATCTTTCGGCACTCGTCGTCGTCTCCCGCCTCGAGCTGCCACTCCACCAGCACGTCGCGTTCGAGCTCCTTCTGGCGCAAACACGGCGGCTATCCAAACCTAATGGACAG
#> 5                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                              CACCACCTGCTCACCAACCAGCACCGCAACAGCCGCAGGCACCGTCGTCGAATGAACCCAATTGGTATGGTTTTTCAGCGCCGCCGCCGCAGCAGCAACAACAGCAGCCGGGCTATGGGCCACAAGGATGGGCCGGTGGCTATGTCCAACCTCCGCCGTACGCTTCATGTGCCCCAAATTGTCCACCACAGCCGCCGTACGCCGCTCCGGCTCAGACGTACAATGGTCCACAGCCATATGGTGGATACGGCAATGTTCCTGGCGGATTTAATACCCCCGGATTTCAGCAACCGAATGGAAATCCAAATGGCTATCCAGGTGGACCACCGCCACCCGGACAACAAGCAGCAGGAGCAGCTGGAGGAGCCGCCGCATCTGGAGCCAGCTTTATGGGCTTCAGCTTGCCCCCTGGAACAAAAGATAAAAAAATATGAGCAAAAGGACAAGAAAATTATGAACATCTTTAAAATAGTCGAAACATCTAAAGATCTAAAATGTTATCAAGAATTTAATTGAAGTATCATGAACCACCTTTTGCTTTCGGACGCTCAAAGTATTCAAGAGGCATCCAAAAACCATTCAGAAGCATTCGTTCTGTTTATTTTTCTCACTTACAAAATTATTCAATTTGTCCAAATAATAAATGATTTGTTAGCATAATTCTGTAATTAAAAGCAAACTACTGTACCTCAAATAGCCATCCCGACAA
#> 6 AATTGCGATCCATTCACGCCAGCAACTGCAACGCAGCACAACAGCAACACTGAGACAACGGCAACGGAAACACAAAGCCCAGCAACGAATGCAAGATCACAACAAAGCGAGAAAAACCCAGGCAGCAGCGCAGCGAATTGCATTATCAATGAACAGAGAGATGAGGCAGCAACTGCAACAGCGACATCAGCAGCAGCAGCTGCAGCAGCGGCAGCAGGGGCAGGGAATGAGGAAACCAGCTCGGTGGCAGTGCAGGTCAGTCAACCTGTTTCCTGTACCGCCAGAGAGCGTAGAGAGCTGCTGAGAGCCAGCAACACGAACACGCCAGCGAGCAGCAGCAGCAGCACCAGCAGCGCCAGCAACATTAGCTACGCGAGCAACATCAGCGGCGAGCGCTCAGCGATCAGTCTCTCGGCAACTTTCGGCGGGCCAACGCTGTACAGCGCGAGCAGCAGCAACCGGAATTGCTACAACAGCAGCAGCAGCAGCAGCAACTATCGCCCACTGTACGACGATTCGAGTAGCAGCAGCGTGCTGCGGCCCAACAAATGTTTGGCAGAACTCGAGCGTCTCTATGCCGAATTTCGCGCGAGTGAAAGCAGATTCGAACGGGGTCTGATCCAGTGCCAGTTGGACATTGAAAACGCCAACGCCACCGACACCGTTAGCGAAATGCGTCTAAATGTGCCAGCCACTGCGGCAGCAGACACTGTTGCTAGTTGTAGCAACAGCAACAGCAGCAGCAACAACAACAGCAGCAGCAGCAGCAGTGTGTTCCTCAATGTGTCCGGCAGCAGCAGCACCGATAGCGGCGACAATCAAGTTGTCGATGAGGCTAGAAGCATTAGCAACATTGCTGTGCTGCCAGCAACAGCAACTGCAACAACAACAACAGCCACTTCCAAGTCCTGCCAGCGACAGCCGAGCCTAACGATCCAAGTGAACAACAACAACAACAACAACAACAATAACAACGGCAACACTAACGGTACTAGTAACGGCAATCGGGTCTCGGTGGCTTCGCCCACGAGCATTGTGAACAACAACAACGGCGTGTGCGTTGTCAACTGCAGCTACACCCCCAGCAGCAGCAGCAGCAACAACAACAGCAGCAGCAGCAGCAGCAGCTGCATCAGCAACACCACCAACAGCAACATCAGCAACAATAACAGCGTGGTTGAAATCAATAAGTGTGTGCCAGCAGCAGCCAAAGTGTTTAGTGCAAGTGTTCAAAATCAAAATAGGCTCAATAATAATAGTAGCTGCCCAAAAGGGGATCAGCAACATGTTGCTGCTGCATCCACGGCCAGCAATAATAATCATGTGCAGCCTGATAACAGTGTGAATATAATCAGTGTGAATGCAAGCAGCAGCAGCTACAATAATAACCACCCACGCACCTTCACCTCAACGGAATGCCAAACGGATGATCTGTCAGCCAGTACATCATCCAACATGCAACAGCAACACCAGCAGCAGCAGCAGCAGCAACAGATCCGGACACGGGAGCAACGTCGCAAGGAGCGGCGGGAACGCCGGCAGCAGCAACAGCAGCAACAACAGTTTCAGCCACACCATGCGCGACGCCACCCGCCCCCACCTCCTCCGCCACAACTACACCCACCACCGCATCTGCACCACCCACATCCCCACCCACTTCCCCACCCTCATCCGGCTGCCATGGGACTGGCACGCGCTCTGTTGCCCGACATCCTGCACGCCCACTACCCGCCGCCCTATACTGCTCTGCCCGTGCCCGTGGCCATGTCCGCCGCTCCGCCACCGCCGCCCCCGTCGACTGCCGTTGCGGCATCTGCTGTTGCGGCGGCGGCACAGCAGCCAGCACATGCAAGTCCGGCTCCTCCGCCAGCGCTGACGTCCGTGATATCGACGGTGCCACTGCCGGGTCCGCTGCCAGCGCCTCTCATGAACGACGGACGCTTCACGCTGCCGCTGCCCATCATGCGCAG
#>   Strand              junction      junction_revcomp
#> 1      1 CAGCATCAAGATAATGTAAAC GTTTACATTATCTTGATGCTG
#> 2      1 CTCCGTTTCGCGATAAAAGCC GGCTTTTATCGCGAAACGGAG
#> 3      1 TATTGGGAGCAAAATCAACCA TGGTTGATTTTGCTCCCAATA
#> 4      1 TAATGGACAGGGTATTGGCCA TGGCCAATACCCTGTCCATTA
#> 5      1 ATCCCGACAACACCACCTGCT AGCAGGTGGTGTTGTCGGGAT
#> 6      1 TCATGCGCAGAATTGCGATCC GGATCGCAATTCTGCGCATGA
#>                                                                 TopStrand
#> 1 ctagcagtCAGCATCAAGATAATGTAAACtagttatattcaagcataGTTTACATTATCTTGATGCTGgcg
#> 2 ctagcagtCTCCGTTTCGCGATAAAAGCCtagttatattcaagcataGGCTTTTATCGCGAAACGGAGgcg
#> 3 ctagcagtTATTGGGAGCAAAATCAACCAtagttatattcaagcataTGGTTGATTTTGCTCCCAATAgcg
#> 4 ctagcagtTAATGGACAGGGTATTGGCCAtagttatattcaagcataTGGCCAATACCCTGTCCATTAgcg
#> 5 ctagcagtATCCCGACAACACCACCTGCTtagttatattcaagcataAGCAGGTGGTGTTGTCGGGATgcg
#> 6 ctagcagtTCATGCGCAGAATTGCGATCCtagttatattcaagcataGGATCGCAATTCTGCGCATGAgcg
#>                                                                 BotStrand
#> 1 aattcgcCAGCATCAAGATAATGTAAACtatgcttgaatataactaGTTTACATTATCTTGATGCTGactg
#> 2 aattcgcCTCCGTTTCGCGATAAAAGCCtatgcttgaatataactaGGCTTTTATCGCGAAACGGAGactg
#> 3 aattcgcTATTGGGAGCAAAATCAACCAtatgcttgaatataactaTGGTTGATTTTGCTCCCAATAactg
#> 4 aattcgcTAATGGACAGGGTATTGGCCAtatgcttgaatataactaTGGCCAATACCCTGTCCATTAactg
#> 5 aattcgcATCCCGACAACACCACCTGCTtatgcttgaatataactaAGCAGGTGGTGTTGTCGGGATactg
#> 6 aattcgcTCATGCGCAGAATTGCGATCCtatgcttgaatataactaGGATCGCAATTCTGCGCATGAactg
#>              junction5p    junction_revcomp5p
#> 1 CATCAAGATAATGTAAACTCA TGAGTTTACATTATCTTGATG
#> 2 CGTTTCGCGATAAAAGCCTAC GTAGGCTTTTATCGCGAAACG
#> 3 TGGGAGCAAAATCAACCAGAT ATCTGGTTGATTTTGCTCCCA
#> 4 TGGACAGGGTATTGGCCACTT AAGTGGCCAATACCCTGTCCA
#> 5 CCGACAACACCACCTGCTCAC GTGAGCAGGTGGTGTTGTCGG
#> 6 TGCGCAGAATTGCGATCCATT AATGGATCGCAATTCTGCGCA
#>                                                               TopStrand5p
#> 1 ctagcagtCATCAAGATAATGTAAACTCAtagttatattcaagcataTGAGTTTACATTATCTTGATGgcg
#> 2 ctagcagtCGTTTCGCGATAAAAGCCTACtagttatattcaagcataGTAGGCTTTTATCGCGAAACGgcg
#> 3 ctagcagtTGGGAGCAAAATCAACCAGATtagttatattcaagcataATCTGGTTGATTTTGCTCCCAgcg
#> 4 ctagcagtTGGACAGGGTATTGGCCACTTtagttatattcaagcataAAGTGGCCAATACCCTGTCCAgcg
#> 5 ctagcagtCCGACAACACCACCTGCTCACtagttatattcaagcataGTGAGCAGGTGGTGTTGTCGGgcg
#> 6 ctagcagtTGCGCAGAATTGCGATCCATTtagttatattcaagcataAATGGATCGCAATTCTGCGCAgcg
#>                                                               BotStrand5p
#> 1 aattcgcCATCAAGATAATGTAAACTCAtatgcttgaatataactaTGAGTTTACATTATCTTGATGactg
#> 2 aattcgcCGTTTCGCGATAAAAGCCTACtatgcttgaatataactaGTAGGCTTTTATCGCGAAACGactg
#> 3 aattcgcTGGGAGCAAAATCAACCAGATtatgcttgaatataactaATCTGGTTGATTTTGCTCCCAactg
#> 4 aattcgcTGGACAGGGTATTGGCCACTTtatgcttgaatataactaAAGTGGCCAATACCCTGTCCAactg
#> 5 aattcgcCCGACAACACCACCTGCTCACtatgcttgaatataactaGTGAGCAGGTGGTGTTGTCGGactg
#> 6 aattcgcTGCGCAGAATTGCGATCCATTtatgcttgaatataactaAATGGATCGCAATTCTGCGCAactg
#>              junction3p    junction_revcomp3p
#> 1 CGACAGCATCAAGATAATGTA TACATTATCTTGATGCTGTCG
#> 2 CATCTCCGTTTCGCGATAAAA TTTTATCGCGAAACGGAGATG
#> 3 CAGTATTGGGAGCAAAATCAA TTGATTTTGCTCCCAATACTG
#> 4 ACCTAATGGACAGGGTATTGG CCAATACCCTGTCCATTAGGT
#> 5 GCCATCCCGACAACACCACCT AGGTGGTGTTGTCGGGATGGC
#> 6 CCATCATGCGCAGAATTGCGA TCGCAATTCTGCGCATGATGG
#>                                                               TopStrand3p
#> 1 ctagcagtCGACAGCATCAAGATAATGTAtagttatattcaagcataTACATTATCTTGATGCTGTCGgcg
#> 2 ctagcagtCATCTCCGTTTCGCGATAAAAtagttatattcaagcataTTTTATCGCGAAACGGAGATGgcg
#> 3 ctagcagtCAGTATTGGGAGCAAAATCAAtagttatattcaagcataTTGATTTTGCTCCCAATACTGgcg
#> 4 ctagcagtACCTAATGGACAGGGTATTGGtagttatattcaagcataCCAATACCCTGTCCATTAGGTgcg
#> 5 ctagcagtGCCATCCCGACAACACCACCTtagttatattcaagcataAGGTGGTGTTGTCGGGATGGCgcg
#> 6 ctagcagtCCATCATGCGCAGAATTGCGAtagttatattcaagcataTCGCAATTCTGCGCATGATGGgcg
#>                                                               BotStrand3p
#> 1 aattcgcCGACAGCATCAAGATAATGTAtatgcttgaatataactaTACATTATCTTGATGCTGTCGactg
#> 2 aattcgcCATCTCCGTTTCGCGATAAAAtatgcttgaatataactaTTTTATCGCGAAACGGAGATGactg
#> 3 aattcgcCAGTATTGGGAGCAAAATCAAtatgcttgaatataactaTTGATTTTGCTCCCAATACTGactg
#> 4 aattcgcACCTAATGGACAGGGTATTGGtatgcttgaatataactaCCAATACCCTGTCCATTAGGTactg
#> 5 aattcgcGCCATCCCGACAACACCACCTtatgcttgaatataactaAGGTGGTGTTGTCGGGATGGCactg
#> 6 aattcgcCCATCATGCGCAGAATTGCGAtatgcttgaatataactaTCGCAATTCTGCGCATGATGGactg