Basic functions for genomic sequence manipulation
import seq_toolkit
sequence = seq_toolkit.Seq()
sequence.simulate(n_bases=250, return_seq=True)
'GTTCAACTTTAACCAGCGGTTATGCTCTTCCATGTGAGTCGTAGTCGGGTTCGCACGAAAGAATTATTTATTGCTGCGATACGCAATGCATCTGGTTGTGGAGTTTCACCAGGCAGGCAATTAGTCCTATGCGGAACCTGCTGCTATAAAACGCATAAATTAACTGGCACACCAGGGAGGTAAGGGATGAGAGGCCTACAAGATTCCCATGTGCATATGGAGGGCGTACTGGATTCACGCGTTCGGAGGC'
import seq_toolkit
gene = seq_toolkit.Gene()
gene.create(n_exons=8, return_gene=False)
gene.plot()
- For more on gene simulation, see the following: example notebook
import seq_toolkit
seq = 'CGGGTTCGCACGAAAGAATTATTTATTGCTGCGATACGCAATGCATCTGGTTGTGGAGTTTCACCAGGCAGGCAATTAGTCCTATGCGGAACCTGCTGCTATAAAACGCAT'
sequence = seq_toolkit.SequenceManipulator(seq)
sequence.reverse_complement()
'ATGCGTTTTATAGCAGCAGGTTCCGCATAGGACTAATTGCCTGCCTGGTGAAACTCCACAACCAGATGCATTGCGTATCGCAGCAATAAATAATTCTTTCGTGCGAACCCG'
pip install seq-toolkit
To install the development version:
git clone https://github.com/mvinyard/seq-toolkit.git
cd ./seq-toolkit/; pip install -e .
For questions, please send an email to mvinyard@broadinstitute.org or open an issue.