[![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/moshi4/pybarrnap/blob/main/notebooks/pybarrnap.ipynb)

In [None]:
#!pip install pybarrnap

In [5]:
from pybarrnap import Barrnap
from pybarrnap.utils import load_example_fasta_file

# Resolve the path of the example FASTA file
fasta_file = load_example_fasta_file("bacteria.fna")

# Configure the rRNA predictor (one option per line), then run the prediction
barrnap = Barrnap(
    fasta_file,
    evalue=1e-6,
    lencutoff=0.8,
    reject=0.25,
    threads=1,
    kingdom="bac",
    quiet=False,
)
result = barrnap.run()

# Write result files into the current working directory:
#   1. rRNA GFF
#   2. rRNA GFF that also includes the input fasta sequence (incseq=True)
#   3. rRNA fasta
result.write_gff("bacteria_rrna.gff")
result.write_gff("bacteria_rrna_incseq.gff", incseq=True)
result.write_fasta("bacteria_rrna.fna")

# Dump the GFF text to stdout
print("\n========== Print rRNA GFF ==========")
print(result.get_gff_text())

# Walk every feature of every sequence record in a single flat loop
print("\n========== Print rRNA features ==========")
for feature in (
    feat for seq_rec in result.seq_records for feat in seq_rec.features
):
    print(feature.id, feature.type, feature.location, feature.qualifiers)

# Emit each predicted rRNA as a FASTA-style entry (header line, then sequence)
print("\n========== Print rRNA sequences ==========")
for rec in result.get_rrna_seq_records():
    print(f">{rec.id}\n{rec.seq}")

2024-01-29 18:58:48 | INFO | Run pybarrnap v0.1.0
2024-01-29 18:58:48 | INFO | Operating System: linux
2024-01-29 18:58:48 | INFO | Check Dependencies: pyhmmer v0.10.4 is installed
2024-01-29 18:58:48 | INFO | Check Dependencies: biopython v1.83 is installed
2024-01-29 18:58:48 | INFO | Set Option: evalue=1e-06
2024-01-29 18:58:48 | INFO | Set Option: lencutoff=0.8
2024-01-29 18:58:48 | INFO | Set Option: reject=0.25
2024-01-29 18:58:48 | INFO | Set Option: threads=1
2024-01-29 18:58:48 | INFO | Set Option: kingdom='bac'
2024-01-29 18:58:48 | INFO | Number of Target Sequence = 1
2024-01-29 18:58:48 | INFO | Seq1. name='E.coli', length=4,639,675, description='E.coli Escherichia coli str. K-12 substr. MG1655, complete genome'
2024-01-29 18:58:48 | INFO | Use HMM DB: /home/ys/Desktop/Project/Bioinformatics/pybarrnap/src/pybarrnap/db/bac.hmm
2024-01-29 18:58:48 | INFO | Run pyhmmer.nhmmer
2024-01-29 18:58:51 | INFO | Found: 16S_rRNA E.coli 3425244..3426781(-) L=1538/1585(97.03%)
2024-01-29


##gff-version 3
E.coli	pybarrnap:0.1.0	rRNA	223774	225311	0.0	+	.	Name=16S_rRNA;product=16S ribosomal RNA
E.coli	pybarrnap:0.1.0	rRNA	225761	228661	0.0	+	.	Name=23S_rRNA;product=23S ribosomal RNA
E.coli	pybarrnap:0.1.0	rRNA	228760	228870	8.7e-12	+	.	Name=5S_rRNA;product=5S ribosomal RNA
E.coli	pybarrnap:0.1.0	rRNA	2724096	2724206	8.7e-12	-	.	Name=5S_rRNA;product=5S ribosomal RNA
E.coli	pybarrnap:0.1.0	rRNA	2724304	2727204	0.0	-	.	Name=23S_rRNA;product=23S ribosomal RNA
E.coli	pybarrnap:0.1.0	rRNA	2727639	2729176	0.0	-	.	Name=16S_rRNA;product=16S ribosomal RNA
E.coli	pybarrnap:0.1.0	rRNA	3421450	3421560	2e-11	-	.	Name=5S_rRNA;product=5S ribosomal RNA
E.coli	pybarrnap:0.1.0	rRNA	3421695	3421805	8.7e-12	-	.	Name=5S_rRNA;product=5S ribosomal RNA
E.coli	pybarrnap:0.1.0	rRNA	3421903	3424803	0.0	-	.	Name=23S_rRNA;product=23S ribosomal RNA
E.coli	pybarrnap:0.1.0	rRNA	3425244	3426781	0.0	-	.	Name=16S_rRNA;product=16S ribosomal RNA
E.coli	pybarrnap:0.1.0	rRNA	3939834	3941371	0.0	+	.	Name=16S_rR