## **Gene configuration**
The code uses the Biopython `Bio.Entrez` and `Bio.SeqIO` modules to interact with NCBI and process the genetic sequences under study: each nucleotide region of interest is downloaded and saved as a GenBank file.

In [1]:
from Bio import Entrez
from Bio import SeqIO
from Bio.Seq import Seq
import os

# Contact email used for NCBI Entrez requests.
# NOTE(review): this looks like a placeholder address — confirm it is replaced with a real contact email before running.
Entrez.email = 'A.N.Other@example.com'

def download_gene(id_gene: str, name_gene: str, start=None, end=None, complement=False):
    """
    Download a GenBank record from the NCBI nucleotide database and save it
    as 'genes/<name_gene>.gb'.

    A sub-region of the record can be requested with ``start``/``end``, and the
    record can be reverse-complemented before it is written. Every failure
    (invalid arguments, network error, parse error, write error) is caught and
    reported with ``print``; nothing is raised to the caller.

    Args:
    - id_gene (str): The access ID in the NCBI database.
    - name_gene (str): Name of the file (without extension) to store the sequence.
    - start (int, optional): Starting position of the region of interest
      (1-based). Must be given together with ``end``.
    - end (int, optional): End position of the region of interest.
      Must be given together with ``start``.
    - complement (bool, optional): If True, the whole record is
      reverse-complemented, so the feature locations in the saved file follow
      the new orientation of the sequence.

    Returns:
    - None. The result is the file written to the 'genes' folder.
    """
    try:
        # Reject a half-specified region instead of silently downloading the
        # complete record, which is what a plain truthiness check would do.
        if (start is None) != (end is None):
            raise ValueError("'start' and 'end' must be provided together")
        if start is not None and int(start) < 1:
            raise ValueError("'start' must be a 1-based position (>= 1)")

        # Create the 'genes' folder if it does not exist
        os.makedirs("genes", exist_ok=True)

        # Build the efetch query; the region bounds are only sent when requested
        fetch_args = {"db": "nucleotide", "rettype": "gb", "retmode": "text", "id": id_gene}
        if start is not None:
            fetch_args.update(seq_start=start, seq_stop=end)

        # Fetch and parse the GenBank record, closing the handle even if parsing fails
        handle = Entrez.efetch(**fetch_args)
        try:
            seq_record = SeqIO.read(handle, "gb")
        finally:
            handle.close()

        # Reverse-complement the whole record, if necessary. Using the record
        # method (rather than replacing only .seq) also remaps the features;
        # identifiers and annotations are kept so the GenBank writer still has
        # the metadata it needs.
        if complement:
            seq_record = seq_record.reverse_complement(
                id=True,
                name=True,
                description=True,
                features=True,
                annotations=True,
                letter_annotations=True,
                dbxrefs=True,
            )

        # Save the sequence in the 'genes' folder
        output_path = os.path.join("genes", f"{name_gene}.gb")
        SeqIO.write(seq_record, output_path, "gb")

        print(f"Download the GenBank file of the gene '{name_gene}' successfully completed.")

    except Exception as e:
        print(f"Error downloading the gene {id_gene}: {e}")

# Fetch every region of interest from NZ_DS483503, one GenBank file per gene.
# Each row is: (output name, region start, region end, reverse-complement flag).
for gene_label, region_start, region_end, reverse_comp in (
    ("butyrylCoA", 313586, 314932, False),
    ("ptsP", 23763, 25406, True),
    ("MutS", 859977, 868082, False),
):
    download_gene(
        "NZ_DS483503",
        gene_label,
        start=region_start,
        end=region_end,
        complement=reverse_comp,
    )


Download the GenBank file of the gene 'butyrylCoA' successfully completed.
Download the GenBank file of the gene 'ptsP' successfully completed.
Download the GenBank file of the gene 'MutS' successfully completed.


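The code uses the Biopython `Bio.Entrez` module (`Bio.SeqIO` is imported as well, but is not needed for this step) to interact with NCBI and download the protein sequences corresponding to the genes above from the protein database, saving them in FASTA format.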

In [2]:
import os
from Bio import Entrez
from Bio import SeqIO

# Contact email used for NCBI Entrez requests.
# NOTE(review): this looks like a placeholder address — confirm it is replaced with a real contact email before running.
Entrez.email = 'A.N.Other@example.com'

def download_fasta(gene_id, filename):
    """
    Download a FASTA record from the NCBI protein database and save it in the
    'genes' folder.

    The response is read completely (and the handle closed) before the output
    file is opened, so a failed or empty download never creates or truncates
    the target file. Every failure is caught and reported with ``print``;
    nothing is raised to the caller.

    Args:
    - gene_id (str): The ID sent to NCBI for the lookup in the protein database.
    - filename (str): The filename (inside 'genes') to save the FASTA sequence.

    Returns:
    - None. The result is the file written to the 'genes' folder.
    """
    try:
        # Create the 'genes' folder if it does not exist
        os.makedirs("genes", exist_ok=True)

        file_path = os.path.join("genes", filename)

        # Fetch the FASTA text, closing the handle even if reading fails
        handle = Entrez.efetch(db="protein", id=gene_id, rettype="fasta", retmode="text")
        try:
            fasta_text = handle.read()
        finally:
            handle.close()

        # An empty body is not a usable FASTA record; report it instead of
        # writing an empty file and announcing success.
        if not fasta_text.strip():
            raise ValueError("NCBI returned an empty response")

        # Only touch the output file once the full sequence is in memory
        with open(file_path, "w") as out_file:
            out_file.write(fasta_text)

        print(f"FASTA download for gene {gene_id} completed and saved in {file_path}.")
    except Exception as e:
        print(f"Error downloading gene {gene_id}: {e}")

# Retrieve one FASTA file per ID; each pair is (NCBI ID, output filename).
for ncbi_id, fasta_name in (
    ('WP_044960620', 'butyrylCoA.fasta'),
    ('WP_005925321', 'ptsP.fasta'),
    ('WP_341271153', 'MutS.fasta'),
):
    download_fasta(ncbi_id, fasta_name)


FASTA download for gene WP_044960620 completed and saved in genes\butyrylCoA.fasta.
FASTA download for gene WP_005925321 completed and saved in genes\ptsP.fasta.
FASTA download for gene WP_341271153 completed and saved in genes\MutS.fasta.
