## Resultados do NCBI

In [1]:
import os, sys, inspect
import pandas as pd
from IPython.core.display import display, HTML

def import_modules():
    """
    Make the modules developed for this project importable.

    Resolves the directory containing the currently executing code, takes
    that directory's parent and places it at the front of ``sys.path``.
    Nothing is imported here; callers import the modules afterwards.
    """
    running_file = inspect.getfile(inspect.currentframe())
    here = os.path.dirname(os.path.abspath(running_file))
    parent = os.path.dirname(here)
    # Front of the list so this directory wins over any other entry.
    sys.path.insert(0, parent)
    
def pretty_print_location(location):
    """
    Render a location record as an HTML unordered list.

    Args:
        location: Mapping that provides the keys "start", "end" and
            "strand". A falsy value (for example the "" placeholder that
            replaces missing data after ``fillna("")``) is also accepted.

    Returns:
        A ``<ul>`` fragment with one ``<li>`` per key, in the order
        start, end, strand; or an empty string when ``location`` is falsy.

    Raises:
        KeyError: If a non-empty mapping lacks one of the three keys.
    """
    # Rows without location data arrive as "" (or None); indexing those
    # would fail, so render them as an empty cell instead.
    if not location:
        return ""

    items = "".join(
        "<li><strong>" + key + ":</strong> " + str(location[key]) + "</li>"
        for key in ("start", "end", "strand")
    )
    return "<ul>" + items + "</ul>"

def main():
    """
    Load the NCBI results and display them as an HTML table.

    Reads "files/.ncbi.json" through the project's ``util.rw`` helper,
    turns it into a DataFrame, replaces missing values with empty strings,
    formats the "location" column as an HTML list and renders the selected
    columns in the notebook.
    """
    import_modules()
    import util.rw as rw

    # Show every row (up to 250) instead of eliding the middle of the table.
    pd.options.display.max_rows = 250

    # Do not truncate cell contents. None is the supported "no limit"
    # value since pandas 1.0; the former -1 sentinel is rejected by recent
    # releases. Older pandas only accepts integers, hence the fallback.
    try:
        pd.set_option("display.max_colwidth", None)
    except ValueError:
        pd.set_option("display.max_colwidth", -1)

    # NOTE(review): presumably a dict of per-gene dicts keyed by locus tag;
    # the transpose below then yields one row per gene. Confirm against the
    # file contents.
    ncbi = rw.read_json("files/.ncbi.json")
    columns_to_show = [
        "uniprot_id",
        "type",
        "EC_number",
        "gene",
        "gene_id",
        "protein_id",
        "length",
        "location",
        "product",
    ]

    df = pd.DataFrame(ncbi).transpose()
    df = df.fillna("")
    df["location"] = df["location"].apply(pretty_print_location)
    # escape=False keeps the <ul> markup produced for "location" intact.
    display(HTML(df[columns_to_show].to_html(escape=False)))
    
# Render the NCBI results table when this cell is executed.
main()

Unnamed: 0,uniprot_id,type,EC_number,gene,gene_id,protein_id,length,location,product
lpg0232,Q5ZYX9_LEGPH,mRNA,,np20,19831799,YP_094286.1,177.0,start: 270036; end: 270569; strand: 1,transcriptional regulator np20
lpg0233,Q5ZYX8_LEGPH,mRNA,4.1.1.7,mdlC,19831800,YP_094287.1,530.0,start: 270686; end: 272278; strand: -1,benzoylformate decarboxylase
lpg0234,Q5ZYX7_LEGPH,mRNA,,sidE,19831801,YP_094288.1,1514.0,start: 272577; end: 277121; strand: -1,protein SidE
lpg0235,Q5ZYX6_LEGPH,mRNA,,,19831802,YP_094289.1,167.0,start: 277484; end: 277987; strand: -1,hypothetical protein
lpg0236,Q5ZYX5_LEGPH,mRNA,,,19831803,YP_094290.1,659.0,start: 278060; end: 280039; strand: -1,hypothetical protein
lpg0237,Q5ZYX4_LEGPH,mRNA,,mhpC,19831804,YP_094291.1,264.0,start: 280320; end: 281114; strand: 1,lipolytic protein
lpg0238,Q5ZYX3_LEGPH,mRNA,1.2.1.8,gbsA,19831805,YP_094292.1,488.0,start: 281131; end: 282597; strand: 1,glycine betaine aldehyde dehydrogenase
lpg0239,Q5ZYX2_LEGPH,mRNA,2.6.1.19,gabT,19831806,YP_094293.1,450.0,start: 282572; end: 283924; strand: 1,4-aminobutyrate transaminase
lpg0240,Q5ZYX1_LEGPH,mRNA,,recN,19831807,YP_094294.1,259.0,start: 284008; end: 284787; strand: 1,DNA repair protein
lpg0241,GLSA_LEGPH,mRNA,3.5.1.2,,19831808,YP_094295.1,310.0,start: 285047; end: 285979; strand: 1,glutaminase
