# Example: Metabolite workflow

This notebook shows how to use pyBiodatafuse when your input is a list of metabolites.
Our current data sources include:
* MolMeDB

In [1]:
# Import modules
import pandas as pd

from pyBiodatafuse import id_mapper
from pyBiodatafuse.annotators import molmedb
from pyBiodatafuse.utils import combine_sources

# Load the list of metabolites/chemicals/compounds

In [2]:
# Identifiers to annotate, one per line (replace with your own list).
metabolites_of_interest = """100208
10040286
10041551
10025195"""
# splitlines() copes with any line-ending style; stripping and filtering
# drops blank lines and stray whitespace so no empty identifier is produced
# when a pasted list ends with a newline.
metabolite_list = [
    line.strip() for line in metabolites_of_interest.splitlines() if line.strip()
]
len(metabolite_list)

4

In [3]:
# Wrap the identifiers in a one-column frame named "identifier".
data_input = pd.DataFrame({"identifier": metabolite_list})
data_input.head()

Unnamed: 0,identifier
0,100208
1,10040286
2,10041551
3,10025195


In [4]:
# Cross-reference the PubChem Compound identifiers, requesting every target
# data source ("All"). The call returns a pair: the mapping table previewed
# below and its accompanying metadata.
xref_result = id_mapper.bridgedb_xref(
    identifiers=data_input,
    input_species="Human",
    input_datasource="PubChem Compound",
    output_datasource="All",
)
bridgdb_df, bridgdb_metadata = xref_result
bridgdb_df.head(n=25)

Unnamed: 0,identifier,identifier.source,target,target.source
0,100208,PubChem-compound,90560,ChemSpider
1,100208,PubChem-compound,100208,PubChem Compound
2,100208,PubChem-compound,HMDB0244377,HMDB
3,100208,PubChem-compound,OFDNQWIFNXBECV-UHFFFAOYSA-N,InChIKey
4,100208,PubChem-compound,C11280,KEGG Compound
5,100208,PubChem-compound,Q104246146,Wikidata
6,10040286,PubChem-compound,10040286,PubChem Compound
7,10040286,PubChem-compound,CHEMBL602850,ChEMBL compound
8,10040286,PubChem-compound,Q27163373,Wikidata
9,10040286,PubChem-compound,91540,ChEBI


In [5]:
# Add the MolMeDB `transporter_inhibited` annotation to the mapped compounds.
# The annotator returns a pair: the annotated table and its metadata.
inhibitor_result = molmedb.get_mol_gene_inhibitor(bridgedb_df=bridgdb_df)
transporter_inhibited_df, transporter_inhibited_metadata = inhibitor_result
transporter_inhibited_df.head(n=5)

Unnamed: 0,identifier,identifier.source,target,target.source,transporter_inhibited
0,100208,PubChem-compound,OFDNQWIFNXBECV-UHFFFAOYSA-N,InChIKey,"[{'uniprot_trembl_id': 'P08183', 'hgcn_id': 'A..."
1,10025195,PubChem-compound,LEJRLSZVESQKJK-UHFFFAOYSA-N,InChIKey,"[{'uniprot_trembl_id': 'Q01959', 'hgcn_id': 'S..."
2,10040286,PubChem-compound,FYGREZKTJIXWIH-UHFFFAOYSA-N,InChIKey,"[{'uniprot_trembl_id': 'Q01959', 'hgcn_id': 'S..."
3,10041551,PubChem-compound,OVVBIIBBRZVPAL-UHFFFAOYSA-N,InChIKey,"[{'uniprot_trembl_id': 'P23975', 'hgcn_id': 'S..."


In [6]:
# Show the complete annotation for the first row; the table preview truncates
# this column. A single .loc lookup replaces the chained df[col][0] access.
transporter_inhibited_df.loc[0, "transporter_inhibited"]

[{'uniprot_trembl_id': 'P08183',
  'hgcn_id': 'ABCB1',
  'source_doi': 'doi:10.1074/jbc.271.6.3163',
  'source_pmid': '8621716'}]