# Metabolomic genes mining from *PathMeUniverse*

## 1. Importing Pathway-Datasets mappings from *ComPath*

In [1]:
import pandas as pd
import requests
import io

### 1.1. KEGG-Reactome Mapping

In [2]:
# Download the KEGG-Reactome mapping CSV from the ComPath GitHub repository.
# The URL must be the *raw* version of the file, not the GitHub HTML page.
url = "https://raw.githubusercontent.com/ComPath/compath-resources/master/mappings/kegg_reactome.csv"
response = requests.get(url, timeout=30)  # bounded wait so a stalled connection cannot hang the kernel
# Fail loudly on 4xx/5xx instead of handing an error page to the CSV parser.
response.raise_for_status()
download = response.content

# Decode the downloaded bytes as UTF-8 and parse them into a pandas DataFrame.
kegg2reactome = pd.read_csv(io.StringIO(download.decode('utf-8')))
kegg2reactome.head()

Unnamed: 0,Source Resource,Source ID,Source Name,Mapping Type,Target Resource,Target ID,Target Name
0,reactome,R-HSA-2978092,Abnormal conversion of 2-oxoglutarate to 2-hyd...,isPartOf,kegg.pathway,path:hsa01210,2-Oxocarboxylic acid metabolism - Homo sapiens...
1,reactome,R-HSA-71406,Pyruvate metabolism and Citric Acid (TCA) cycle,isPartOf,kegg.pathway,path:hsa01210,2-Oxocarboxylic acid metabolism - Homo sapiens...
2,kegg.pathway,path:hsa02010,ABC transporters - Homo sapiens (human),equivalentTo,reactome,R-HSA-1369007,Mitochondrial ABC transporters
3,reactome,R-HSA-5683177,Defective ABCC8 can cause hypoglycemias and hy...,isPartOf,kegg.pathway,path:hsa02010,ABC transporters - Homo sapiens (human)
4,reactome,R-HSA-5679001,Defective ABCC2 causes Dubin-Johnson syndrome,isPartOf,kegg.pathway,path:hsa02010,ABC transporters - Homo sapiens (human)


### 1.2. WikiPathways-Reactome Mapping

In [3]:
# Download the WikiPathways-Reactome mapping CSV from the ComPath GitHub repository.
# The URL must be the *raw* version of the file, not the GitHub HTML page.
url = "https://raw.githubusercontent.com/ComPath/compath-resources/master/mappings/wikipathways_reactome.csv"
response = requests.get(url, timeout=30)  # bounded wait so a stalled connection cannot hang the kernel
# Fail loudly on 4xx/5xx instead of handing an error page to the CSV parser.
response.raise_for_status()
download = response.content

# Decode the downloaded bytes as UTF-8 and parse them into a pandas DataFrame.
wp2reactome = pd.read_csv(io.StringIO(download.decode('utf-8')))
wp2reactome.head()

Unnamed: 0,Source Resource,Source ID,Source Name,Mapping Type,Target Resource,Target ID,Target Name
0,reactome,R-HSA-163680,AMPK inhibits chREBP transcriptional activatio...,isPartOf,wikipathways,WP1403,AMP-activated Protein Kinase (AMPK) Signaling
1,reactome,R-HSA-176187,Activation of ATR in response to replication s...,isPartOf,wikipathways,WP3875,ATR Signaling
2,wikipathways,WP528,Acetylcholine Synthesis,isPartOf,reactome,R-HSA-1430728,Metabolism
3,wikipathways,WP699,Aflatoxin B1 metabolism,isPartOf,reactome,R-HSA-1430728,Metabolism
4,reactome,R-HSA-5423646,Aflatoxin activation and detoxification,isPartOf,wikipathways,WP699,Aflatoxin B1 metabolism


## 2. Metabolomic pathways filtering

### 2.1. KEGG pathways

#### 2.1.1. `Metabolism` exact match

In [4]:
# Rows whose source is a KEGG pathway and whose target pathway is named
# exactly 'Metabolism' (case-sensitive equality on 'Target Name').
kegg_match_met_pw = kegg2reactome.loc[
    kegg2reactome['Source Resource'].isin(['kegg.pathway'])
    & kegg2reactome['Target Name'].eq('Metabolism')
]
kegg_match_met_pw.head()

Unnamed: 0,Source Resource,Source ID,Source Name,Mapping Type,Target Resource,Target ID,Target Name
24,kegg.pathway,path:hsa04920,Adipocytokine signaling pathway - Homo sapiens...,isPartOf,reactome,R-HSA-1430728,Metabolism
26,kegg.pathway,path:hsa00250,"Alanine, aspartate and glutamate metabolism - ...",isPartOf,reactome,R-HSA-1430728,Metabolism
27,kegg.pathway,path:hsa04925,Aldosterone synthesis and secretion - Homo sap...,isPartOf,reactome,R-HSA-1430728,Metabolism
31,kegg.pathway,path:hsa00520,Amino sugar and nucleotide sugar metabolism - ...,isPartOf,reactome,R-HSA-1430728,Metabolism
32,kegg.pathway,path:hsa00970,Aminoacyl-tRNA biosynthesis - Homo sapiens (hu...,isPartOf,reactome,R-HSA-1430728,Metabolism


In [5]:
# Reduce the filtered frame to its 'Source ID' column (the KEGG pathway IDs).
# NOTE: this rebinds the name from a DataFrame to a Series, so re-run the
# filtering cell first if this cell has to be executed again.
kegg_match_met_pw = kegg_match_met_pw['Source ID']
kegg_match_met_pw.head(5)

24    path:hsa04920
26    path:hsa00250
27    path:hsa04925
31    path:hsa00520
32    path:hsa00970
Name: Source ID, dtype: object

#### 2.1.2. `Metabolism` contained

In [6]:
# Rows whose source is a KEGG pathway and whose lower-cased target name
# contains the substring "metabolism" anywhere.
kegg_cont_met_pw = kegg2reactome.loc[
    kegg2reactome["Target Name"].str.lower().str.contains("metabolism")
    & kegg2reactome['Source Resource'].isin(['kegg.pathway'])
]
kegg_cont_met_pw.head()

Unnamed: 0,Source Resource,Source ID,Source Name,Mapping Type,Target Resource,Target ID,Target Name
24,kegg.pathway,path:hsa04920,Adipocytokine signaling pathway - Homo sapiens...,isPartOf,reactome,R-HSA-1430728,Metabolism
25,kegg.pathway,path:hsa00250,"Alanine, aspartate and glutamate metabolism - ...",isPartOf,reactome,R-HSA-71291,Metabolism of amino acids and derivatives
26,kegg.pathway,path:hsa00250,"Alanine, aspartate and glutamate metabolism - ...",isPartOf,reactome,R-HSA-1430728,Metabolism
27,kegg.pathway,path:hsa04925,Aldosterone synthesis and secretion - Homo sap...,isPartOf,reactome,R-HSA-1430728,Metabolism
31,kegg.pathway,path:hsa00520,Amino sugar and nucleotide sugar metabolism - ...,isPartOf,reactome,R-HSA-1430728,Metabolism


In [7]:
# Reduce the filtered frame to its 'Source ID' column (the KEGG pathway IDs).
# The same ID can appear more than once, as the preview below shows.
# NOTE: this rebinds the name from a DataFrame to a Series, so re-run the
# filtering cell first if this cell has to be executed again.
kegg_cont_met_pw = kegg_cont_met_pw['Source ID']
kegg_cont_met_pw.head(5)

24    path:hsa04920
25    path:hsa00250
26    path:hsa00250
27    path:hsa04925
31    path:hsa00520
Name: Source ID, dtype: object

### 2.2. Reactome pathways

In [8]:
# Rows of the KEGG-Reactome mapping whose target resource is Reactome and
# whose target pathway is named exactly 'Metabolism'.
reactome_match_met_pw = kegg2reactome.loc[
    kegg2reactome['Target Resource'].isin(['reactome'])
    & kegg2reactome['Target Name'].eq('Metabolism')
]
reactome_match_met_pw.head()

Unnamed: 0,Source Resource,Source ID,Source Name,Mapping Type,Target Resource,Target ID,Target Name
24,kegg.pathway,path:hsa04920,Adipocytokine signaling pathway - Homo sapiens...,isPartOf,reactome,R-HSA-1430728,Metabolism
26,kegg.pathway,path:hsa00250,"Alanine, aspartate and glutamate metabolism - ...",isPartOf,reactome,R-HSA-1430728,Metabolism
27,kegg.pathway,path:hsa04925,Aldosterone synthesis and secretion - Homo sap...,isPartOf,reactome,R-HSA-1430728,Metabolism
31,kegg.pathway,path:hsa00520,Amino sugar and nucleotide sugar metabolism - ...,isPartOf,reactome,R-HSA-1430728,Metabolism
32,kegg.pathway,path:hsa00970,Aminoacyl-tRNA biosynthesis - Homo sapiens (hu...,isPartOf,reactome,R-HSA-1430728,Metabolism


In [9]:
# Reduce the filtered frame to its 'Target ID' column (the Reactome IDs).
# NOTE(review): the previewed rows all carry the same Target ID; confirm
# whether downstream steps expect de-duplicated IDs.
# NOTE: this rebinds the name from a DataFrame to a Series, so re-run the
# filtering cell first if this cell has to be executed again.
reactome_match_met_pw = reactome_match_met_pw['Target ID']
reactome_match_met_pw.head(5)

24    R-HSA-1430728
26    R-HSA-1430728
27    R-HSA-1430728
31    R-HSA-1430728
32    R-HSA-1430728
Name: Target ID, dtype: object

#### 2.2.2. `Metabolism` contained

In [10]:
# Rows of the KEGG-Reactome mapping whose target resource is Reactome and
# whose lower-cased target name contains the substring "metabolism".
reactome_cont_met_pw = kegg2reactome.loc[
    kegg2reactome["Target Name"].str.lower().str.contains("metabolism")
    & kegg2reactome['Target Resource'].isin(['reactome'])
]
reactome_cont_met_pw.head()


Unnamed: 0,Source Resource,Source ID,Source Name,Mapping Type,Target Resource,Target ID,Target Name
24,kegg.pathway,path:hsa04920,Adipocytokine signaling pathway - Homo sapiens...,isPartOf,reactome,R-HSA-1430728,Metabolism
25,kegg.pathway,path:hsa00250,"Alanine, aspartate and glutamate metabolism - ...",isPartOf,reactome,R-HSA-71291,Metabolism of amino acids and derivatives
26,kegg.pathway,path:hsa00250,"Alanine, aspartate and glutamate metabolism - ...",isPartOf,reactome,R-HSA-1430728,Metabolism
27,kegg.pathway,path:hsa04925,Aldosterone synthesis and secretion - Homo sap...,isPartOf,reactome,R-HSA-1430728,Metabolism
31,kegg.pathway,path:hsa00520,Amino sugar and nucleotide sugar metabolism - ...,isPartOf,reactome,R-HSA-1430728,Metabolism


In [11]:
# Reduce the filtered frame to its 'Target ID' column (the Reactome IDs).
# NOTE: this rebinds the name from a DataFrame to a Series, so re-run the
# filtering cell first if this cell has to be executed again.
reactome_cont_met_pw = reactome_cont_met_pw['Target ID']
reactome_cont_met_pw.head(5)

24    R-HSA-1430728
25      R-HSA-71291
26    R-HSA-1430728
27    R-HSA-1430728
31    R-HSA-1430728
Name: Target ID, dtype: object

### 2.3. WikiPathways pathways

#### 2.3.1. `Metabolism` exact match

In [12]:
# Rows whose source is a WikiPathways pathway and whose target pathway is
# named exactly 'Metabolism' (case-sensitive equality on 'Target Name').
wp_match_met_pw = wp2reactome.loc[
    wp2reactome['Source Resource'].isin(['wikipathways'])
    & wp2reactome['Target Name'].eq('Metabolism')
]
wp_match_met_pw.head()

Unnamed: 0,Source Resource,Source ID,Source Name,Mapping Type,Target Resource,Target ID,Target Name
2,wikipathways,WP528,Acetylcholine Synthesis,isPartOf,reactome,R-HSA-1430728,Metabolism
3,wikipathways,WP699,Aflatoxin B1 metabolism,isPartOf,reactome,R-HSA-1430728,Metabolism
7,wikipathways,WP106,Alanine and aspartate metabolism,isPartOf,reactome,R-HSA-1430728,Metabolism
14,wikipathways,WP3925,Amino Acid metabolism,isPartOf,reactome,R-HSA-1430728,Metabolism
16,wikipathways,WP521,Amino acid conjugation of benzoic acid,isPartOf,reactome,R-HSA-1430728,Metabolism


In [13]:
# Reduce the filtered frame to its 'Source ID' column (the WikiPathways IDs).
# NOTE: this rebinds the name from a DataFrame to a Series, so re-run the
# filtering cell first if this cell has to be executed again.
wp_match_met_pw = wp_match_met_pw['Source ID']
wp_match_met_pw.head(5)

2      WP528
3      WP699
7      WP106
14    WP3925
16     WP521
Name: Source ID, dtype: object

#### 2.3.2. `Metabolism` contained

In [14]:
# Rows whose source is a WikiPathways pathway and whose lower-cased target
# name contains the substring "metabolism" anywhere.
wp_cont_met_pw = wp2reactome.loc[
    wp2reactome['Target Name'].str.lower().str.contains("metabolism")
    & wp2reactome['Source Resource'].isin(['wikipathways'])
]
wp_cont_met_pw.head()

Unnamed: 0,Source Resource,Source ID,Source Name,Mapping Type,Target Resource,Target ID,Target Name
2,wikipathways,WP528,Acetylcholine Synthesis,isPartOf,reactome,R-HSA-1430728,Metabolism
3,wikipathways,WP699,Aflatoxin B1 metabolism,isPartOf,reactome,R-HSA-1430728,Metabolism
5,wikipathways,WP106,Alanine and aspartate metabolism,isPartOf,reactome,R-HSA-71291,Metabolism of amino acids and derivatives
7,wikipathways,WP106,Alanine and aspartate metabolism,isPartOf,reactome,R-HSA-1430728,Metabolism
12,wikipathways,WP3925,Amino Acid metabolism,equivalentTo,reactome,R-HSA-71291,Metabolism of amino acids and derivatives


In [15]:
# Reduce the filtered frame to its 'Source ID' column (the WikiPathways IDs).
# The same ID can appear more than once, as the preview below shows.
# NOTE: this rebinds the name from a DataFrame to a Series, so re-run the
# filtering cell first if this cell has to be executed again.
wp_cont_met_pw = wp_cont_met_pw['Source ID']
wp_cont_met_pw.head(5)

2      WP528
3      WP699
5      WP106
7      WP106
12    WP3925
Name: Source ID, dtype: object

## 3. Gene entities mining from metabolomic pathways