# Pathway analysis of metagenomic data

First, install the required libraries and load them.


In [None]:
# Install BiocManager from CRAN if it is not already available.
# requireNamespace() only checks that the package can be loaded; it does not
# attach it, which is sufficient because it is called below via BiocManager::.
if (!requireNamespace("BiocManager", quietly = TRUE)) {
  install.packages("BiocManager")
}

# Install the Bioconductor packages used in this notebook in a single call.
BiocManager::install(c(
  "clusterProfiler",
  "org.Hs.eg.db",
  "org.EcK12.eg.db",
  "KEGGREST"
))

In [None]:
library(clusterProfiler)
library(KEGGREST)
library(org.Hs.eg.db)
library(org.EcK12.eg.db)
#keytypes(org.EcK12.eg.db)

# Load the metagenomics table. The file is read as tab-separated with a
# header row, so the tab-delimited reader is used despite the .csv extension.
metagenomics <- read.delim("../Data/ecs_relab_split.csv")
head(metagenomics)

## KEGG pathway over-representation analysis

In [None]:
# Convert the EC numbers in the Gene.Family column to Entrez gene IDs using
# the E. coli K-12 annotation database.
gene <- clusterProfiler::bitr(
  metagenomics$Gene.Family,
  fromType = "ENZYME",
  toType = "ENTREZID",
  OrgDb = org.EcK12.eg.db
)

# Pick the Entrez column by name rather than by position, and de-duplicate so
# that the same ID is not sent to the KEGG REST service more than once.
entrez_ids <- unique(gene[["ENTREZID"]])

# Fail early with a clear message instead of issuing an empty KEGG query.
if (length(entrez_ids) == 0) {
  stop("No EC numbers could be mapped to Entrez IDs.", call. = FALSE)
}

# Convert Entrez IDs to KEGG IDs; each ID is prefixed with "ncbi-geneid:"
# before being passed to keggConv().
geneList <- paste0("ncbi-geneid:", entrez_ids)
geneList <- keggConv("eco", geneList)

In [30]:
# Strip the literal "eco:" prefix from the converted KEGG identifiers
geneList <- gsub("eco:", "", geneList, fixed = TRUE)

# KEGG over-representation analysis for organism "eco" with a
# pvalueCutoff of 0.05; show the first rows of the result
kk <- enrichKEGG(
  gene = geneList,
  organism = "eco",
  pvalueCutoff = 0.05
)
head(kk)

Unnamed: 0_level_0,ID,Description,GeneRatio,BgRatio,pvalue,p.adjust,qvalue,geneID,Count
Unnamed: 0_level_1,<chr>,<chr>,<chr>,<chr>,<dbl>,<dbl>,<dbl>,<chr>,<int>
eco01110,eco01110,Biosynthesis of secondary metabolites,295/874,339/1722,6.180597e-55,5.1917020000000005e-53,1.756591e-53,b4471/b4395/b4388/b4384/b4268/b4254/b4232/b4171/b4160/b4154/b4153/b4131/b4122/b4090/b4069/b4054/b4042/b4041/b4039/b4025/b4024/b4019/b4015/b4014/b4013/b4006/b4005/b3997/b3960/b3959/b3958/b3957/b3942/b3940/b3939/b3930/b3925/b3919/b3918/b3916/b3867/b3850/b3846/b3845/b3829/b3821/b3809/b3805/b3804/b3803/b3789/b3788/b3774/b3772/b3771/b3770/b3769/b3744/b3671/b3670/b3612/b3608/b3607/b3589/b3572/b3571/b3553/b3519/b3517/b3437/b3433/b3432/b3430/b3429/b3428/b3426/b3417/b3416/b3403/b3390/b3389/b3386/b3385/b3368/b3359/b3281/b3256/b3236/b3213/b3212/b3172/b3124/b3117/b3059/b3041/b3018/b3008/b2979/b2976/b2965/b2957/b2942/b2935/b2926/b2925/b2914/b2913/b2905/b2903/b2889/b2844/b2838/b2818/b2797/b2779/b2752/b2751/b2747/b2746/b2744/b2601/b2600/b2599/b2585/b2557/b2551/b2533/b2518/b2515/b2508/b2500/b2499/b2478/b2476/b2465/b2464/b2436/b2414/b2400/b2388/b2342/b2341/b2329/b2316/b2312/b2290/b2265/b2264/b2263/b2262/b2261/b2260/b2243/b2242/b2241/b2232/b2224/b2210/b2132/b2097/b2049/b2048/b2042/b2041/b2040/b2039/b2038/b2029/b2026/b2024/b2022/b2021/b2020/b2019/b1927/b1897/b1896/b1854/b1852/b1849/b1814/b1780/b1779/b1767/b1732/b1723/b1704/b1702/b1693/b1692/b1676/b1662/b1622/b1617/b1613/b1612/b1611/b1493/b1478/b1409/b1393/b1386/b1288/b1277/b1276/b1264/b1263/b1262/b1261/b1260/b1241/b1236/b1210/b1208/b1207/b1197/b1136/b1131/b1093/b1092/b1090/b1033/b1014/b0928/b0908/b0907/b0870/b0771/b0767/b0756/b0755/b0754/b0729/b0728/b0727/b0726/b0724/b0723/b0720/b0693/b0688/b0674/b0596/b0595/b0594/b0593/b0523/b0522/b0514/b0480/b0475/b0474/b0425/b0421/b0420/b0414/b0403/b0394/b0388/b0386/b0369/b0356/b0273/b0261/b0243/b0242/b0238/b0186/b0185/b0175/b0174/b0173/b0154/b0134/b0133/b0131/b0125/b0124/b0118/b0116/b0115/b0114/b0078/b0077/b0074/b0073/b0072/b0071/b0031/b0029/b0025/b0008/b0004/b0003/b0002,295
eco01230,eco01230,Biosynthesis of amino acids,115/874,117/1722,4.947445e-33,2.0779270000000003e-31,7.03058e-32,b4471/b4395/b4388/b4254/b4090/b4054/b4024/b4019/b4013/b3960/b3959/b3958/b3957/b3940/b3939/b3919/b3916/b3870/b3829/b3809/b3774/b3772/b3771/b3770/b3769/b3744/b3671/b3670/b3612/b3607/b3433/b3390/b3389/b3386/b3359/b3281/b3213/b3212/b3172/b3117/b3008/b2942/b2935/b2926/b2925/b2914/b2913/b2838/b2818/b2797/b2779/b2687/b2601/b2600/b2599/b2551/b2478/b2472/b2465/b2464/b2421/b2414/b2329/b2290/b2097/b2026/b2024/b2022/b2021/b2020/b2019/b1854/b1814/b1779/b1723/b1704/b1693/b1676/b1622/b1276/b1264/b1263/b1262/b1261/b1260/b1207/b1136/b0928/b0908/b0907/b0870/b0771/b0755/b0754/b0720/b0674/b0388/b0386/b0273/b0243/b0242/b0166/b0159/b0118/b0078/b0077/b0074/b0073/b0072/b0071/b0031/b0008/b0004/b0003/b0002,115
eco01120,eco01120,Microbial metabolism in diverse environments,212/874,268/1722,2.900829e-25,8.12232e-24,2.748153e-24,b4478/b4395/b4388/b4268/b4232/b4198/b4197/b4196/b4195/b4194/b4154/b4153/b4131/b4122/b4090/b4079/b4070/b4069/b4025/b4024/b4015/b4014/b3956/b3941/b3940/b3925/b3919/b3916/b3904/b3903/b3902/b3894/b3893/b3892/b3870/b3846/b3845/b3830/b3809/b3805/b3804/b3803/b3612/b3607/b3589/b3583/b3581/b3553/b3526/b3517/b3437/b3433/b3403/b3386/b3368/b3366/b3365/b3359/b3355/b3256/b3236/b3213/b3212/b3124/b3114/b3073/b2997/b2994/b2979/b2976/b2935/b2926/b2925/b2917/b2914/b2913/b2874/b2867/b2866/b2844/b2838/b2803/b2802/b2800/b2799/b2779/b2764/b2763/b2762/b2752/b2751/b2750/b2662/b2661/b2551/b2542/b2539/b2538/b2521/b2478/b2472/b2465/b2464/b2463/b2414/b2400/b2388/b2342/b2341/b2316/b2297/b2296/b2247/b2224/b2222/b2221/b2210/b2206/b2167/b2154/b2133/b2097/b2029/b1970/b1854/b1852/b1851/b1850/b1780/b1779/b1761/b1723/b1702/b1676/b1638/b1612/b1611/b1493/b1478/b1468/b1467/b1465/b1444/b1415/b1398/b1395/b1394/b1393/b1385/b1380/b1302/b1276/b1241/b1227/b1225/b1224/b1210/b1207/b1136/b1033/b1002/b0997/b0973/b0972/b0968/b0963/b0907/b0903/b0870/b0771/b0767/b0756/b0755/b0729/b0728/b0727/b0726/b0724/b0723/b0720/b0688/b0578/b0529/b0521/b0517/b0516/b0514/b0512/b0369/b0356/b0355/b0352/b0351/b0350/b0348/b0323/b0285/b0284/b0186/b0185/b0166/b0154/b0118/b0116/b0115/b0114/b0061/b0031/b0008/b0004/b0003/b0002,212
eco01200,eco01200,Carbon metabolism,101/874,110/1722,1.267216e-21,2.6611529999999998e-20,9.0039e-21,b4471/b4395/b4388/b4268/b4232/b4154/b4153/b4122/b4090/b4079/b4069/b4025/b4015/b4014/b3956/b3941/b3925/b3919/b3916/b3894/b3893/b3892/b3846/b3772/b3612/b3607/b3526/b3437/b3403/b3386/b3355/b3256/b3236/b3117/b2976/b2935/b2926/b2925/b2917/b2914/b2913/b2905/b2903/b2874/b2844/b2797/b2779/b2551/b2465/b2464/b2463/b2414/b2388/b2341/b2316/b2297/b2296/b2224/b2210/b2154/b2097/b2029/b1854/b1852/b1851/b1850/b1814/b1779/b1732/b1723/b1702/b1676/b1612/b1611/b1479/b1395/b1276/b1207/b1136/b0907/b0771/b0767/b0755/b0729/b0728/b0727/b0726/b0724/b0723/b0720/b0529/b0521/b0356/b0355/b0323/b0185/b0118/b0116/b0115/b0114/b0008,101
eco01240,eco01240,Biosynthesis of cofactors,110/874,140/1722,1.541481e-12,2.589689e-11,8.762105e-12,b4386/b4245/b4177/b4039/b3997/b3993/b3974/b3930/b3867/b3850/b3805/b3804/b3803/b3770/b3642/b3639/b3634/b3368/b3360/b3177/b3058/b3041/b2947/b2942/b2927/b2780/b2765/b2688/b2615/b2574/b2564/b2551/b2530/b2518/b2459/b2436/b2418/b2400/b2323/b2320/b2315/b2265/b2264/b2263/b2262/b2261/b2260/b2232/b2153/b2104/b2103/b2042/b2028/b1993/b1992/b1991/b1812/b1768/b1740/b1662/b1638/b1636/b1617/b1613/b1593/b1288/b1281/b1277/b1270/b1236/b1210/b1131/b1096/b1095/b1093/b1062/b0945/b0931/b0907/b0778/b0776/b0775/b0774/b0750/b0639/b0638/b0630/b0628/b0529/b0475/b0474/b0425/b0417/b0414/b0383/b0369/b0171/b0154/b0142/b0134/b0133/b0131/b0116/b0109/b0103/b0052/b0048/b0033/b0032/b0025,110
eco00630,eco00630,Glyoxylate and dicarboxylate metabolism,39/874,42/1722,3.363615e-09,4.709062e-08,1.593292e-08,b4069/b4015/b4014/b3894/b3893/b3892/b3870/b3553/b3385/b3236/b3125/b3124/b3062/b3061/b2979/b2976/b2917/b2905/b2903/b2844/b2799/b2551/b2373/b2224/b1850/b1800/b1732/b1415/b1276/b1232/b1033/b0771/b0720/b0514/b0509/b0508/b0507/b0118/b0116,39
