# Gene term enrichment analysis

In [1]:
suppressMessages({
    library(clusterProfiler)
    library(org.Hs.eg.db)
    library(enrichplot)
    library(pathview)})

In [2]:
#' Build a ranked, named vector of log fold changes
#'
#' Rows of `dft` that contain a missing value in any column are discarded
#' first. The remaining `logFC` values are named by the identifiers found in
#' the `keytype` column and ordered from the largest to the smallest value.
#'
#' @param dft Data frame holding a `logFC` column and the `keytype` column.
#' @param keytype Name of the column that supplies the vector names.
#' @return The `logFC` values, named by identifier, in decreasing order.
extract_geneList <- function(dft, keytype='EntrezID'){
    complete_rows <- na.exclude(dft)
    # Attach the identifiers as names in one step, then rank by value.
    ranked <- setNames(as.vector(complete_rows[, 'logFC']),
                       as.vector(complete_rows[, keytype]))
    sort(ranked, decreasing=TRUE)
}


#' Extract the identifiers of significantly differentially expressed genes
#'
#' Rows of `dft` that contain a missing value in any column are discarded
#' first; the identifiers of the rows whose `adj.P.Val` is at most `alpha`
#' are then returned in row order (duplicates are kept).
#'
#' @param dft Data frame holding an `adj.P.Val` column and the `keytype`
#'   column.
#' @param keytype Name of the column that supplies the identifiers.
#' @param alpha Adjusted p-value cutoff (inclusive). The default of 0.05
#'   reproduces the previously hard-coded threshold.
#' @return Vector of identifiers taken from the `keytype` column.
extract_geneSet <- function(dft, keytype='EntrezID', alpha=0.05){
    # Fail early on a missing column: with subset() a missing `adj.P.Val`
    # would be looked up in the calling environment instead of erroring here.
    stopifnot(is.data.frame(dft),
              all(c('adj.P.Val', keytype) %in% colnames(dft)))
    dft <- na.exclude(dft)
    # No NA is left after na.exclude(), so plain logical indexing is safe.
    significant <- dft[dft[['adj.P.Val']] <= alpha, , drop=FALSE]
    as.vector(significant[[keytype]])
}


In [3]:
#' Render gene-level values onto a KEGG pathway map with pathview
#'
#' Thin wrapper around `pathview()`. In this notebook each call downloads the
#' pathway's xml/png files and writes `<pathwayID>.pathview.png` into the
#' working directory (see the cell output below each call).
#'
#' @param geneList Named vector passed to `pathview()` as `gene.data`.
#' @param pathwayID KEGG pathway identifier passed as `pathway.id`.
#' @param species Species code passed to `pathview()`; defaults to `'hsa'`,
#'   the value that was previously hard-coded.
#' @param limit Colour-scale limits passed to `pathview()`; defaults to the
#'   previously hard-coded `list(gene=0.75, cpd=0.75)`.
#' @return Whatever `pathview()` returns.
run_pathview <- function(geneList, pathwayID, species='hsa',
                         limit=list(gene=0.75, cpd=0.75)){
    pathview(gene.data = geneList, pathway.id = pathwayID,
             species = species, limit = limit)
}

## Genes

In [4]:
# Path of the differential-expression table analysed in this notebook.
inputfile <- "../../_m/genes/diffExpr_szVctl_full.txt"

# Read the tab-delimited table, then build the decreasing, ID-named logFC
# vector from it (names come from the default `EntrezID` column).
zz <- read.delim(inputfile)
geneList1 <- extract_geneList(zz)

In [5]:
# Map the Entrez IDs that name geneList1 to UniProt and Ensembl IDs with
# bitr(), then join that mapping to the differential-expression table `zz`
# on the Ensembl ID. bitr() reports a 1:many mapping (see the message below),
# so one input gene can contribute several rows to the joined table.
aa_uniprot <- merge(bitr(names(geneList1), fromType="ENTREZID",
                         toType=c("UNIPROT", "ENSEMBL"), OrgDb="org.Hs.eg.db"),
                    zz, by.x='ENSEMBL', by.y='ensemblID')
# Translate the UniProt accessions to KEGG gene IDs with bitr_kegg() (the
# annotation is read online) and attach them to the joined table by UniProt
# accession. NOTE(review): IDs that fail either mapping step are absent from
# the result -- confirm this loss is acceptable for the downstream plots.
aa_kegg <- merge(bitr_kegg(aa_uniprot[['UNIPROT']], fromType='uniprot',
                           toType='kegg', organism='hsa'), 
                 aa_uniprot, by.x='uniprot', by.y='UNIPROT')

'select()' returned 1:many mapping between keys and columns

“10.11% of input gene IDs are fail to map...”
Reading KEGG annotation online:


“24.32% of input gene IDs are fail to map...”


In [6]:
# Ranked logFC vector named by KEGG gene ID; this is the input of the
# pathview plots below.
geneList2 <- extract_geneList(aa_kegg, 'kegg')
# KEGG IDs of the rows with adj.P.Val <= 0.05.
gene2 <- extract_geneSet(aa_kegg, 'kegg')

### Pathview plotting

In [7]:
# Draw the logFC values of geneList2 onto KEGG pathway hsa04020
# (presumably "Calcium signaling pathway" -- verify against KEGG).
run_pathview(geneList2, "hsa04020")

Info: Downloading xml files for hsa04020, 1/1 pathways..

Info: Downloading png files for hsa04020, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/sex_differences_sz/interaction_sex_sz/by_sex_sz/caudate/female_analysis/dopamine_system/_m

Info: Writing image file hsa04020.pathview.png



In [8]:
# Draw the logFC values of geneList2 onto KEGG pathway hsa04728
# (presumably "Dopaminergic synapse" -- verify against KEGG).
run_pathview(geneList2, "hsa04728")

Info: Downloading xml files for hsa04728, 1/1 pathways..

Info: Downloading png files for hsa04728, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/sex_differences_sz/interaction_sex_sz/by_sex_sz/caudate/female_analysis/dopamine_system/_m

Info: Writing image file hsa04728.pathview.png



In [9]:
# Draw the logFC values of geneList2 onto KEGG pathway hsa04713
# (presumably "Circadian entrainment" -- verify against KEGG).
run_pathview(geneList2, "hsa04713")

Info: Downloading xml files for hsa04713, 1/1 pathways..

Info: Downloading png files for hsa04713, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/sex_differences_sz/interaction_sex_sz/by_sex_sz/caudate/female_analysis/dopamine_system/_m

Info: Writing image file hsa04713.pathview.png



## Session Info

In [10]:
# Reproducibility record: current time and the CPU/elapsed time used by this
# R process so far.
Sys.time()
proc.time()
# Set the output width to 120 columns before printing the session details.
options(width=120)
# Report the packages in the session together with their versions and sources.
sessioninfo::session_info()

[1] "2021-11-24 12:12:59 EST"

   user  system elapsed 
  9.980   0.380  78.498 

Unnamed: 0_level_0,package,ondiskversion,loadedversion,path,loadedpath,attached,is_base,date,source,md5ok,library
Unnamed: 0_level_1,<chr>,<chr>,<chr>,<chr>,<chr>,<lgl>,<lgl>,<chr>,<chr>,<lgl>,<fct>
AnnotationDbi,AnnotationDbi,1.54.1,1.54.1,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/AnnotationDbi,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/AnnotationDbi,TRUE,FALSE,2021-06-08,Bioconductor,,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1
ape,ape,5.5,5.5,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/ape,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/ape,FALSE,FALSE,2021-04-25,CRAN (R 4.1.2),,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1
aplot,aplot,0.1.1,0.1.1,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/aplot,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/aplot,FALSE,FALSE,2021-09-22,CRAN (R 4.1.2),,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1
assertthat,assertthat,0.2.1,0.2.1,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/assertthat,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/assertthat,FALSE,FALSE,2019-03-21,CRAN (R 4.1.0),,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1
base64enc,base64enc,0.1.3,0.1-3,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/base64enc,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/base64enc,FALSE,FALSE,2015-07-28,CRAN (R 4.1.0),,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1
Biobase,Biobase,2.52.0,2.52.0,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/Biobase,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/Biobase,TRUE,FALSE,2021-05-19,Bioconductor,,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1
BiocGenerics,BiocGenerics,0.38.0,0.38.0,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/BiocGenerics,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/BiocGenerics,TRUE,FALSE,2021-05-19,Bioconductor,,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1
BiocParallel,BiocParallel,1.26.2,1.26.2,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/BiocParallel,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/BiocParallel,FALSE,FALSE,2021-08-22,Bioconductor,,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1
Biostrings,Biostrings,2.60.2,2.60.2,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/Biostrings,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/Biostrings,FALSE,FALSE,2021-08-05,Bioconductor,,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1
bit,bit,4.0.4,4.0.4,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/bit,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1/bit,FALSE,FALSE,2020-08-04,CRAN (R 4.1.0),,/home/kynon/R/x86_64-pc-linux-gnu-library/4.1
