# Gene term enrichment analysis

In [1]:
library(pathview)
library(dplyr)



##############################################################################
Pathview is an open source software package distributed under GNU General
Public License version 3 (GPLv3). Details of GPLv3 is available at
http://www.gnu.org/licenses/gpl-3.0.html. Particullary, users are required to
formally cite the original Pathview paper (not just mention it) in publications
or products. For details, do citation("pathview") within R.

The pathview downloads and uses KEGG data. Non-academic uses may require a KEGG
license agreement (details at http://www.kegg.jp/kegg/legal.html).
##############################################################################


Attaching package: ‘dplyr’


The following objects are masked from ‘package:stats’:

    filter, lag


The following objects are masked from ‘package:base’:

    intersect, setdiff, setequal, union




## Prep data

In [2]:
# Differential expression table; the file name suggests a gene-level
# schizophrenia-vs-control contrast (NOTE(review): confirm against the
# upstream differential_expression step).
inputfile <- "../../../differential_expression/_m/genes/diffExpr_szVctl_full.txt"

# Read the table once and share it between the two objects below.
# na.exclude() drops every row that has an NA in any column.
de_table <- data.table::fread(inputfile) %>% na.exclude()

# geneList: one-column data frame of logFC values with EntrezID as row names;
# this is what run_pathview() hands to pathview(gene.data = ...).
# distinct() keeps only the first row seen for each EntrezID.
#
# rownames_to_column() is kept even though select() discards the `rowname`
# column it adds. NOTE(review): it appears to be what clears the row names
# left behind by na.exclude(), which column_to_rownames() requires to be
# absent -- confirm before removing it.
#
# The former trailing `as.vector` is intentionally gone: on a data frame it
# was a no-op up to R 4.2, but from R 4.3.0 it returns a bare list and throws
# away the EntrezID row names. Without it the result is the same on every
# R version.
geneList <- de_table %>%
    tibble::rownames_to_column() %>%
    select(logFC, EntrezID) %>%
    distinct(EntrezID, .keep_all = TRUE) %>%
    tibble::column_to_rownames("EntrezID")

# genes: one-column data frame of the unique EntrezIDs whose adjusted
# p-value is <= 0.05. Kept as a data frame (what `as.vector` effectively
# returned under R 4.0.3) for the same version-stability reason as above.
genes <- de_table %>%
    filter(`adj.P.Val` <= 0.05) %>%
    tibble::rownames_to_column() %>%
    select(EntrezID) %>%
    distinct(EntrezID, .keep_all = TRUE)

## Pathview plotting

In [3]:
#' Draw one human KEGG pathway coloured by the values in `geneList`.
#'
#' `geneList` is not an argument: it is looked up in the enclosing
#' (notebook/global) environment at call time.
#'
#' @param pathwayID KEGG pathway identifier, e.g. "hsa04020".
#' @param native Forwarded to pathview's `kegg.native`. With the default
#'   `TRUE` the run log in this notebook shows a `.pathview.png` being
#'   written; with `FALSE` it shows a `.pathview.pdf`.
#' @return The value returned by `pathview()`.
run_pathview <- function(pathwayID, native=TRUE){
    # Same limit value for the gene and compound colour scales.
    scale_limits <- list(gene=0.5, cpd=0.5)
    pathview(
        gene.data   = geneList,
        pathway.id  = pathwayID,
        species     = "hsa",
        limit       = scale_limits,
        kegg.native = native
    )
}

In [4]:
# Render two pathways with the default native KEGG layout.
# Pathway names as listed by KEGG (verify there if in doubt):
#   hsa04020 = calcium signaling, hsa00350 = tyrosine metabolism.
for (pathway_id in c("hsa04020", "hsa00350")) {
    run_pathview(pathway_id)
}

Info: Downloading xml files for hsa04020, 1/1 pathways..

Info: Downloading png files for hsa04020, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/LieberInstituteBrainSeqPhase3CaudateSchizophrenia/analysis/differential_expression/kegg_pathways/_m

Info: Writing image file hsa04020.pathview.png

Info: Downloading xml files for hsa00350, 1/1 pathways..

Info: Downloading png files for hsa00350, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/LieberInstituteBrainSeqPhase3CaudateSchizophrenia/analysis/differential_expression/kegg_pathways/_m

Info: Writing image file hsa00350.pathview.png



In [5]:
# Render the consecutive pathways hsa04724..hsa04727 in order.
# Pathway names as listed by KEGG (verify there if in doubt):
#   glutamatergic, cholinergic, serotonergic and GABAergic synapse.
synapse_ids <- c("hsa04724", "hsa04725", "hsa04726", "hsa04727")
for (pathway_id in synapse_ids) {
    run_pathview(pathway_id)
}

Info: Downloading xml files for hsa04724, 1/1 pathways..

Info: Downloading png files for hsa04724, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/LieberInstituteBrainSeqPhase3CaudateSchizophrenia/analysis/differential_expression/kegg_pathways/_m

Info: Writing image file hsa04724.pathview.png

Info: Downloading xml files for hsa04725, 1/1 pathways..

Info: Downloading png files for hsa04725, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/LieberInstituteBrainSeqPhase3CaudateSchizophrenia/analysis/differential_expression/kegg_pathways/_m

Info: Writing image file hsa04725.pathview.png

Info: Downloading xml files for hsa04726, 1/1 pathways..

Info: Downloading png files for hsa04726, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/gith

In [6]:
# Dopamine pathway, rendered twice: first with native=TRUE (the default used
# by the plain call), then with native=FALSE. The run log shows a PNG for the
# first and a PDF for the second.
for (use_native in c(TRUE, FALSE)) {
    run_pathview("hsa04728", use_native)
}

Info: Downloading xml files for hsa04728, 1/1 pathways..

Info: Downloading png files for hsa04728, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/LieberInstituteBrainSeqPhase3CaudateSchizophrenia/analysis/differential_expression/kegg_pathways/_m

Info: Writing image file hsa04728.pathview.png

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/LieberInstituteBrainSeqPhase3CaudateSchizophrenia/analysis/differential_expression/kegg_pathways/_m

Info: Writing image file hsa04728.pathview.pdf



In [7]:
# Render two more pathways with the default native KEGG layout.
# Pathway names as listed by KEGG (verify there if in doubt):
#   hsa04024 = cAMP signaling, hsa04540 = gap junction.
for (pathway_id in c("hsa04024", "hsa04540")) {
    run_pathview(pathway_id)
}

Info: Downloading xml files for hsa04024, 1/1 pathways..

Info: Downloading png files for hsa04024, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/LieberInstituteBrainSeqPhase3CaudateSchizophrenia/analysis/differential_expression/kegg_pathways/_m

Info: Writing image file hsa04024.pathview.png

Info: Downloading xml files for hsa04540, 1/1 pathways..

Info: Downloading png files for hsa04540, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/LieberInstituteBrainSeqPhase3CaudateSchizophrenia/analysis/differential_expression/kegg_pathways/_m

Info: Writing image file hsa04540.pathview.png



In [8]:
## Circadian
# Circadian pathways, rendered in this order: hsa04713, then hsa04710.
circadian_ids <- c("hsa04713", "hsa04710")
for (pathway_id in circadian_ids) {
    run_pathview(pathway_id)
}

Info: Downloading xml files for hsa04713, 1/1 pathways..

Info: Downloading png files for hsa04713, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/LieberInstituteBrainSeqPhase3CaudateSchizophrenia/analysis/differential_expression/kegg_pathways/_m

Info: Writing image file hsa04713.pathview.png

Info: Downloading xml files for hsa04710, 1/1 pathways..

Info: Downloading png files for hsa04710, 1/1 pathways..

'select()' returned 1:1 mapping between keys and columns

Info: Working in directory /ceph/users/jbenja13/github_projects/LieberInstituteBrainSeqPhase3CaudateSchizophrenia/analysis/differential_expression/kegg_pathways/_m

Info: Writing image file hsa04710.pathview.png



## Session Info

In [9]:
# Reproducibility footer: each bare expression below is auto-printed by the
# notebook, so statement order determines the order of the output.
# Timestamp of when this cell ran.
Sys.time()
# Cumulative user / system / elapsed time of the R process so far.
proc.time()
# Set the output width to 120 columns before printing the session tables.
options(width=120)
# R version, platform settings and versions of the packages in use.
sessioninfo::session_info()

[1] "2021-08-05 11:04:08 EDT"

   user  system elapsed 
 33.130   2.285  52.010 

─ Session info ───────────────────────────────────────────────────────────────────────────────────────────────────────
 setting  value                       
 version  R version 4.0.3 (2020-10-10)
 os       Arch Linux                  
 system   x86_64, linux-gnu           
 ui       X11                         
 language (EN)                        
 collate  en_US.UTF-8                 
 ctype    en_US.UTF-8                 
 tz       America/New_York            
 date     2021-08-05                  

─ Packages ───────────────────────────────────────────────────────────────────────────────────────────────────────────
 package       * version  date       lib source        
 AnnotationDbi   1.52.0   2020-10-27 [1] Bioconductor  
 assertthat      0.2.1    2019-03-21 [1] CRAN (R 4.0.2)
 base64enc       0.1-3    2015-07-28 [1] CRAN (R 4.0.2)
 Biobase         2.50.0   2020-10-27 [1] Bioconductor  
 BiocGenerics    0.36.1   2021-04-16 [1] Bioconductor  
 Biostrings      2.58.0   2020-10-2