In [1]:
library(tidyverse)

# Custom package
library(rutils)

-- [1mAttaching packages[22m ------------------------------------------------------------------------------- tidyverse 1.3.0 --

[32mv[39m [34mggplot2[39m 3.3.3     [32mv[39m [34mpurrr  [39m 0.3.4
[32mv[39m [34mtibble [39m 3.0.6     [32mv[39m [34mdplyr  [39m 1.0.4
[32mv[39m [34mtidyr  [39m 1.1.2     [32mv[39m [34mstringr[39m 1.4.0
[32mv[39m [34mreadr  [39m 1.4.0     [32mv[39m [34mforcats[39m 0.5.1

-- [1mConflicts[22m ---------------------------------------------------------------------------------- tidyverse_conflicts() --
[31mx[39m [34mdplyr[39m::[32mfilter()[39m masks [34mstats[39m::filter()
[31mx[39m [34mdplyr[39m::[32mlag()[39m    masks [34mstats[39m::lag()



In [2]:
# Names of the unified datasets; one of them is picked by index further down.
unified_dsets <- c(
    "unified_cervical_data",
    "unified_uterine_data",
    "unified_uterine_endometrial_data"
)

# Project directory lookup from the custom rutils package. The result is
# accessed below as dirs$data_dir and dirs$analysis_dir.
dirs <- rutils::get_dev_directories(dev_paths_file = "../dev_paths.txt")

In [3]:
# Position in unified_dsets of the dataset to analyse
# (2 selects "unified_uterine_data").
dset_idx <- 2
# Save flag; not read by any of the cells visible here -- presumably consumed
# by a later cell that writes results (TODO confirm).
save_res <- TRUE

In [4]:
# HUGO symbol <-> Entrez ID lookup for the selected dataset. Columns are
# renamed to the join keys used later (geneID, entrez) and the Entrez ID is
# converted to character.
gene2id_df <- paste0(dirs$data_dir, "/", unified_dsets[dset_idx], "/hugo2entrez.tsv") %>%
    read_tsv() %>%
    rename(geneID = hugo_symbol, entrez = entrez_gene_id) %>%
    mutate(entrez = as.character(entrez))

# DESeq results table for the same dataset.
dge_res_df <- paste0(dirs$analysis_dir, "/deg/", unified_dsets[dset_idx], "_DESeq_results.tsv") %>%
    read_tsv()


[36m--[39m [1m[1mColumn specification[1m[22m [36m------------------------------------------------------------------------------------------------[39m
cols(
  hugo_symbol = [31mcol_character()[39m,
  entrez_gene_id = [32mcol_double()[39m
)



[36m--[39m [1m[1mColumn specification[1m[22m [36m------------------------------------------------------------------------------------------------[39m
cols(
  geneID = [31mcol_character()[39m,
  baseMean = [32mcol_double()[39m,
  log2FoldChange = [32mcol_double()[39m,
  lfcSE = [32mcol_double()[39m,
  stat = [32mcol_double()[39m,
  pvalue = [32mcol_double()[39m,
  padj = [32mcol_double()[39m,
  qval = [32mcol_double()[39m
)




In [5]:
# Directory holding the KEGG enrichment files; the `set` label and the
# selected dataset name are both embedded in the directory name.
set <- "figo"
ea_dir <- paste0(dirs$analysis_dir, "/enrichment/", unified_dsets[dset_idx], "_", set, "_kegg")

# List the directory once with full paths, then derive the bare file names
# from those paths so the two vectors line up element by element.
ea_files_long <- list.files(ea_dir, full.names = TRUE)
ea_files_short <- basename(ea_files_long)

In [6]:
# Read every enrichment file into a named list of tibbles, one per pathway.
# Each list element is keyed by the file name without its ".tsv" extension
# and holds the Entrez IDs (as character) tagged with that pathway name.
#
# Earlier one-liner, kept for reference (it does not tag rows with the pathway):
# ea_dfs <- list.files(ea_dir, full.names = TRUE) %>% purrr::map(read_tsv)
ea_dfs <- list()
for (i in seq_along(ea_files_short)) {
    # The pattern is a regex: escape the dot and anchor at the end so only a
    # literal trailing ".tsv" is stripped. An unescaped ".tsv" would match any
    # character followed by "tsv" at the first place it occurs in the name.
    pwy <- str_replace(ea_files_short[i], "\\.tsv$", "")
    # Files have no header row, so readr names the columns X1, X2, ...
    # X1 carries the Entrez ID; X2 (a colour annotation) is not needed.
    ea_dfs[[pwy]] <- read_tsv(ea_files_long[i], col_names = FALSE) %>%
        rename(entrez = X1) %>%
        select(-X2) %>%
        mutate(entrez = as.character(entrez), pathway = pwy)
}


[36m--[39m [1m[1mColumn specification[1m[22m [36m------------------------------------------------------------------------------------------------[39m
cols(
  X1 = [32mcol_double()[39m,
  X2 = [31mcol_character()[39m
)



[36m--[39m [1m[1mColumn specification[1m[22m [36m------------------------------------------------------------------------------------------------[39m
cols(
  X1 = [32mcol_double()[39m,
  X2 = [31mcol_character()[39m
)



[36m--[39m [1m[1mColumn specification[1m[22m [36m------------------------------------------------------------------------------------------------[39m
cols(
  X1 = [32mcol_double()[39m,
  X2 = [31mcol_character()[39m
)



[36m--[39m [1m[1mColumn specification[1m[22m [36m------------------------------------------------------------------------------------------------[39m
cols(
  X1 = [32mcol_double()[39m,
  X2 = [31mcol_character()[39m
)



[36m--[39m [1m[1mColumn specification[1m[22m [36m-----------

# Look at breakdowns

In [9]:
# Genes of the MAPK signaling pathway that appear in both the symbol lookup
# and the DE results, labelled by the sign of their log2 fold change.
ea_dfs %>%
    bind_rows() %>%
    # Narrow to the pathway of interest before joining; the inner joins keep
    # row order, so the result matches filtering after the joins.
    filter(pathway == "mapk_signaling_pathway") %>%
    inner_join(gene2id_df, by = "entrez") %>%
    inner_join(dge_res_df, by = "geneID") %>%
    # Positive fold change -> "UP"; zero or negative -> "DOWN".
    mutate(de_dir = ifelse(log2FoldChange > 0, "UP", "DOWN")) %>%
    select(geneID, entrez, pathway, de_dir) %>%
    arrange(de_dir, geneID)

geneID,entrez,pathway,de_dir
<chr>,<chr>,<chr>,<chr>
FGF10,2255,mapk_signaling_pathway,DOWN
FGF16,8823,mapk_signaling_pathway,DOWN
FGF7,2252,mapk_signaling_pathway,DOWN
KITLG,4254,mapk_signaling_pathway,DOWN
FGF19,9965,mapk_signaling_pathway,UP
FGF5,2250,mapk_signaling_pathway,UP
FGF8,2253,mapk_signaling_pathway,UP
IL1A,3552,mapk_signaling_pathway,UP
PGF,5228,mapk_signaling_pathway,UP
TGFB2,7042,mapk_signaling_pathway,UP
