In [1]:
library(tidyverse)

# Custom package
library(rutils)

-- Attaching packages ------------------------------------------------------------------ tidyverse 1.3.0 --

v ggplot2 3.3.3     v purrr   0.3.4
v tibble  3.0.6     v dplyr   1.0.4
v tidyr   1.1.2     v stringr 1.4.0
v readr   1.4.0     v forcats 0.5.1

-- Conflicts --------------------------------------------------------------------- tidyverse_conflicts() --
x dplyr::filter() masks stats::filter()
x dplyr::lag()    masks stats::lag()



In [2]:
# Resolve the project directory layout. This notebook reads `dirs$data_dir`
# and `dirs$analysis_dir` from the result.
dirs <- rutils::get_dev_directories(dev_paths_file = "../dev_paths.txt")

# Project codes and the unified dataset names used to build file names below.
projects <- c("CESC", "UCS", "UCEC")
unified_dsets <- c(
    "unified_cervical_data",
    "unified_uterine_data",
    "unified_uterine_endometrial_data"
)

# Path of the matrisome master list (TSV) under the data directory.
matrisome_path <- paste0(
    dirs$data_dir,
    "/matrisome/matrisome_hs_masterlist.tsv"
)

In [3]:
# Input file paths, one per entry of `unified_dsets`, for each kind of gene
# list. paste0() is vectorised over `unified_dsets`, so every result has one
# path per dataset, in dataset order.
demg_files <- paste0(
    dirs$analysis_dir, "/gene_lists/", unified_dsets, "_demg_list.txt"
)
figo_umsmg_files <- paste0(
    dirs$analysis_dir, "/gene_lists/", unified_dsets, "_figo_umsmg_list.txt"
)
figo_nsmg_files <- paste0(
    dirs$analysis_dir, "/gene_lists/", unified_dsets, "_figo_nsmg_list.txt"
)
survival_files <- paste0(
    dirs$analysis_dir, "/gene_lists/", unified_dsets, "_survival_umsmg_list.txt"
)

In [4]:
# Toggle: the `if (save_results)` block later in the notebook only writes the
# derived gene lists to disk when this is TRUE.
save_results <- TRUE

In [5]:
# Read every per-dataset gene-list file (one entry per line) into a list named
# by dataset. Mapping over the file vectors, rather than indexing with a
# hard-coded 1:3, keeps the lists in step with `unified_dsets` if datasets are
# added or removed, and avoids growing the lists inside a loop.
demg_lists <- setNames(lapply(demg_files, read_lines), unified_dsets)
figo_umsmg_lists <- setNames(
    lapply(figo_umsmg_files, read_lines),
    unified_dsets
)
figo_nsmg_lists <- setNames(
    lapply(figo_nsmg_files, read_lines),
    unified_dsets
)
survival_lists <- setNames(lapply(survival_files, read_lines), unified_dsets)

# Matrisome master list. `load_matrisome_df()` is not defined in this
# notebook (presumably it comes from rutils -- confirm).
matrisome_df <- load_matrisome_df(matrisome_path)


-- Column specification -----------------------------------------------------------------------------------
cols(
  Division = col_character(),
  Category = col_character(),
  `Gene Symbol` = col_character(),
  `Gene Name` = col_character(),
  Synonyms = col_character(),
  HGNC_IDs = col_double(),
  `HGNC_IDs Links` = col_double(),
  UniProt_IDs = col_character(),
  Refseq_IDs = col_character(),
  Orthology = col_character(),
  Notes = col_character()
)




In [6]:
# Toy named lists for checking how two lists are combined element by element.
# The `b` entries deliberately differ in length between the two lists.
l1 <- list(
    a = c(1, 2, 3),
    b = c(10, 11, 12)
)
l2 <- list(
    a = c(3, 4, 5),
    b = c(12, 13, 14, 15)
)

In [7]:
# Element-wise union of the two toy lists; the result keeps the names of `l1`.
# Map() is mapply() with SIMPLIFY = FALSE, so the result is always a list.
Map(union, l1, l2)

In [8]:
# Per dataset: genes found in either FIGO list (umsmg or nsmg) that are also
# in that dataset's DEMG list. Lists are paired by position.
#
# Map() is used instead of mapply(): with its default SIMPLIFY = TRUE,
# mapply() collapses the result to a matrix or vector whenever every dataset
# happens to yield the same number of genes. That would break both the nested
# call here and the later list-based steps (Reduce, combn, `$` lookups).
figo_sig_lists <- Map(
    intersect,
    Map(union, figo_umsmg_lists, figo_nsmg_lists),
    demg_lists
)
map(figo_sig_lists, length)

In [9]:
# Per dataset: genes in the survival list that are also in the DEMG list.
# Lists are paired by position.
#
# Map() always returns a list. mapply() with its default SIMPLIFY = TRUE
# would return a matrix or vector if every dataset produced the same number
# of genes, which breaks the list-based steps that follow.
survival_sig_lists <- Map(intersect, survival_lists, demg_lists)
map(survival_sig_lists, length)

In [10]:
# Per dataset: genes present in both the FIGO and the survival significant
# lists. Lists are paired by position.
#
# Map() always returns a list. mapply() with its default SIMPLIFY = TRUE
# would return a matrix or vector if every dataset produced the same number
# of genes, which breaks the `$` lookups used when saving.
figo_survival_sig_lists <- Map(intersect, figo_sig_lists, survival_sig_lists)
map(figo_survival_sig_lists, length)

In [11]:
# Genes shared by the DEMG lists of every dataset (running intersection).
demg_all_list <- demg_lists %>%
    Reduce(f = intersect)
length(demg_all_list)

In [12]:
# Genes shared by the FIGO significant lists of every dataset.
figo_all_sig_list <- figo_sig_lists %>%
    Reduce(f = intersect)
length(figo_all_sig_list)

In [13]:
# Genes shared by the survival significant lists of every dataset.
survival_all_sig_list <- survival_sig_lists %>%
    Reduce(f = intersect)
length(survival_all_sig_list)

In [14]:
# Intersect the DEMG lists for every pair of datasets. combn() enumerates the
# pairs of `demg_lists` in the order (1, 2), (1, 3), (2, 3), and the names
# below are assigned in that same order.
demg_all_pairs_list <- combn(
    demg_lists,
    2,
    FUN = function(pair) intersect(pair[[1]], pair[[2]]),
    simplify = FALSE
)
names(demg_all_pairs_list) <- c("cesc_ucs", "cesc_ucec", "ucec_ucs")

map(demg_all_pairs_list, length)

In [15]:
# Intersect the FIGO significant lists for every pair of datasets. combn()
# enumerates the pairs of `figo_sig_lists` in the order (1, 2), (1, 3),
# (2, 3), and the names below are assigned in that same order.
figo_all_pairs <- combn(
    figo_sig_lists,
    2,
    FUN = function(pair) intersect(pair[[1]], pair[[2]]),
    simplify = FALSE
)
names(figo_all_pairs) <- c("cesc_ucs", "cesc_ucec", "ucec_ucs")

map(figo_all_pairs, length)

In [16]:
# Intersect the survival significant lists for every pair of datasets.
# combn() enumerates the pairs of `survival_sig_lists` in the order (1, 2),
# (1, 3), (2, 3), and the names below are assigned in that same order.
survival_all_pairs <- combn(
    survival_sig_lists,
    2,
    FUN = function(pair) intersect(pair[[1]], pair[[2]]),
    simplify = FALSE
)
names(survival_all_pairs) <- c("cesc_ucs", "cesc_ucec", "ucec_ucs")

map(survival_all_pairs, length)

In [17]:
# Write every derived gene list to <analysis_dir>/gene_lists_extra/<stem>.txt,
# one gene per line. Skipped entirely unless `save_results` is TRUE.
if (save_results) {
    # Create the output directory on first run so the writes do not fail on a
    # missing directory.
    out_dir <- paste0(dirs$analysis_dir, "/gene_lists_extra")
    dir.create(out_dir, showWarnings = FALSE, recursive = TRUE)

    # Output file stem -> gene list. `[[` is used instead of `$` so a lookup
    # can never partially match a different element name.
    gene_lists_out <- list(
        # FIGO sig
        cesc_figo_demg = figo_sig_lists[["unified_cervical_data"]],
        ucs_figo_demg = figo_sig_lists[["unified_uterine_data"]],
        ucec_figo_demg = figo_sig_lists[["unified_uterine_endometrial_data"]],

        # Survival sig
        cesc_survival_demg = survival_sig_lists[["unified_cervical_data"]],
        ucs_survival_demg = survival_sig_lists[["unified_uterine_data"]],
        ucec_survival_demg = survival_sig_lists[["unified_uterine_endometrial_data"]],

        # FIGO and survival sig
        cesc_figo_survival_demg = figo_survival_sig_lists[["unified_cervical_data"]],
        ucs_figo_survival_demg = figo_survival_sig_lists[["unified_uterine_data"]],
        ucec_figo_survival_demg = figo_survival_sig_lists[["unified_uterine_endometrial_data"]],

        # DEMG (all)
        all_demg = demg_all_list,

        # FIGO (all)
        all_figo_demg = figo_all_sig_list,

        # NOTE(review): `survival_all_sig_list` is computed earlier but never
        # written here -- confirm whether an all-dataset survival file is
        # wanted.

        # DEMG pairs. The third pair is named "ucec_ucs"; the previous
        # `$ucs_ucec` lookup matched nothing and yielded NULL.
        cesc_ucs_demg = demg_all_pairs_list[["cesc_ucs"]],
        cesc_ucec_demg = demg_all_pairs_list[["cesc_ucec"]],
        ucec_ucs_demg = demg_all_pairs_list[["ucec_ucs"]],

        # FIGO pairs
        cesc_ucs_figo_demg = figo_all_pairs[["cesc_ucs"]],
        cesc_ucec_figo_demg = figo_all_pairs[["cesc_ucec"]],
        ucec_ucs_figo_demg = figo_all_pairs[["ucec_ucs"]],

        # Survival pairs
        cesc_ucs_survival_demg = survival_all_pairs[["cesc_ucs"]],
        cesc_ucec_survival_demg = survival_all_pairs[["cesc_ucec"]],
        ucec_ucs_survival_demg = survival_all_pairs[["ucec_ucs"]]
    )

    # A NULL entry means one of the lookups above did not match any element.
    # Stop instead of silently writing a wrong or empty file. (An empty
    # character vector is a valid result and is still written.)
    is_missing <- vapply(gene_lists_out, is.null, logical(1))
    if (any(is_missing)) {
        stop(
            "No gene list found for: ",
            paste(names(gene_lists_out)[is_missing], collapse = ", "),
            call. = FALSE
        )
    }

    for (stem in names(gene_lists_out)) {
        write_lines(
            gene_lists_out[[stem]],
            paste0(out_dir, "/", stem, ".txt")
        )
    }
}