In [1]:
library(tidyverse)

# Custom package
library(rutils)

-- [1mAttaching packages[22m --------------------------------------------------------------------------------------------------------- tidyverse 1.3.0 --

[32mv[39m [34mggplot2[39m 3.3.3     [32mv[39m [34mpurrr  [39m 0.3.4
[32mv[39m [34mtibble [39m 3.0.6     [32mv[39m [34mdplyr  [39m 1.0.4
[32mv[39m [34mtidyr  [39m 1.1.2     [32mv[39m [34mstringr[39m 1.4.0
[32mv[39m [34mreadr  [39m 1.4.0     [32mv[39m [34mforcats[39m 0.5.1

-- [1mConflicts[22m ------------------------------------------------------------------------------------------------------------ tidyverse_conflicts() --
[31mx[39m [34mdplyr[39m::[32mfilter()[39m masks [34mstats[39m::filter()
[31mx[39m [34mdplyr[39m::[32mlag()[39m    masks [34mstats[39m::lag()



In [2]:
# Names of the unified datasets this notebook can be pointed at.
unified_dsets <- c(
    "unified_cervical_data",
    "unified_uterine_data",
    "unified_uterine_endometrial_data"
)

# Project directory listing, resolved from the dev paths file one level up.
# NOTE(review): the fields of the returned object are defined by rutils;
# this notebook only reads `analysis_dir` from it.
dirs <- rutils::get_dev_directories(
    dev_paths_file = "../dev_paths.txt"
)

In [3]:
# Position in `unified_dsets` of the dataset analyzed by this run; it is used
# below to build the names of the result files that are read.
dset_idx <- 1

In [4]:
# Significance cutoffs for the univariate survival results:
# `p_thresh` is compared against the km_pval / cph_pval columns and
# `q_thresh` against the km_qval / cph_qval columns.
p_thresh <- 0.05
q_thresh <- 0.1

In [5]:
# Load the survival and network result tables for the selected dataset.
# Paths are assembled with file.path() rather than hand-written "/" separators;
# the resulting path strings are the same as before.

# Per-gene univariate survival results
# (geneID, km_pval, km_qval, cph_pval, cph_qval, coeff).
univ_surv_df <- read_tsv(
    file.path(
        dirs$analysis_dir, "survival",
        paste0(unified_dsets[dset_idx], "_univ_survival_results.tsv")
    )
)

# Genes reported in the EN Cox PH results (geneID, coeff).
en_cph_df <- read_tsv(
    file.path(
        dirs$analysis_dir, "survival",
        paste0(unified_dsets[dset_idx], "_en_cph_results.tsv")
    )
)

# Per-gene network table; carries at least geneID, module, mm_cor and mm_pval.
network_mm_gs_df <- read_tsv(
    file.path(
        dirs$analysis_dir, "network",
        paste0(unified_dsets[dset_idx], "_gene_mm_gs.tsv")
    )
)

# Eigengene/trait table; joined to the gene table on `module` further down.
network_me_sig_df <- read_tsv(
    file.path(
        dirs$analysis_dir, "network",
        paste0(unified_dsets[dset_idx], "_eigengene_traits.tsv")
    )
)


[36m--[39m [1m[1mColumn specification[1m[22m [36m--------------------------------------------------------------------------------------------------------------------------[39m
cols(
  geneID = [31mcol_character()[39m,
  km_pval = [32mcol_double()[39m,
  km_qval = [32mcol_double()[39m,
  cph_pval = [32mcol_double()[39m,
  cph_qval = [32mcol_double()[39m,
  coeff = [32mcol_double()[39m
)



[36m--[39m [1m[1mColumn specification[1m[22m [36m--------------------------------------------------------------------------------------------------------------------------[39m
cols(
  geneID = [31mcol_character()[39m,
  coeff = [32mcol_double()[39m
)



[36m--[39m [1m[1mColumn specification[1m[22m [36m--------------------------------------------------------------------------------------------------------------------------[39m
cols(
  .default = col_double(),
  geneID = [31mcol_character()[39m,
  module = [31mcol_character()[39m
)
[36mi[39m Use [30m[47m

# Univariate Survival

In [6]:
# Keep genes that clear both cutoffs: a p-value below `p_thresh` AND a q-value
# below `q_thresh`, where each may come from either the km_* or cph_* column.
# Multiple conditions passed to filter() are combined with AND.
sig_univ_df <- dplyr::filter(
    univ_surv_df,
    km_pval < p_thresh | cph_pval < p_thresh,
    km_qval < q_thresh | cph_qval < q_thresh
)
# sig_univ_df

# Cox PH EN

In [7]:
# en_cph_df

# Joined data

In [8]:
# Both tables below are built the same way: take the gene/module columns of
# the network table, keep the genes of interest, attach the eigengene/trait
# row of each gene's module, then pass the result through condense_figo().
# NOTE(review): condense_figo() is not defined in this notebook; it is
# presumably provided by rutils -- confirm.

# Genes significant in the univariate survival analysis.
univ_joined_df <- network_mm_gs_df %>%
    dplyr::select(geneID, module, mm_cor, mm_pval) %>%
    dplyr::filter(geneID %in% sig_univ_df$geneID) %>%
    inner_join(network_me_sig_df, by = "module") %>%
    condense_figo(include_pvals = TRUE)

# Genes listed in the EN Cox PH results.
en_joined_df <- network_mm_gs_df %>%
    dplyr::select(geneID, module, mm_cor, mm_pval) %>%
    dplyr::filter(geneID %in% en_cph_df$geneID) %>%
    inner_join(network_me_sig_df, by = "module") %>%
    condense_figo(include_pvals = TRUE)

In [9]:
# Number of distinct genes appearing in either joined table.
length(unique(c(univ_joined_df$geneID, en_joined_df$geneID)))

In [10]:
# univ_joined_df
# en_joined_df

In [11]:
# Row count of the eigengene/trait table (number of modules)
nrow(network_me_sig_df)

# Univariate genes: rows in the joined table, then distinct modules among them
nrow(univ_joined_df)
n_univ_mod <- dplyr::n_distinct(univ_joined_df$module)
n_univ_mod
# Proportion of rows that repeat a module
1 - n_univ_mod / nrow(univ_joined_df)

# EN model genes: rows in the joined table, then distinct modules among them
nrow(en_joined_df)
n_en_mod <- dplyr::n_distinct(en_joined_df$module)
n_en_mod
# Proportion of rows that repeat a module
1 - n_en_mod / nrow(en_joined_df)