In [None]:
source(paste0(dirname(getwd()),'/map.r'))
source(paste0(HELP_DIR, "shortcuts.r"))
library( readxl )

In [None]:
# Names of the entries found in ISOFOX_DIR
# (presumably one entry per patient -- confirm against the directory layout).
patients <- list.files(path = ISOFOX_DIR)

#### 0 - Collect and process adjusted TPMs from files

In [None]:
# Read the table stored as "isofox_adj_tmp.csv" under TMP_DIR.
iso <- paste0(TMP_DIR, "isofox_adj_tmp.csv") %>% fread()

In [None]:
# Reshape to one row per former column of `iso` and one column per gene,
# then apply log(x + 1).
# NOTE: data.frame() uses check.names = TRUE by default, so gene names that
# are not syntactically valid R names are altered (e.g. "-" becomes ".").
iso_base <- iso %>%
  select(-GeneId) %>%
  column_to_rownames("GeneName") %>%
  t() %>%
  data.frame() %>%
  {
    log(. + 1)
  }

- Select genes based on prior knowledge

In [None]:
# MRP gene panel: ABCC1-ABCC6 and ABCC10-ABCC12.
mrp_genes <- paste0("ABCC", c(1:6, 10:12))

# Additional individually selected marker genes.
more_markers <- c(
  "ESR1", "ERBB2", "CD274", "MGMT", "BRCA1",
  "BRCA2", "EGFR", "ALK", "BCL2", "AR",
  "TOP2A", "TYMS", "ERCC1", "MET", "KRAS"
)

# Full marker panel: MRP genes first, then the additional markers.
marker_genes <- c(mrp_genes, more_markers)

In [None]:
# Keep only the marker-gene columns that are present in iso_base and move the
# row names into a "sampleId" column.
# NOTE(review): `se` is not defined in this file; presumably a shorthand for
# dplyr::select() provided by shortcuts.r -- confirm.
biomarker_genes <-
iso_base %>% 
 se(any_of(marker_genes)) %>% 
 rownames_to_column("sampleId")

In [None]:
# Prefix every column after the first with "rna_marker_"; the first column is
# (re)named "sampleId".
biomarker_genes <- setNames(
  biomarker_genes,
  c("sampleId", paste0("rna_marker_", names(biomarker_genes)[-1]))
)

In [None]:
# Write the marker-gene table to READY_DIR.
fwrite(
  x = biomarker_genes,
  file = paste0(READY_DIR, "biomarker_genes_ready.csv")
)

#### 1 - Add in Gene Sets

In [None]:
# Load the stored gene-set collection from REF_DIR.
gene_sets <- readRDS(file = paste0(REF_DIR, "gene_sets.Rds"))

- Add MP sets

In [None]:
# Names passed as `sheet` when reading the MP workbook, one per cell type.
cell_types <- c(
  "B_cells", "Endothelial", "Epithelial", "Fibroblasts",
  "Macrophages", "CD4", "CD8", "Malignant"
)

In [None]:
# Read one sheet per cell type from the MP workbook and add every column of
# every sheet to `gene_sets` as a set named "mp_<cell type>_<column name>".
# (MP presumably stands for the "meta-programs" of the source publication --
# confirm.)
mp_workbook <- paste0(REF_DIR, "/41586_2023_6130_MOESM14_ESM.xlsx")

# `mps` keeps the sets grouped by cell type (previously it was created but
# never filled).
mps <- lapply(setNames(cell_types, cell_types), function(cell_type) {
  sheet <- read_excel(mp_workbook, sheet = cell_type)
  names(sheet) <- paste0("mp_", cell_type, "_", names(sheet))
  as.list(sheet)
})

# Flatten to a single named list, in the same order the sheets were read.
mp_sets <- unlist(unname(mps), recursive = FALSE)

# Assign by name instead of appending with c(): a first run adds the sets at
# the end exactly as before, while re-running this cell overwrites them
# instead of piling up duplicate entries.
gene_sets[names(mp_sets)] <- mp_sets

saveRDS(gene_sets, paste0(REF_DIR, 'gene_sets_full.Rds'))

In [None]:
#' Mean expression of one gene set per sample.
#'
#' @param i Name of the gene set to score (a single string indexing `sets`).
#' @param df Data frame with one row per sample (sample ids as row names) and
#'   one numeric column per gene.
#' @param sets Named list of character vectors of gene names. Defaults to the
#'   global `gene_sets`, which is what the original implementation read.
#' @return A data frame with a character column `sampleId` and one numeric
#'   column named `i` holding the row-wise mean over the set's genes that are
#'   present in `df`. The column is `NaN` when none of the genes are present.
computer <- function(i, df, sets = gene_sets) {
  genes <- as.character(sets[[i]])
  genes <- genes[!is.na(genes)]

  # Expression frames built with data.frame() have their column names passed
  # through make.names() (e.g. "HLA-A" -> "HLA.A"), so match both spellings;
  # otherwise such genes are silently left out of the mean.
  present <- intersect(union(genes, make.names(genes)), colnames(df))

  # rowMeans() on the selected columns replaces apply(..., 1, mean).
  scores <- rowMeans(as.matrix(as.data.frame(df)[present]))

  out <- data.frame(sampleId = rownames(df), stringsAsFactors = FALSE)
  out[[i]] <- unname(scores)
  out
}

In [None]:
# Score every gene set against iso_base, keyed by set name, and report how
# long the whole pass takes.
system.time(
  computed_sets <- lapply(
    setNames(nm = unique(names(gene_sets))),
    computer,
    df = iso_base
  )
)

In [None]:
# Combine the per-set score tables into one wide table by joining
# successively on "sampleId".
gene_sets_base <- reduce(computed_sets, inner_join, by = "sampleId")

#### 2 - Send the files

- Isofox gene expression

In [None]:
# Prefix every gene column with "rna_" and move the row names into a
# "sampleId" column.
isofox_ready <- iso_base %>%
  setNames(paste0("rna_", colnames(iso_base))) %>%
  rownames_to_column("sampleId")

In [None]:
# Write the per-gene expression table to READY_DIR.
fwrite(
  x = isofox_ready,
  file = paste0(READY_DIR, "isofox_genes_ready.csv")
)

- Add gene sets

In [None]:
# Copy the gene-set score table, prefixing every column after the first with
# "rna_geneset_"; the first column is (re)named "sampleId".
gene_sets_ready <- setNames(
  gene_sets_base,
  c("sampleId", paste0("rna_geneset_", names(gene_sets_base)[-1]))
)

In [None]:
# Write the gene-set score table to READY_DIR.
fwrite(
  x = gene_sets_ready,
  file = paste0(READY_DIR, "isofox_genesets_ready.csv")
)