In [None]:
library(ggplot2)
library(rtracklayer)
library(dplyr)
library(tidyr)
library(data.table)
library(matrixStats)
library(igraph)
library(purrr)
library(stringr)
library(VennDiagram)
library(TIN)
library(disgenet2r)

## Here, I investigate the enrichment of different gene sets (genes, and the parent genes of transcripts, trx) in DisGeNET
### The gene-disease association file was downloaded manually from DisGeNET after selecting those diseases among the PDs that are present in our CIDI data from OPTIMA and BeCOME

In [None]:
# Load the curated DisGeNET gene-disease association (GDA) summary table.
# NOTE(review): the file is a .tsv but is parsed with read.table()'s default
# whitespace separator -- confirm that fields containing spaces are quoted.
results_disGeNet_selected_diseases <- read.table(
  file = "/grehawi/splice-reg-prj/new-data/DISEASES_Summary_GDA_CURATED_selected_updated.tsv",
  header = TRUE
)
# Sanity check: first rows and the (rows, columns) dimensions of the table.
head(results_disGeNet_selected_diseases)
dim(results_disGeNet_selected_diseases)

In [None]:
# List the distinct diseases selected from DisGeNET (values of the Disease column)
unique(results_disGeNet_selected_diseases$Disease)

### Common hubs (degree >= 10)

In [None]:
# Hubs with degree >= 10 in both networks (a list of 127 nodes). The genes /
# parent genes of transcripts in this set are checked against DisGeNET below.
hubs_intersect_dg10 <- read.table(
  file = "/grehawi/splice-reg-prj/new-data/ARACNE/hubs_intersect.csv",
  header = TRUE,
  sep = ";"
)
hubs_intersect_dg10

In [None]:
# Gene-level input only: keep the DisGeNET associations whose gene appears in
# the hubs_intersect column of the common-hub table and whose GDA score
# is > 0.4.
# which() drops rows where the condition evaluates to NA (e.g. a missing
# ScoreGDA); plain logical indexing would return those as all-NA rows.
enrichm_of_hubs_intersect <- results_disGeNet_selected_diseases[
  which(
    results_disGeNet_selected_diseases$Gene %in% hubs_intersect_dg10$hubs_intersect &
      results_disGeNet_selected_diseases$ScoreGDA > 0.4
  ),
]
# Preview the matches and report how many associations were retained.
head(enrichm_of_hubs_intersect)
dim(enrichm_of_hubs_intersect)

In [None]:
# Hubs in this intersect set that are associated with PDs, followed by their
# count (the listing alone does not give the number directly).
unique(enrichm_of_hubs_intersect$Gene)
length(unique(enrichm_of_hubs_intersect$Gene))
# PDs that these genes are found to be associated with, followed by their count.
unique(enrichm_of_hubs_intersect$Disease)
length(unique(enrichm_of_hubs_intersect$Disease))

In [None]:
# Show the retained associations for the two hub genes KCTD12 and TNFRSF1B.
enrichm_of_hubs_intersect[
  enrichm_of_hubs_intersect$Gene %in% c("KCTD12", "TNFRSF1B"),
]

In [None]:
# Gene-level and trx-level input: keep the DisGeNET associations whose gene
# appears in the gene column of the common-hub table and whose GDA score
# is > 0.4.
# which() drops rows where the condition evaluates to NA (e.g. a missing
# ScoreGDA); plain logical indexing would return those as all-NA rows.
enrichm_of_hubs_intersect_with_trx <- results_disGeNet_selected_diseases[
  which(
    results_disGeNet_selected_diseases$Gene %in% hubs_intersect_dg10$gene &
      results_disGeNet_selected_diseases$ScoreGDA > 0.4
  ),
]
# Preview the matches and report how many associations were retained.
head(enrichm_of_hubs_intersect_with_trx)
dim(enrichm_of_hubs_intersect_with_trx)

In [None]:
# Hubs in this intersect set (gene- and trx-level) that are associated with
# PDs, followed by their count.
unique(enrichm_of_hubs_intersect_with_trx$Gene)
length(unique(enrichm_of_hubs_intersect_with_trx$Gene))
# PDs that these genes are found to be associated with, followed by their count.
unique(enrichm_of_hubs_intersect_with_trx$Disease)
length(unique(enrichm_of_hubs_intersect_with_trx$Disease))

### Differential genes and transcripts

In [None]:
# Load the sets of dysregulated genes and transcripts (trx) in PDs; their
# gene names are checked against the DisGeNET associations further down.
# Up- and down-regulated genes:
genes_up_df <- read.table(
  file = "/grehawi/splice-reg-prj/new-data/Diff-Analysis/genes_up_df.txt",
  header = TRUE
)
genes_down_df <- read.table(
  file = "/grehawi/splice-reg-prj/new-data/Diff-Analysis/genes_down_df.txt",
  header = TRUE
)
# Up- and down-regulated transcripts:
trx_up_df <- read.table(
  file = "/grehawi/splice-reg-prj/new-data/Diff-Analysis/trx_up_df.txt",
  header = TRUE
)
trx_down_df <- read.table(
  file = "/grehawi/splice-reg-prj/new-data/Diff-Analysis/trx_down_df.txt",
  header = TRUE
)

In [None]:
# Pool the gene_name column of all four differential tables (genes and trx,
# up and down) and drop duplicates.
all_dysreg_genes_trx <- unique(
  c(
    genes_up_df$gene_name,
    genes_down_df$gene_name,
    trx_up_df$gene_name,
    trx_down_df$gene_name
  )
)
# Number of distinct gene names across the four sets.
length(all_dysreg_genes_trx)

In [None]:
# Keep the DisGeNET associations whose gene is among the dysregulated
# genes / parent genes of dysregulated trx and whose GDA score is > 0.4.
# which() drops rows where the condition evaluates to NA (e.g. a missing
# ScoreGDA); plain logical indexing would return those as all-NA rows.
enrichm_of_all_dysreg_genes_trx <- results_disGeNet_selected_diseases[
  which(
    results_disGeNet_selected_diseases$Gene %in% all_dysreg_genes_trx &
      results_disGeNet_selected_diseases$ScoreGDA > 0.4
  ),
]
# Show the full result table and its dimensions.
enrichm_of_all_dysreg_genes_trx
dim(enrichm_of_all_dysreg_genes_trx)

In [None]:
# Dysregulated genes that are associated with PDs, followed by their count.
unique(enrichm_of_all_dysreg_genes_trx$Gene)
length(unique(enrichm_of_all_dysreg_genes_trx$Gene))
# PDs that these genes are found to be associated with, followed by their count.
unique(enrichm_of_all_dysreg_genes_trx$Disease)
length(unique(enrichm_of_all_dysreg_genes_trx$Disease))

In [None]:
# Count the distinct dysregulated genes whose retained association is with
# one of the depression-related disease labels listed below.
length(
  unique(
    enrichm_of_all_dysreg_genes_trx$Gene[
      enrichm_of_all_dysreg_genes_trx$Disease %in% c(
        "MAJOR DEPRESSIVE DISORDER",
        "Depressions,Unipolar",
        "Major depressive disorder,recurrent episode,unspecified degree",
        "Major depressive disorder,single episode,unspecified degree",
        "Depression"
      )
    ]
  )
)

In [None]:
# Export the retained associations of the dysregulated genes/trx as a
# comma-separated supplementary table, without row names.
write.table(
  x = enrichm_of_all_dysreg_genes_trx,
  file = "/grehawi/splice-reg-prj/new-data/Diff-Analysis/supp_table_DisGeNet_intersection_dysreg_genes_trx.txt",
  sep = ",",
  row.names = FALSE
)