In [17]:
setwd("/Users/rebecca/sudmant/analyses/myotis/analysis/exploratory/species_peaks")

library(GSA)
library(dplyr)
library(qvalue)
library(ggplot2)
library(data.table)

source("/Users/rebecca/sudmant/analyses/myotis/code/fisher_test.R")

shared_genes <- fread("results/data/shared_genes.csv", data.table = FALSE)

In [None]:
## Load in Broad gene sets:
gsc <- GSA.read.gmt("/Users/rebecca/sudmant/analyses/myotis/data/genesets/msigdb_v2023.2.Hs_GMTs/msigdb.v2023.2.Hs.symbols.gmt")
sets <- gsc$genesets
names(sets) <- gsc$geneset.names
sets <- sets[grep("^REACTOME|^GOBP", names(sets))]

## Shared peaks

In [19]:
shared_peaks <- fread("results/data/shared_promoters_shared_peaks.csv", data.table = FALSE)
shared_peak_enrichments <- sort(unlist(lapply(sets, fisher_test,
                                              mod = shared_peaks$Gene,
                                              all = shared_genes$Gene)))
shared_peak_enrich_df <- data.frame(Set = names(shared_peak_enrichments), 
                                    Pval = shared_peak_enrichments,
                                    row.names = NULL)
shared_peak_enrich_df$Qval <- qvalue(shared_peak_enrich_df$Pval)$qvalues
head(shared_peak_enrich_df, 15)

Unnamed: 0_level_0,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<dbl>,<dbl>
1,REACTOME_DNA_DAMAGE_TELOMERE_STRESS_INDUCED_SENESCENCE,0.000104751,0.9782699
2,REACTOME_COPI_MEDIATED_ANTEROGRADE_TRANSPORT,0.0003555364,1.0
3,REACTOME_COPI_DEPENDENT_GOLGI_TO_ER_RETROGRADE_TRAFFIC,0.000596044,1.0
4,REACTOME_RECOGNITION_AND_ASSOCIATION_OF_DNA_GLYCOSYLASE_WITH_SITE_CONTAINING_AN_AFFECTED_PURINE,0.0006966203,1.0
5,REACTOME_HATS_ACETYLATE_HISTONES,0.0009213978,1.0
6,REACTOME_BASE_EXCISION_REPAIR_AP_SITE_FORMATION,0.0011013265,1.0
7,REACTOME_GOLGI_TO_ER_RETROGRADE_TRANSPORT,0.0012272583,1.0
8,REACTOME_INHIBITION_OF_DNA_RECOMBINATION_AT_TELOMERE,0.0012560298,1.0
9,REACTOME_ER_TO_GOLGI_ANTEROGRADE_TRANSPORT,0.001656959,1.0
10,REACTOME_VIRAL_INFECTION_PATHWAYS,0.0018859275,1.0


In [11]:
shared_peaks$Gene

### No significant enrichments in shared peaks

## Semi-shared peaks

In [20]:
semi_shared_peaks <- fread("results/data/shared_promoters_semi_shared_peaks.csv", data.table = FALSE)

species <- unique(semi_shared_peaks$Species)
                                                                                 
missing_peak_enrichments <- lapply(species, function(spec){
  
  missing_peaks_spec <- semi_shared_peaks[semi_shared_peaks$Species %in% spec,]
  missing_peaks_enrich <- sort(unlist(lapply(sets, fisher_test,
                                             mod = missing_peaks_spec$Gene,
                                             all = shared_genes$Gene)))
  return(data.frame(Species = spec,
                    Set = names(missing_peaks_enrich), 
                    Pval = missing_peaks_enrich,
                    Qval = qvalue(missing_peaks_enrich)$qvalues,
                    row.names = NULL))
  
})
names(missing_peak_enrichments) <- species

In [14]:
tapply(semi_shared_peaks$Gene, semi_shared_peaks$Species, "[")

In [21]:
lapply(missing_peak_enrichments, head, 10)

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Lucifugus,GOBP_SINGLE_FERTILIZATION,0.0004596155,1
2,Myotis-Lucifugus,GOBP_FERTILIZATION,0.000666211,1
3,Myotis-Lucifugus,GOBP_POSITIVE_REGULATION_OF_MEMORY_T_CELL_DIFFERENTIATION,0.0019022251,1
4,Myotis-Lucifugus,REACTOME_DNA_METHYLATION,0.0026623547,1
5,Myotis-Lucifugus,REACTOME_FOLDING_OF_ACTIN_BY_CCT_TRIC,0.0026623547,1
6,Myotis-Lucifugus,GOBP_IMMUNOLOGICAL_MEMORY_FORMATION_PROCESS,0.0026623547,1
7,Myotis-Lucifugus,GOBP_NEGATIVE_REGULATION_OF_COMPLEMENT_ACTIVATION,0.0026623547,1
8,Myotis-Lucifugus,GOBP_NEGATIVE_REGULATION_OF_HUMORAL_IMMUNE_RESPONSE_MEDIATED_BY_CIRCULATING_IMMUNOGLOBULIN,0.0026623547,1
9,Myotis-Lucifugus,GOBP_POSITIVE_REGULATION_OF_ESTABLISHMENT_OF_PROTEIN_LOCALIZATION_TO_TELOMERE,0.0026623547,1
10,Myotis-Lucifugus,GOBP_REGULATION_OF_COMPLEMENT_ACTIVATION_CLASSICAL_PATHWAY,0.0026623547,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Californicus,GOBP_RESPONSE_TO_OXIDATIVE_STRESS,0.0001291264,1
2,Myotis-Californicus,GOBP_SYNCYTIUM_FORMATION,0.0009563998,1
3,Myotis-Californicus,GOBP_MAPK_CASCADE,0.001248395,1
4,Myotis-Californicus,GOBP_GRANULOCYTE_CHEMOTAXIS,0.002688056,1
5,Myotis-Californicus,GOBP_POSITIVE_REGULATION_OF_MAPK_CASCADE,0.003409799,1
6,Myotis-Californicus,REACTOME_APOBEC3G_MEDIATED_RESISTANCE_TO_HIV_1_INFECTION,0.0034223756,1
7,Myotis-Californicus,GOBP_COPI_COATED_VESICLE_BUDDING,0.0034223756,1
8,Myotis-Californicus,GOBP_REGULATION_OF_MACROPHAGE_FUSION,0.0034223756,1
9,Myotis-Californicus,GOBP_RESPONSE_TO_CALCIUM_ION,0.0035955633,1
10,Myotis-Californicus,GOBP_GRANULOCYTE_MIGRATION,0.0039564469,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Thysanodes,GOBP_POSITIVE_REGULATION_OF_SYNAPTIC_VESICLE_FUSION_TO_PRESYNAPTIC_ACTIVE_ZONE_MEMBRANE,0.001141715,1
2,Myotis-Thysanodes,GOBP_EPOXIDE_METABOLIC_PROCESS,0.001712166,1
3,Myotis-Thysanodes,GOBP_LIPOXIN_METABOLIC_PROCESS,0.001712166,1
4,Myotis-Thysanodes,GOBP_NEGATIVE_REGULATION_OF_PLATELET_AGGREGATION,0.001712166,1
5,Myotis-Thysanodes,REACTOME_SYNTHESIS_OF_12_EICOSATETRAENOIC_ACID_DERIVATIVES,0.002282344,1
6,Myotis-Thysanodes,REACTOME_SYNTHESIS_OF_LIPOXINS_LX,0.002282344,1
7,Myotis-Thysanodes,GOBP_GOLGI_DISASSEMBLY,0.002282344,1
8,Myotis-Thysanodes,GOBP_HEPOXILIN_METABOLIC_PROCESS,0.002282344,1
9,Myotis-Thysanodes,GOBP_POSITIVE_REGULATION_OF_VESICLE_FUSION,0.002282344,1
10,Myotis-Thysanodes,GOBP_REGULATION_OF_CHAPERONE_MEDIATED_AUTOPHAGY,0.002282344,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Occultus,GOBP_DNA_INTEGRATION,0.001521997,1
2,Myotis-Occultus,GOBP_REGULATION_OF_DNA_TOPOISOMERASE_ATP_HYDROLYZING_ACTIVITY,0.001521997,1
3,Myotis-Occultus,GOBP_CALCIUM_ION_EXPORT_ACROSS_PLASMA_MEMBRANE,0.002282344,1
4,Myotis-Occultus,GOBP_REGULATION_OF_ISOMERASE_ACTIVITY,0.002282344,1
5,Myotis-Occultus,GOBP_DNA_DOUBLE_STRAND_BREAK_PROCESSING,0.003801735,1
6,Myotis-Occultus,GOBP_POSITIVE_REGULATION_OF_DOUBLE_STRAND_BREAK_REPAIR_VIA_NONHOMOLOGOUS_END_JOINING,0.003801735,1
7,Myotis-Occultus,REACTOME_FORMATION_OF_ATP_BY_CHEMIOSMOTIC_COUPLING,0.004560779,1
8,Myotis-Occultus,GOBP_NUCLEIC_ACID_PHOSPHODIESTER_BOND_HYDROLYSIS,0.005698532,1
9,Myotis-Occultus,GOBP_REGULATION_OF_DOUBLE_STRAND_BREAK_REPAIR_VIA_NONHOMOLOGOUS_END_JOINING,0.006077567,1
10,Myotis-Occultus,REACTOME_CRISTAE_FORMATION,0.006456492,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Volans,GOBP_CELLULAR_KETONE_METABOLIC_PROCESS,0.002661514,1
2,Myotis-Volans,GOBP_REGULATION_OF_LONG_CHAIN_FATTY_ACID_IMPORT_INTO_CELL,0.002852251,1
3,Myotis-Volans,GOBP_REGULATION_OF_PHOSPHATIDYLCHOLINE_BIOSYNTHETIC_PROCESS,0.002852251,1
4,Myotis-Volans,GOBP_CYCLOOXYGENASE_PATHWAY,0.003421887,1
5,Myotis-Volans,REACTOME_AKT_PHOSPHORYLATES_TARGETS_IN_THE_CYTOSOL,0.003991252,1
6,Myotis-Volans,GOBP_POSITIVE_REGULATION_OF_PHOSPHOLIPID_BIOSYNTHETIC_PROCESS,0.003991252,1
7,Myotis-Volans,GOBP_REGULATION_OF_PHOSPHATIDYLCHOLINE_METABOLIC_PROCESS,0.003991252,1
8,Myotis-Volans,GOBP_VITAMIN_K_METABOLIC_PROCESS,0.003991252,1
9,Myotis-Volans,GOBP_POSITIVE_REGULATION_OF_PHOSPHOLIPID_METABOLIC_PROCESS,0.005129169,1
10,Myotis-Volans,REACTOME_SYNTHESIS_OF_PROSTAGLANDINS_PG_AND_THROMBOXANES_TX,0.00569772,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Auriculus,REACTOME_CELLULAR_RESPONSES_TO_STIMULI,0.001781509,1
2,Myotis-Auriculus,GOBP_MITOCHONDRIAL_ELECTRON_TRANSPORT_CYTOCHROME_C_TO_OXYGEN,0.002853066,1
3,Myotis-Auriculus,REACTOME_CYTOPROTECTION_BY_HMOX1,0.00721985,1
4,Myotis-Auriculus,REACTOME_EUKARYOTIC_TRANSLATION_ELONGATION,0.009115463,1
5,Myotis-Auriculus,GOBP_TRANSLATIONAL_ELONGATION,0.009304925,1
6,Myotis-Auriculus,REACTOME_TP53_REGULATES_METABOLIC_GENES,0.009873201,1
7,Myotis-Auriculus,REACTOME_RESPONSE_OF_EIF2AK4_GCN2_TO_AMINO_ACID_DEFICIENCY,0.010630649,1
8,Myotis-Auriculus,REACTOME_SRP_DEPENDENT_COTRANSLATIONAL_PROTEIN_TARGETING_TO_MEMBRANE,0.011198545,1
9,Myotis-Auriculus,REACTOME_NONSENSE_MEDIATED_DECAY_NMD,0.011577052,1
10,Myotis-Auriculus,GOBP_ATP_SYNTHESIS_COUPLED_ELECTRON_TRANSPORT,0.011766278,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Evotis,GOBP_NEGATIVE_REGULATION_OF_DENDRITE_DEVELOPMENT,0.002852251,1
2,Myotis-Evotis,REACTOME_UPTAKE_OF_DIETARY_COBALAMINS_INTO_ENTEROCYTES,0.003326993,1
3,Myotis-Evotis,REACTOME_SIGNALING_BY_FGFR2_IIIA_TM,0.003801554,1
4,Myotis-Evotis,REACTOME_ABORTIVE_ELONGATION_OF_HIV_1_TRANSCRIPT_IN_THE_ABSENCE_OF_TAT,0.004275935,1
5,Myotis-Evotis,REACTOME_FGFR2_ALTERNATIVE_SPLICING,0.004275935,1
6,Myotis-Evotis,REACTOME_MICRORNA_MIRNA_BIOGENESIS,0.004750134,1
7,Myotis-Evotis,REACTOME_HIV_ELONGATION_ARREST_AND_RECOVERY,0.006171649,1
8,Myotis-Evotis,REACTOME_MRNA_CAPPING,0.006645126,1
9,Myotis-Evotis,REACTOME_FORMATION_OF_THE_EARLY_ELONGATION_COMPLEX,0.007118422,1
10,Myotis-Evotis,REACTOME_COBALAMIN_CBL_VITAMIN_B12_TRANSPORT_AND_METABOLISM,0.007591538,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Yumanensis,REACTOME_PKR_MEDIATED_SIGNALING,0.0004753469,1
2,Myotis-Yumanensis,GOBP_REGULATION_OF_MICROTUBULE_POLYMERIZATION_OR_DEPOLYMERIZATION,0.0008457187,1
3,Myotis-Yumanensis,GOBP_HEAT_ACCLIMATION,0.0008564903,1
4,Myotis-Yumanensis,GOBP_MICROTUBULE_POLYMERIZATION_OR_DEPOLYMERIZATION,0.0020399816,1
5,Myotis-Yumanensis,REACTOME_ANTIVIRAL_MECHANISM_BY_IFN_STIMULATED_GENES,0.0022961628,1
6,Myotis-Yumanensis,GOBP_POSITIVE_REGULATION_OF_NUCLEASE_ACTIVITY,0.0025675149,1
7,Myotis-Yumanensis,GOBP_REGULATION_OF_MICROTUBULE_CYTOSKELETON_ORGANIZATION,0.0027362163,1
8,Myotis-Yumanensis,GOBP_AXONEMAL_CENTRAL_APPARATUS_ASSEMBLY,0.0034220501,1
9,Myotis-Yumanensis,GOBP_CAP_DEPENDENT_TRANSLATIONAL_INITIATION,0.0034220501,1
10,Myotis-Yumanensis,GOBP_ISG15_PROTEIN_CONJUGATION,0.0034220501,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Velifer,GOBP_POSITIVE_REGULATION_OF_OXIDATIVE_STRESS_INDUCED_INTRINSIC_APOPTOTIC_SIGNALING_PATHWAY,0.0004758279,1
2,Myotis-Velifer,GOBP_NUCLEOSIDE_BISPHOSPHATE_CATABOLIC_PROCESS,0.0007613247,1
3,Myotis-Velifer,GOBP_POSITIVE_REGULATION_OF_T_CELL_DIFFERENTIATION_IN_THYMUS,0.0007613247,1
4,Myotis-Velifer,REACTOME_VITAMIN_B5_PANTOTHENATE_METABOLISM,0.0011419871,1
5,Myotis-Velifer,GOBP_COENZYME_A_METABOLIC_PROCESS,0.0012371526,1
6,Myotis-Velifer,GOBP_CHRONIC_INFLAMMATORY_RESPONSE,0.0014274838,1
7,Myotis-Velifer,GOBP_REGULATION_OF_T_CELL_DIFFERENTIATION_IN_THYMUS,0.0015226494,1
8,Myotis-Velifer,GOBP_REGULATION_OF_OXIDATIVE_STRESS_INDUCED_INTRINSIC_APOPTOTIC_SIGNALING_PATHWAY,0.0026646365,1
9,Myotis-Velifer,GOBP_RIBONUCLEOTIDE_CATABOLIC_PROCESS,0.0027598021,1
10,Myotis-Velifer,GOBP_PURINE_CONTAINING_COMPOUND_CATABOLIC_PROCESS,0.0033307956,1


### No significant enrichments in N-1 peaks

## Private peaks

In [22]:
private_peaks <- fread("results/data/shared_promoters_private_peaks.csv", data.table = FALSE)

species <- unique(private_peaks$Species)
                                                                             
private_peak_enrichments <- lapply(species, function(spec){
  
  private_peaks_spec <- private_peaks[private_peaks$Species %in% spec,]
  private_peaks_enrich <- sort(unlist(lapply(sets, fisher_test,
                                             mod = private_peaks_spec$Gene,
                                             all = shared_genes$Gene)))
  return(data.frame(Species = spec,
                    Set = names(private_peaks_enrich), 
                    Pval = private_peaks_enrich,
                    Qval = qvalue(private_peaks_enrich)$qvalues,
                    row.names = NULL))
  
})
names(private_peak_enrichments) <- species

In [6]:
tapply(private_peaks$Gene, private_peaks$Species, "[")

In [10]:
lapply(private_peak_enrichments, head, 10)

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Velifer,LAKE_ADULT_KIDNEY_C18_COLLECTING_DUCT_PRINCIPAL_CELLS_MEDULLA,1.037684e-08,0.00035852
2,Myotis-Velifer,HSIAO_HOUSEKEEPING_GENES,7.196842e-08,0.001243255
3,Myotis-Velifer,LAKE_ADULT_KIDNEY_C19_COLLECTING_DUCT_INTERCALATED_CELLS_TYPE_A_MEDULLA,1.602782e-07,0.00184587
4,Myotis-Velifer,MORF_NPM1,9.186881e-07,0.007935168
5,Myotis-Velifer,LAKE_ADULT_KIDNEY_C8_DECENDING_THIN_LIMB,1.268707e-06,0.008766767
6,Myotis-Velifer,BUSSLINGER_DUODENAL_TRANSIT_AMPLIFYING_CELLS,2.397945e-06,0.013808168
7,Myotis-Velifer,GCM_NPM1,3.62949e-06,0.017914126
8,Myotis-Velifer,LAKE_ADULT_KIDNEY_C7_PROXIMAL_TUBULE_EPITHELIAL_CELLS_S3,6.303039e-06,0.026205168
9,Myotis-Velifer,MORF_ACTG1,7.1659e-06,0.026205168
10,Myotis-Velifer,LAKE_ADULT_KIDNEY_C10_THIN_ASCENDING_LIMB,7.584709e-06,0.026205168

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Volans,GOMF_NITRIC_OXIDE_SYNTHASE_BINDING,6.837965e-05,1
2,Myotis-Volans,MODULE_29,0.0003522728,1
3,Myotis-Volans,KEGG_MEDICUS_PATHOGEN_SARS_COV_2_NSP1_TO_TRANSLATION_INITIATION,0.0005397969,1
4,Myotis-Volans,REACTOME_SARS_COV_1_MODULATES_HOST_TRANSLATION_MACHINERY,0.0006109557,1
5,Myotis-Volans,GOBP_POSITIVE_REGULATION_OF_PROTEIN_SERINE_THREONINE_KINASE_ACTIVITY,0.0006499321,1
6,Myotis-Volans,GOCC_CYTOSOLIC_SMALL_RIBOSOMAL_SUBUNIT,0.0007661441,1
7,Myotis-Volans,MORF_NME2,0.0008327518,1
8,Myotis-Volans,GOBP_CELLULAR_RESPONSE_TO_OXYGEN_CONTAINING_COMPOUND,0.0008638493,1
9,Myotis-Volans,GOBP_CALCIUM_ION_IMPORT_ACROSS_PLASMA_MEMBRANE,0.000938377,1
10,Myotis-Volans,PARK_HSC_MARKERS,0.001228381,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Auriculus,MIR6759_3P,5.628154e-05,1
2,Myotis-Auriculus,chr4q23,6.322844e-05,1
3,Myotis-Auriculus,GSE12845_IGD_POS_VS_NEG_BLOOD_BCELL_DN,0.0003546956,1
4,Myotis-Auriculus,GSE360_L_DONOVANI_VS_M_TUBERCULOSIS_DC_UP,0.0004409767,1
5,Myotis-Auriculus,AIZARANI_LIVER_C23_KUPFFER_CELLS_3,0.0004618226,1
6,Myotis-Auriculus,ZAMORA_NOS2_TARGETS_UP,0.0008692779,1
7,Myotis-Auriculus,AP2ALPHA_01,0.0008857297,1
8,Myotis-Auriculus,GOCC_NUCLEOSOME,0.00129803,1
9,Myotis-Auriculus,TAKAO_RESPONSE_TO_UVB_RADIATION_UP,0.001543443,1
10,Myotis-Auriculus,WANG_RESPONSE_TO_GSK3_INHIBITOR_SB216763_DN,0.002333888,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Yumanensis,KEGG_GLYCINE_SERINE_AND_THREONINE_METABOLISM,8.104139e-05,1
2,Myotis-Yumanensis,YAO_TEMPORAL_RESPONSE_TO_PROGESTERONE_CLUSTER_16,0.0002781043,1
3,Myotis-Yumanensis,MIR5585_3P,0.0003288226,1
4,Myotis-Yumanensis,GSE26495_PD1HIGH_VS_PD1LOW_CD8_TCELL_UP,0.001184874,1
5,Myotis-Yumanensis,GSE1791_CTRL_VS_NEUROMEDINU_IN_T_CELL_LINE_6H_UP,0.001418062,1
6,Myotis-Yumanensis,HP_PERONEAL_MUSCLE_WEAKNESS,0.001712166,1
7,Myotis-Yumanensis,GSE41867_NAIVE_VS_DAY8_LCMV_ARMSTRONG_EFFECTOR_CD8_TCELL_DN,0.001790726,1
8,Myotis-Yumanensis,GSE41867_NAIVE_VS_DAY8_LCMV_EFFECTOR_CD8_TCELL_DN,0.002105969,1
9,Myotis-Yumanensis,GSE12198_CTRL_VS_LOW_IL2_STIM_NK_CELL_DN,0.002238974,1
10,Myotis-Yumanensis,GOBP_GROWTH_INVOLVED_IN_HEART_MORPHOGENESIS,0.002282344,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Occultus,GSE360_DC_VS_MAC_UP,0.0002657569,1
2,Myotis-Occultus,CAGTATT_MIR200B_MIR200C_MIR429,0.0003531187,1
3,Myotis-Occultus,KEGG_PATHOGENIC_ESCHERICHIA_COLI_INFECTION,0.0004104378,1
4,Myotis-Occultus,WP_PATHOGENIC_ESCHERICHIA_COLI_INFECTION,0.0004104378,1
5,Myotis-Occultus,HP_INCREASED_LDL_CHOLESTEROL_CONCENTRATION,0.0004859447,1
6,Myotis-Occultus,GSE24142_EARLY_THYMIC_PROGENITOR_VS_DN3_THYMOCYTE_ADULT_DN,0.0005563402,1
7,Myotis-Occultus,PID_AURORA_B_PATHWAY,0.0006108934,1
8,Myotis-Occultus,HP_HYPERLIPOPROTEINEMIA,0.0006556455,1
9,Myotis-Occultus,NAKAYAMA_FRA2_TARGETS,0.0007019427,1
10,Myotis-Occultus,GCM_PFN1,0.0007019427,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Californicus,GSE32034_LY6C_HIGH_VS_LOW_MONOCYTE_DN,0.0001542467,1
2,Myotis-Californicus,HP_ABNORMALITY_OF_THE_HYPOTHENAR_EMINENCE,0.0003806442,1
3,Myotis-Californicus,GOBP_CELLULAR_RESPONSE_TO_BRAIN_DERIVED_NEUROTROPHIC_FACTOR_STIMULUS,0.0005709392,1
4,Myotis-Californicus,HP_MESOMELIC_LEG_SHORTENING,0.0005709392,1
5,Myotis-Californicus,GOBP_REGULATION_OF_TRANSLATION_AT_SYNAPSE,0.000761216,1
6,Myotis-Californicus,GOBP_NEGATIVE_REGULATION_OF_TRANSLATIONAL_ELONGATION,0.0009514747,1
7,Myotis-Californicus,HP_SMALL_THENAR_EMINENCE,0.0009514747,1
8,Myotis-Californicus,GOBP_TRANSLATIONAL_READTHROUGH,0.0011417153,1
9,Myotis-Californicus,HP_AGENESIS_OF_CENTRAL_INCISOR,0.0011417153,1
10,Myotis-Californicus,GOBP_NEGATIVE_REGULATION_OF_EXCITATORY_POSTSYNAPTIC_POTENTIAL,0.0013319378,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Thysanodes,GOBP_REGULATION_OF_LAMELLIPODIUM_ASSEMBLY,0.0004658246,1
2,Myotis-Thysanodes,GOBP_NEGATIVE_REGULATION_OF_PROTEIN_LOCALIZATION_TO_MEMBRANE,0.0006864106,1
3,Myotis-Thysanodes,GOBP_REGULATION_OF_LAMELLIPODIUM_ORGANIZATION,0.0007480522,1
4,Myotis-Thysanodes,GSE3982_DC_VS_BCELL_DN,0.0007909563,1
5,Myotis-Thysanodes,GOMF_THIOLESTER_HYDROLASE_ACTIVITY,0.0008790731,1
6,Myotis-Thysanodes,GSE4984_UNTREATED_VS_LPS_TREATED_DC_DN,0.0009717089,1
7,Myotis-Thysanodes,GSE8685_IL2_ACT_IL2_STARVED_VS_IL15_ACT_IL2_STARVED_CD4_TCELL_UP,0.0009959898,1
8,Myotis-Thysanodes,GSE15330_MEGAKARYOCYTE_ERYTHROID_PROGENITOR_VS_PRO_BCELL_DN,0.0013473547,1
9,Myotis-Thysanodes,AAAGACA_MIR511,0.0013772116,1
10,Myotis-Thysanodes,GSE14769_UNSTIM_VS_360MIN_LPS_BMDM_DN,0.0014381741,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Lucifugus,GOBP_CENTROSOME_SEPARATION,0.0003899389,1
2,Myotis-Lucifugus,KEGG_OLFACTORY_TRANSDUCTION,0.0006074201,1
3,Myotis-Lucifugus,HP_ABNORMAL_NASOLACRIMAL_SYSTEM_MORPHOLOGY,0.0006074201,1
4,Myotis-Lucifugus,BOSCO_INTERFERON_INDUCED_ANTIVIRAL_MODULE,0.00088484,1
5,Myotis-Lucifugus,GSE24081_CONTROLLER_VS_PROGRESSOR_HIV_SPECIFIC_CD8_TCELL_DN,0.0009181104,1
6,Myotis-Lucifugus,GSE25123_WT_VS_PPARG_KO_MACROPHAGE_IL4_AND_ROSIGLITAZONE_STIM_UP,0.0009483047,1
7,Myotis-Lucifugus,GOCC_NUCLEAR_PORE,0.0009924642,1
8,Myotis-Lucifugus,GSE16450_CTRL_VS_IFNA_12H_STIM_MATURE_NEURON_CELL_LINE_UP,0.0010761123,1
9,Myotis-Lucifugus,BIOCARTA_VEGF_PATHWAY,0.001249112,1
10,Myotis-Lucifugus,GSE41867_LCMV_ARMSTRONG_VS_CLONE13_DAY15_EFFECTOR_CD8_TCELL_UP,0.001489449,1

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Evotis,GOCC_FICOLIN_1_RICH_GRANULE,0.0002231413,1
2,Myotis-Evotis,GSE22886_NAIVE_TCELL_VS_NKCELL_UP,0.0002614244,1
3,Myotis-Evotis,DESCARTES_FETAL_HEART_ELF3_AGBL2_POSITIVE_CELLS,0.0003254018,1
4,Myotis-Evotis,CHIBA_RESPONSE_TO_TSA,0.0003826864,1
5,Myotis-Evotis,SEMENZA_HIF1_TARGETS,0.0003826864,1
6,Myotis-Evotis,WINTER_HYPOXIA_METAGENE,0.0005706805,1
7,Myotis-Evotis,PID_HIF1_TFPATHWAY,0.00073713,1
8,Myotis-Evotis,MAP2K1_TARGET_GENES,0.0011419871,1
9,Myotis-Evotis,MODULE_83,0.0012417525,1
10,Myotis-Evotis,HP_ABNORMAL_MORPHOLOGY_OF_THE_MUSCULATURE_OF_THE_NECK,0.0013646722,1


In [12]:
names(private_peak_enrichments)
library(stringr)

In [14]:
head(df)

Unnamed: 0_level_0,Species,Set,Pval,Qval
Unnamed: 0_level_1,<chr>,<chr>,<dbl>,<dbl>
1,Myotis-Velifer,LAKE_ADULT_KIDNEY_C18_COLLECTING_DUCT_PRINCIPAL_CELLS_MEDULLA,1.037684e-08,0.00035852
2,Myotis-Velifer,HSIAO_HOUSEKEEPING_GENES,7.196842e-08,0.001243255
3,Myotis-Velifer,LAKE_ADULT_KIDNEY_C19_COLLECTING_DUCT_INTERCALATED_CELLS_TYPE_A_MEDULLA,1.602782e-07,0.00184587
4,Myotis-Velifer,MORF_NPM1,9.186881e-07,0.007935168
5,Myotis-Velifer,LAKE_ADULT_KIDNEY_C8_DECENDING_THIN_LIMB,1.268707e-06,0.008766767
6,Myotis-Velifer,BUSSLINGER_DUODENAL_TRANSIT_AMPLIFYING_CELLS,2.397945e-06,0.013808168


In [16]:
## Plot signif. enrichments:

df <- private_peak_enrichments[[1]]
df <- df %>%
  dplyr::filter(Qval < .05) %>%
  dplyr::mutate(
    Set = sapply(gsub("_", " ", Set), strwrap, width = 25)
  )
  
ggplot(df, aes(x = Set, y = -log10(Qval))) +
  geom_bar(stat = "identity") +
  theme_minimal() +
    theme(axis.title.x = element_blank(),
          axis.text.x = element_text(angle = 45, hjust = 1),
          axis.title.y = element_text(margin = margin(r = 15)),
          panel.grid = element_blank(),
          plot.margin = unit(c(4, 6, 4, 6), "cm")) +
    labs(title = "Proportion of transposable elements with peaks") +
    ylab("Proportion")

ERROR while rich displaying an object: [1m[33mError[39m in `geom_bar()`:[22m
[1m[22m[33m![39m Problem while setting up geom.
[36mi[39m Error occurred in the 1st layer.
[1mCaused by error in `abs()`:[22m
[33m![39m non-numeric argument to mathematical function

Traceback:
1. tryCatch(withCallingHandlers({
 .     if (!mime %in% names(repr::mime2repr)) 
 .         stop("No repr_* for mimetype ", mime, " in repr::mime2repr")
 .     rpr <- repr::mime2repr[[mime]](obj)
 .     if (is.null(rpr)) 
 .         return(NULL)
 .     prepare_content(is.raw(rpr), rpr)
 . }, error = error_handler), error = outer_handler)
2. tryCatchList(expr, classes, parentenv, handlers)
3. tryCatchOne(expr, names, parentenv, handlers[[1L]])
4. doTryCatch(return(expr), name, parentenv, handler)
5. withCallingHandlers({
 .     if (!mime %in% names(repr::mime2repr)) 
 .         stop("No repr_* for mimetype ", mime, " in repr::mime2repr")
 .     rpr <- repr::mime2repr[[mime]](obj)
 .     if (is.null(rpr)) 
 

## Semi-private peaks

In [3]:
# tapply(private_peaks$Gene, private_peaks$Species, "[")

In [1]:
# private_peaks <- fread("results/data/shared_promoters_semi_private_peaks.csv", data.table = FALSE)

# all_pairs <- table(private_peaks$Species)

# species <- names(all_pairs)[all_pairs >= 3]

# species <- species                        
# private_peak_enrichments <- lapply(species, function(spec){
  
#   private_peaks_spec <- private_peaks[private_peaks$Species %in% spec,]
#   private_peaks_enrich <- sort(unlist(lapply(sets, fisher_test,
#                                              mod = private_peaks_spec$Gene,
#                                              all = shared_genes$Gene)))
#   return(data.frame(Species = spec,
#                     Set = names(private_peaks_enrich), 
#                     Pval = private_peaks_enrich,
#                     Qval = qvalue(private_peaks_enrich)$qvalues,
#                     row.names = NULL))
  
# })
# names(private_peak_enrichments) <- species

In [2]:
# lapply(private_peak_enrichments, head, 10)