# Dot plot of expression of cell type markers in the data

In [1]:
suppressWarnings({suppressMessages({
    library(Seurat) # the main framework for the scRNA-Seq analyses
    library(readxl)
    library(ggplot2)
})})

Loading the data.

In [2]:
# Load the serialized object from the RDS file in the working directory.
hgsoc <- readRDS(file = "HGSOC_CellHashing_noClustering.RDS")

Loading the ovarian cancer markers for different cell types.

In [3]:
# Read the marker table. The `geneSymbolmore1` column is expected to hold
# comma-separated gene symbols in each row.
celltypes <- as.data.frame(read_xlsx(path = "ovarian_cancer_markers.xlsx"))

# strsplit() is already vectorised, so no sapply() is needed; as.character()
# guards against an all-NA column being read as logical.
marker_tokens <- unlist(
    strsplit(x = as.character(celltypes$geneSymbolmore1), split = ",", fixed = TRUE),
    use.names = FALSE
)

# Trim surrounding whitespace so that entries written as "A, B" do not yield
# " B" (which would not match any feature name), then drop missing and empty
# tokens (e.g. from trailing commas) before de-duplicating.
marker_tokens <- trimws(marker_tokens)
genemarkers <- unique(marker_tokens[!is.na(marker_tokens) & nzchar(marker_tokens)])

In [4]:
# Display the contents of `genemarkers` for a visual check.
genemarkers

The plot uses only the DMSO-treated cells, but they are selected from the whole object rather than from a subset. This retains the normalization applied to the whole dataset.

In [5]:
# Preview the first rows of the per-cell metadata table.
head(hgsoc@meta.data)

Unnamed: 0_level_0,orig.ident,nCount_RNA,nFeature_RNA,percent.mt,percent.rb,Treatment_group,nCount_SCT,nFeature_SCT,S.Score,G2M.Score,Phase,old.ident,model
Unnamed: 0_level_1,<chr>,<dbl>,<int>,<dbl>,<dbl>,<chr>,<dbl>,<int>,<dbl>,<dbl>,<chr>,<fct>,<chr>
JHOS2_AAACCCAAGCAAATCA-1,SeuratProject,16825,4035,3.786033,33.961367,Fedratinib,26237,4020,-0.10758336,-0.24730111,G1,SeuratProject,JHOS2
JHOS2_AAACCCAAGGTCGCCT-1,SeuratProject,11839,3840,21.378495,9.705212,BMS-754807,25099,4281,-0.07747797,0.06673937,G2M,SeuratProject,JHOS2
JHOS2_AAACCCACAGAACATA-1,SeuratProject,25906,5255,5.867367,24.893847,SCH772984,26422,5202,-0.17890319,-0.31373625,G1,SeuratProject,JHOS2
JHOS2_AAACCCAGTCTGTCAA-1,SeuratProject,19029,4382,10.016291,24.105313,TGX-221,25961,4344,-0.19877877,-0.22370447,G1,SeuratProject,JHOS2
JHOS2_AAACCCAGTCTGTGGC-1,SeuratProject,63590,7494,3.21906,27.130052,Ipatasertib,26958,5246,0.86808988,0.14566181,S,SeuratProject,JHOS2
JHOS2_AAACCCAGTTGGACCC-1,SeuratProject,26547,4371,5.08532,38.550495,Ralimetinib,26738,4343,-0.20121598,-0.2512336,G1,SeuratProject,JHOS2


In [6]:
# Add a combined "<model>_<Treatment_group>" label for every cell, so that a
# model/treatment combination can be addressed by a single identity.
hgsoc@meta.data$treatment_ext <- with(
    hgsoc@meta.data,
    paste(model, Treatment_group, sep = "_")
)

In [7]:
# Preview the first values of the new `treatment_ext` metadata column.
head(hgsoc@meta.data$treatment_ext)

In [8]:
# Dot plot of the marker genes for the DMSO identities of the three models,
# written to a PDF file.
#
# The SCT assay is used and cells are grouped by the combined
# "<model>_<Treatment_group>" label stored in `treatment_ext`.
DefaultAssay(hgsoc) <- "SCT"
Idents(hgsoc) <- "treatment_ext"

# Build the plot BEFORE opening the PDF device: if DotPlot() fails (e.g. on an
# unknown identity), no graphics device is left open.
marker_dotplot <- DotPlot(
    hgsoc,
    idents = c("JHOS2_DMSO", "PDC1_DMSO", "PDC2_DMSO"),
    features = na.omit(genemarkers),
    scale = FALSE
) +
    ylab("") +
    xlab("") +
    # Second point layer with shape 21 draws a black outline for each dot.
    geom_point(aes(size = pct.exp), shape = 21, colour = "black", stroke = 0.5) +
    # Replaces the colour scale added by DotPlot(); ggplot2 reports this with a
    # "Scale for colour is already present" message.
    scale_color_gradient2(low = "blue", mid = "white", high = "red") +
    guides(size = guide_legend(
        title = "% Expression",
        override.aes = list(shape = 21, colour = "black", fill = "white")
    )) +
    theme(axis.text.x = element_text(angle = 45, hjust = 1, face = "italic"))

pdf(file = "DotPlot_cellTypeMarkers_reviewersOnly.pdf", height = 4, width = 15)
# Explicit print(): ggplot objects are only auto-printed at top level, so this
# keeps the PDF non-empty if the code is ever source()d or wrapped.
print(marker_dotplot)
dev.off()

[1m[22mScale for [32mcolour[39m is already present.
Adding another scale for [32mcolour[39m, which will replace the existing scale.


In [9]:
# Record the R version, platform and package versions used for this run.
sessionInfo()

R version 4.2.2 (2022-10-31)
Platform: x86_64-conda-linux-gnu (64-bit)
Running under: Rocky Linux 8.8 (Green Obsidian)

Matrix products: default
BLAS/LAPACK: /homedir01/adini22/.conda/envs/cellhashing_analyses/lib/libopenblasp-r0.3.21.so

locale:
 [1] LC_CTYPE=en_US.UTF-8       LC_NUMERIC=C              
 [3] LC_TIME=en_US.UTF-8        LC_COLLATE=en_US.UTF-8    
 [5] LC_MONETARY=en_US.UTF-8    LC_MESSAGES=en_US.UTF-8   
 [7] LC_PAPER=en_US.UTF-8       LC_NAME=C                 
 [9] LC_ADDRESS=C               LC_TELEPHONE=C            
[11] LC_MEASUREMENT=en_US.UTF-8 LC_IDENTIFICATION=C       

attached base packages:
[1] stats     graphics  grDevices utils     datasets  methods   base     

other attached packages:
[1] ggplot2_3.4.2      readxl_1.4.1       SeuratObject_4.1.3 Seurat_4.3.0.9002 

loaded via a namespace (and not attached):
  [1] Rtsne_0.16             colorspace_2.1-0       deldir_1.0-6          
  [4] ellipsis_0.3.2         ggridges_0.5.4         IRdisplay_1.1         
