GO analysis of WT AZ gene expression: marker detection, clustering, and per-gene feature plots

In [1]:
library(here)
library(Matrix)
library(tidyverse)
library(Seurat)
library(ggpointdensity)
library(scales)
library(DropletUtils)
library(reticulate)
library(repr)
#library(DoubletFinder)
library(future)
library(RColorBrewer)
library(edgeR)
library(limma)
library(svglite)
#library(PCAtools)
# Raise the `future` package's cap on exported globals; the value is in bytes
# (100000 * 1024^2 bytes = 100000 MiB).
options(future.globals.maxSize = 100000 * 1024^2)

# Table read from protoplasting.csv; only its `logFC` and `genes` columns are
# used here. proto_list keeps the gene ids whose absolute logFC exceeds 1.
proto_genes <- read.csv("../data/bulk_data/protoplasting.csv")
proto_list <- as.character(
  proto_genes$genes[abs(proto_genes$logFC) > 1]
)

# Bulk results table (presumably edgeR output, judging by the file name --
# TODO confirm). NOTE(review): absolute, machine-specific path.
bulk_data <- read.csv(
  "/home/robotmessenger810/data/buckets/single_cell_bucket_3_4_21/IWT_RNA_seq/scRNA_flowers/outputs/bulk_edger_10_16_20.csv"
)


In [2]:
# Load the saved object that the Seurat calls in this notebook operate on
# (presumably the integrated WT dataset, judging by the file name).
seu_intd_wt <- readRDS("../data/intd_seu_objects/1_6_22_WT.rds")

In [None]:
# Compute marker genes for every identity class in seu_intd_wt.
# max.cells.per.ident = 1000 caps the number of cells tested per identity class.
cluster_AZ_all <- FindAllMarkers(
  object = seu_intd_wt,
  max.cells.per.ident = 1000
)

In [None]:
# Cache the full marker table on disk so FindAllMarkers() need not be rerun.
saveRDS(
  cluster_AZ_all,
  file = paste0("../data/markers/", "AZ_markers_WT_ALL_res_1_25_Feb_14_22", ".rds")
)

In [None]:
# Export two tables for gene set testing:
#   1. the marker rows for cluster 9 (the AZ-specific genes), and
#   2. the unique gene ids across all clusters, used as the gene universe.
# NOTE(review): the universe is built from FindAllMarkers() output, so it only
# holds genes that passed that function's own filters -- confirm this is the
# intended background set.
write.csv(
  cluster_AZ_all[cluster_AZ_all$cluster == 9, ],
  file = paste0("../data/for_figures/", "AZ_spec_genes_universe_WT_res_1_25_Jan_18_22", ".csv"),
  row.names = FALSE
)
write.csv(
  unique(cluster_AZ_all$gene),
  file = paste0("../data/for_figures/", "WT_universe_spec_genes_WT_res_1_25_Jan_18_22", ".csv"),
  row.names = FALSE
)

In [3]:
# Gene ids of interest; each one gets its own feature plot further down.
genes <- c(
  "AT3G44540", "AT3G44550", "AT3G44560", "AT5G22500",
  "AT1G53830", "AT2G41850", "AT2G47550", "AT3G07970",
  "AT3G24670", "AT3G27400", "AT4G24780", "AT1G28130",
  "AT2G14960", "AT2G16580", "AT2G28085", "AT2G36210",
  "AT3G07390", "AT4G14560", "AT4G27260", "AT4G28640",
  "AT5G54510"
)
# Echo the vector so the notebook shows the list.
genes

In [3]:
# Dimensionality reduction, graph clustering and UMAP on the integrated assay.
options(repr.plot.width = 12, repr.plot.height = 12)
resolution <- 1.25
set.seed(42)
DefaultAssay(seu_intd_wt) <- "integrated"

# PCA: with no `features` given, RunPCA() uses the assay's variable features.
# Per the RunPCA documentation, features must be present in the scaled data;
# any that are unscaled or have zero variance are dropped before the PCA runs.
# ScaleData() is not rerun in this cell.
seu_intd_wt <- RunPCA(
  seu_intd_wt,
  npcs = 100,
  verbose = FALSE,
  approx = FALSE
)

# The first 20 PCs feed both the neighbor graph and the UMAP
# (20 PCs were also used in the earlier run, as of 2/14/22).
seu_intd_wt <- FindNeighbors(
  seu_intd_wt,
  dims = 1:20,
  verbose = FALSE
)
seu_intd_wt <- FindClusters(
  seu_intd_wt,
  resolution = resolution,
  algorithm = 3,
  verbose = FALSE
)
seu_intd_wt <- RunUMAP(
  seu_intd_wt,
  reduction = "pca",
  dims = 1:20,
  verbose = FALSE
)

“The default method for RunUMAP has changed from calling Python UMAP via reticulate to the R-native UWOT using the cosine metric
To use Python UMAP via reticulate, set umap.method to 'umap-learn' and metric to 'correlation'
This message will be shown once per session”


In [6]:
# Write one feature plot per gene in `genes` to a PNG file, using the SCT assay.
DefaultAssay(seu_intd_wt) <- "SCT"
options(repr.plot.width = 8, repr.plot.height = 8)

# Make sure the target directory exists before the first ggsave() call;
# dir.create() is a silent no-op when the directory is already there.
gene_plot_dir <- "/home/robotmessenger810/sc_analysis/data/for_figures/gene_plots/figure_3_pngs/"
dir.create(gene_plot_dir, recursive = TRUE, showWarnings = FALSE)

for (g in genes) {
    # Arguments are spelled out in full (`min.cutoff`, `filename`) instead of
    # relying on R's partial argument matching of `min` and `file`.
    # `split.by = "experiment"` can be added to facet the plot by experiment.
    gene_plot <- FeaturePlot(
        seu_intd_wt,
        features = g,
        pt.size = 2.25,
        min.cutoff = 0.75,
        order = TRUE
    )
    # print(gene_plot)  # uncomment to also display each plot inline
    ggsave(
        filename = paste0(gene_plot_dir, g, ".png"),
        plot = gene_plot,
        width = 10,
        height = 10
    )
}

In [None]:
# Display the feature plot for a single gene (AT3G09220) from the SCT assay.
DefaultAssay(seu_intd_wt) <- "SCT"
# `min.cutoff` is written out in full; the previous `min = .75` only worked
# through R's partial argument matching.
FeaturePlot(
  seu_intd_wt,
  features = "AT3G09220",
  pt.size = 2.25,
  min.cutoff = 0.75,
  order = TRUE
)