In [86]:
library(here)
library(Matrix)
library(tidyverse)
library(Seurat)
library(ggpointdensity)
library(scales)
library(reticulate)
library(repr)
#library(DoubletFinder)
library(future)
library(RColorBrewer)
library(edgeR)
library(limma)
#library(PCAtools)
options(future.globals.maxSize = 100000 * 1024^2)
source(here("R_functions","edgeR_function.R"))

# Gene annotation lookup table. The CSV is read without a header row, so the
# two columns are named explicitly afterwards.
# NOTE(review): this path is resolved against the working directory, whereas
# edgeR_function.R from the same folder is located with here() -- confirm both
# point at the same R_functions directory.
annotations <- read.csv("R_functions/gene_descriptions.csv", header = FALSE)
colnames(annotations) <- c("gene_id", "description")
# Keep only the first nine characters of every identifier.
# presumably this strips a transcript/version suffix -- TODO confirm
annotations$gene_id <- substr(annotations$gene_id, 1, 9)

# Genes whose absolute logFC in the protoplasting table exceeds 1.
# which() drops rows with a missing logFC instead of producing NA entries.
proto_genes <- read.csv("../data/bulk_data/protoplasting.csv")
proto_list <- as.character(
  proto_genes$genes[which(abs(proto_genes$logFC) > 1)]
)

# NOTE(review): absolute, machine-specific path -- the script only runs where
# this bucket is mounted at exactly this location.
bulk_data <- read.csv("/home/robotmessenger810/data/buckets/single_cell_bucket_3_4_21/IWT_RNA_seq/scRNA_flowers/outputs/bulk_edger_10_16_20.csv")


In [2]:
# Load the two serialized Seurat objects used below (one per RDS file).
seu_intd_wt <- readRDS(
  "../data/seurat_objects/seurat_WT_intd_2_17_21.rds"
)
seu_intd_mut <- readRDS(
  "../data/seurat_objects/seurat_mut_intd_label_transferred_3_10_22.rds"
)

In [3]:
# Pseudo-bulk the four libraries stored in seu_intd_wt: for each library
# (orig.ident value), sum the raw RNA counts per gene over the cells whose
# active identity equals `cluster`.
cluster <- "9"
DefaultAssay(seu_intd_wt) <- "RNA"

# Fetch the count matrix and the cluster membership once instead of calling
# subset() twice per library.
# NOTE(review): newer SeuratObject releases prefer `layer =` over `slot =` --
# confirm against the installed version.
wt_counts <- GetAssayData(seu_intd_wt, slot = "counts")
wt_cluster_cells <- WhichCells(seu_intd_wt, idents = cluster)
wt_cell_library <- as.character(seu_intd_wt$orig.ident)
names(wt_cell_library) <- colnames(seu_intd_wt)

# Per-gene count totals for the cluster's cells that belong to one library.
sum_wt_library_counts <- function(library_id) {
  # %in% (rather than ==) so a missing orig.ident can never select a cell.
  in_library <- wt_cell_library[wt_cluster_cells] %in% library_id
  cells <- wt_cluster_cells[in_library]
  if (length(cells) == 0) {
    stop(
      "No cells with identity '", cluster, "' found in library '",
      library_id, "'",
      call. = FALSE
    )
  }
  # drop = FALSE keeps a one-cell selection as a matrix; Matrix::rowSums sums
  # the selection without first converting it to a dense matrix.
  Matrix::rowSums(wt_counts[, cells, drop = FALSE])
}

wt_1_AZ <- sum_wt_library_counts("sc_26_combined")
wt_2_AZ <- sum_wt_library_counts("sc_67")
YFP_1_AZ <- sum_wt_library_counts("sc_101")
YFP_2_AZ <- sum_wt_library_counts("sc_103")



In [4]:
# Pseudo-bulk the four libraries stored in seu_intd_mut: for each library
# (orig.ident value), sum the raw RNA counts per gene over the cells whose
# active identity equals `cluster`.
cluster <- "11"
DefaultAssay(seu_intd_mut) <- "RNA"

# Fetch the count matrix and the cluster membership once instead of calling
# subset() twice per library.
# NOTE(review): newer SeuratObject releases prefer `layer =` over `slot =` --
# confirm against the installed version.
mut_counts <- GetAssayData(seu_intd_mut, slot = "counts")
mut_cluster_cells <- WhichCells(seu_intd_mut, idents = cluster)
mut_cell_library <- as.character(seu_intd_mut$orig.ident)
names(mut_cell_library) <- colnames(seu_intd_mut)

# Per-gene count totals for the cluster's cells that belong to one library.
sum_mut_library_counts <- function(library_id) {
  # %in% (rather than ==) so a missing orig.ident can never select a cell.
  in_library <- mut_cell_library[mut_cluster_cells] %in% library_id
  cells <- mut_cluster_cells[in_library]
  if (length(cells) == 0) {
    stop(
      "No cells with identity '", cluster, "' found in library '",
      library_id, "'",
      call. = FALSE
    )
  }
  # drop = FALSE keeps a one-cell selection as a matrix; Matrix::rowSums sums
  # the selection without first converting it to a dense matrix.
  Matrix::rowSums(mut_counts[, cells, drop = FALSE])
}

mut_1_AZ <- sum_mut_library_counts("sc_27_combined")
mut_2_AZ <- sum_mut_library_counts("sc_68")
KE_1_AZ <- sum_mut_library_counts("sc_102")
KE_2_AZ <- sum_mut_library_counts("sc_104")


In [5]:
# Gene names shared by wt_1_AZ and mut_1_AZ; every pseudo-bulk vector is then
# re-indexed by that list so all eight end up with the same genes in the same
# order.
gene_intersection <- intersect(names(wt_1_AZ), names(mut_1_AZ))

# Vectors derived from seu_intd_wt
wt_1_AZ <- wt_1_AZ[gene_intersection]
wt_2_AZ <- wt_2_AZ[gene_intersection]
YFP_1_AZ <- YFP_1_AZ[gene_intersection]
YFP_2_AZ <- YFP_2_AZ[gene_intersection]

# Vectors derived from seu_intd_mut
mut_1_AZ <- mut_1_AZ[gene_intersection]
mut_2_AZ <- mut_2_AZ[gene_intersection]
KE_1_AZ <- KE_1_AZ[gene_intersection]
KE_2_AZ <- KE_2_AZ[gene_intersection]

In [19]:
# Assemble the pseudo-bulk table: one column per library, one row per gene in
# gene_intersection.
pb_df <- data.frame(
  WT1 = wt_1_AZ,
  WT2 = wt_2_AZ,
  YFP1 = YFP_1_AZ,
  YFP2 = YFP_2_AZ,
  mut1 = mut_1_AZ,
  mut2 = mut_2_AZ,
  KE1 = KE_1_AZ,
  KE2 = KE_2_AZ,
  row.names = gene_intersection
)

In [15]:
# Save the pseudo-bulk table; row names are written as the first CSV column.
write.csv(
  x = pb_df,
  file = "../data/pseudo_bulk_data/AZ_pbs_2_18_22.csv"
)

In [24]:
# Reload the saved pseudo-bulk table, using the first CSV column as the row
# names so that it does not remain as a data column.
pb_df <- read.csv(
  "../data/pseudo_bulk_data/AZ_pbs_2_18_22.csv",
  row.names = 1
)

In [32]:
# put experimental covariates in
# Columns 1-4 of pb_df are passed as the "WT" group and columns 5-8 as the
# "mut" group; edgeR_2_sample() is defined in R_functions/edgeR_function.R.
bulk_edger_1 <- edgeR_2_sample(
  pb_df,
  "WT",
  "mut",
  c(1, 2, 3, 4),
  c(5, 6, 7, 8),
  annotations
)

In [79]:
# Same inputs as the edgeR_2_sample() call, run through the
# edgeR_2_sample_other_factors() variant of the helper.
bulk_edger_2 <- edgeR_2_sample_other_factors(
  pb_df,
  "WT",
  "mut",
  c(1, 2, 3, 4),
  c(5, 6, 7, 8),
  annotations
)

In [44]:
# Split the first edgeR result into rows with FDR below 0.2 and logFC above 1,
# and rows with FDR below 0.2 and logFC below -1.
passes_fdr_1 <- bulk_edger_1$FDR < .2
logfc_1 <- bulk_edger_1$logFC

WT_higher_1 <- bulk_edger_1[passes_fdr_1 & logfc_1 > 1, ]
WT_lower_1 <- bulk_edger_1[passes_fdr_1 & logfc_1 < -1, ]

In [94]:
# Save the edgeR_2_sample_other_factors() result table.
write.csv(
  x = bulk_edger_2,
  file = "../data/pseudo_bulk_data/AZ_edger_2_18_22_factors.csv"
)