## Estimating doublets on preprocessed data

Import necessary libraries

In [2]:
library(Seurat)
library(dplyr)
library(magrittr)
IRdisplay::display_html("<style> .container { width:95% !important; } </style>")
library("xlsx")

"package 'dplyr' was built under R version 3.6.3"
Attaching package: 'dplyr'

The following objects are masked from 'package:stats':

    filter, lag

The following objects are masked from 'package:base':

    intersect, setdiff, setequal, union

"package 'magrittr' was built under R version 3.6.3"

"package 'xlsx' was built under R version 3.6.3"

## Quick data quality check on each sample

### Control (eYFP)

In [None]:
# Load the raw 10x feature-barcode matrix of the eYFP control sample and
# append the sample name to every barcode.
VTA_YFP.data <- Read10X(
  data.dir = "D:/scRNAseq/30-453842648/01_analysis/cellranger_count/YFP/raw_feature_bc_matrix"
)
colnames(VTA_YFP.data) <- paste0(colnames(VTA_YFP.data), "VTA_YFP")

# Build the Seurat object (min.cells = 3, min.features = 200).
VTA_YFP <- CreateSeuratObject(
  counts = VTA_YFP.data,
  project = "10X_VTA_stim",
  min.cells = 3,
  min.features = 200
)

# Drop the "-1" suffix from the barcodes and record the sample in `stim`.
new_barcodes <- gsub("-1", "", colnames(VTA_YFP))
VTA_YFP <- RenameCells(VTA_YFP, new.names = new_barcodes)
VTA_YFP@meta.data$stim <- "VTA_YFP"

# Per-cell mitochondrial FRACTION (0-1, not a percentage): counts of the
# "mt-" genes divided by the total counts of the cell.
mito.features <- grep("^mt-", rownames(VTA_YFP), value = TRUE)
percent.mito <- local({
  umi <- GetAssayData(object = VTA_YFP, slot = "counts")
  Matrix::colSums(x = umi[mito.features, ]) / Matrix::colSums(x = umi)
})
VTA_YFP[["percent.mito"]] <- percent.mito

In [None]:
# Peek at the first rows of the per-cell metadata.
head(x = VTA_YFP@meta.data)

In [None]:
# QC plots for the eYFP sample: mito fraction against total counts per cell,
# then histograms of each (the count histogram is zoomed to 0-8000).
FeatureScatter(
  object = VTA_YFP,
  feature1 = "nCount_RNA",
  feature2 = "percent.mito",
  pt.size = 0.1
)
hist(VTA_YFP@meta.data$percent.mito, breaks = seq(from = 0, to = 0.7, by = 0.01))
hist(
  VTA_YFP@meta.data$nCount_RNA,
  breaks = seq(from = 0, to = 1000000, by = 300),
  xlim = c(0, 8000)
)

### LH stim

In [None]:
# Load the raw 10x feature-barcode matrix of the LH-stim sample and append the
# sample name to every barcode.
VTA_LH.data <- Read10X(
  data.dir = "D:/scRNAseq/30-573274809/01_analysis/cellranger_count/LH/raw_feature_bc_matrix"
)
colnames(VTA_LH.data) <- paste0(colnames(VTA_LH.data), "VTA_LH")

# Build the Seurat object (min.cells = 3, min.features = 200).
VTA_LH <- CreateSeuratObject(
  counts = VTA_LH.data,
  project = "10X_VTA_stim",
  min.cells = 3,
  min.features = 200
)

# Drop the "-1" suffix from the barcodes and record the sample in `stim`.
new_barcodes <- gsub("-1", "", colnames(VTA_LH))
VTA_LH <- RenameCells(VTA_LH, new.names = new_barcodes)
VTA_LH@meta.data$stim <- "VTA_LH"

# Per-cell mitochondrial FRACTION (0-1, not a percentage): counts of the
# "mt-" genes divided by the total counts of the cell.
mito.features <- grep("^mt-", rownames(VTA_LH), value = TRUE)
percent.mito <- local({
  umi <- GetAssayData(object = VTA_LH, slot = "counts")
  Matrix::colSums(x = umi[mito.features, ]) / Matrix::colSums(x = umi)
})
VTA_LH[["percent.mito"]] <- percent.mito

In [None]:
# QC plots for the LH sample: mito fraction against total counts per cell,
# then histograms of each (the count histogram is zoomed to 0-8000).
FeatureScatter(
  object = VTA_LH,
  feature1 = "nCount_RNA",
  feature2 = "percent.mito",
  pt.size = 0.1
)
hist(VTA_LH@meta.data$percent.mito, breaks = seq(from = 0, to = 0.7, by = 0.01))
hist(
  VTA_LH@meta.data$nCount_RNA,
  breaks = seq(from = 0, to = 1000000, by = 300),
  xlim = c(0, 8000)
)

### NAc stim

In [None]:
# Load the raw 10x feature-barcode matrix of the NAc-stim sample and append
# the sample name to every barcode.
VTA_NAc.data <- Read10X(
  data.dir = "D:/scRNAseq/30-573274809/01_analysis/cellranger_count/NAc/raw_feature_bc_matrix"
)
colnames(VTA_NAc.data) <- paste0(colnames(VTA_NAc.data), "VTA_NAc")

# Build the Seurat object (min.cells = 3, min.features = 200).
VTA_NAc <- CreateSeuratObject(
  counts = VTA_NAc.data,
  project = "10X_VTA_stim",
  min.cells = 3,
  min.features = 200
)

# Drop the "-1" suffix from the barcodes and record the sample in `stim`.
new_barcodes <- gsub("-1", "", colnames(VTA_NAc))
VTA_NAc <- RenameCells(VTA_NAc, new.names = new_barcodes)
VTA_NAc@meta.data$stim <- "VTA_NAc"

# Per-cell mitochondrial FRACTION (0-1, not a percentage): counts of the
# "mt-" genes divided by the total counts of the cell.
mito.features <- grep("^mt-", rownames(VTA_NAc), value = TRUE)
percent.mito <- local({
  umi <- GetAssayData(object = VTA_NAc, slot = "counts")
  Matrix::colSums(x = umi[mito.features, ]) / Matrix::colSums(x = umi)
})
VTA_NAc[["percent.mito"]] <- percent.mito

In [None]:
# QC plots for the NAc sample: mito fraction against total counts per cell,
# then histograms of each (the count histogram is zoomed to 0-8000).
FeatureScatter(
  object = VTA_NAc,
  feature1 = "nCount_RNA",
  feature2 = "percent.mito",
  pt.size = 0.1
)
hist(VTA_NAc@meta.data$percent.mito, breaks = seq(from = 0, to = 0.7, by = 0.01))
hist(
  VTA_NAc@meta.data$nCount_RNA,
  breaks = seq(from = 0, to = 1000000, by = 300),
  xlim = c(0, 8000)
)

### PFC stim

In [None]:
# Load the raw 10x feature-barcode matrix of the PFC-stim sample and append
# the sample name to every barcode.
VTA_PFC.data <- Read10X(
  data.dir = "D:/scRNAseq/30-573274809/01_analysis/cellranger_count/PFC/raw_feature_bc_matrix"
)
colnames(VTA_PFC.data) <- paste0(colnames(VTA_PFC.data), "VTA_PFC")

# Build the Seurat object (min.cells = 3, min.features = 200).
VTA_PFC <- CreateSeuratObject(
  counts = VTA_PFC.data,
  project = "10X_VTA_stim",
  min.cells = 3,
  min.features = 200
)

# Drop the "-1" suffix from the barcodes and record the sample in `stim`.
new_barcodes <- gsub("-1", "", colnames(VTA_PFC))
VTA_PFC <- RenameCells(VTA_PFC, new.names = new_barcodes)
VTA_PFC@meta.data$stim <- "VTA_PFC"

# Per-cell mitochondrial FRACTION (0-1, not a percentage): counts of the
# "mt-" genes divided by the total counts of the cell.
mito.features <- grep("^mt-", rownames(VTA_PFC), value = TRUE)
percent.mito <- local({
  umi <- GetAssayData(object = VTA_PFC, slot = "counts")
  Matrix::colSums(x = umi[mito.features, ]) / Matrix::colSums(x = umi)
})
VTA_PFC[["percent.mito"]] <- percent.mito

In [None]:
# QC plots for the PFC sample: mito fraction against total counts per cell,
# then histograms of each (the count histogram is zoomed to 0-8000).
FeatureScatter(
  object = VTA_PFC,
  feature1 = "nCount_RNA",
  feature2 = "percent.mito",
  pt.size = 0.1
)
hist(VTA_PFC@meta.data$percent.mito, breaks = seq(from = 0, to = 0.7, by = 0.01))
hist(
  VTA_PFC@meta.data$nCount_RNA,
  breaks = seq(from = 0, to = 1000000, by = 300),
  xlim = c(0, 8000)
)

# Doublet simulation

Data normalization, scaling, and dimensionality reduction

In [None]:
# Names of the four samples handled in this notebook.
# NOTE(review): this variable shadows base::sample() in the global environment.
sample <- c("VTA_YFP", "VTA_LH", "VTA_NAc", "VTA_PFC")

In [None]:
# QC filter for the eYFP sample: keep cells with 700 < nCount_RNA < 25000 and
# a mitochondrial fraction below 0.01. percent.mito is stored as a fraction,
# so 0.01 means 1%; adjust the cutoffs here if needed.
VTA_YFP <- subset(
  x = VTA_YFP,
  subset = nCount_RNA > 700 & nCount_RNA < 25000 & percent.mito < 0.01
)

In [None]:
# Alternative, looser QC filter (disabled):
#VTA_YFP <- subset(x = VTA_YFP, subset = nCount_RNA > 500 & nCount_RNA < 25000 & percent.mito < 0.05)

# Standard Seurat preprocessing for the eYFP sample: normalize, pick 2000
# variable genes (vst), scale all genes while regressing out nCount_RNA and
# percent.mito, run PCA on the variable genes, then build the neighbor graph
# on PCs 1-30 and cluster at resolution 0.8.
VTA_YFP <- NormalizeData(object = VTA_YFP, verbose = FALSE)
VTA_YFP <- FindVariableFeatures(
  object = VTA_YFP,
  selection.method = "vst",
  nfeatures = 2000,
  verbose = FALSE
)
VTA_YFP <- ScaleData(
  object = VTA_YFP,
  features = rownames(x = VTA_YFP),
  vars.to.regress = c("nCount_RNA", "percent.mito")
)
VTA_YFP <- RunPCA(
  object = VTA_YFP,
  features = VariableFeatures(object = VTA_YFP),
  verbose = FALSE
)
VTA_YFP <- FindNeighbors(object = VTA_YFP, dims = 1:30)
VTA_YFP <- FindClusters(object = VTA_YFP, resolution = 0.8)

# Checkpoint the clustered object to disk.
saveRDS(
  VTA_YFP,
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_YFP"
)

In [None]:
# Read back the tab-delimited expression table exported for the eYFP sample.
my_data <- read.delim(
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/YFP/counts.txt"
)

In [None]:
# Restore the clustered eYFP object from its RDS checkpoint.
VTA_YFP <- readRDS("/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_YFP")

In [None]:
# QC filter for the LH sample: 800 < nCount_RNA < 25000 and a mitochondrial
# fraction below 0.01 (percent.mito is a fraction, so 0.01 means 1%).
VTA_LH <- subset(
  x = VTA_LH,
  subset = nCount_RNA > 800 & nCount_RNA < 25000 & percent.mito < 0.01
)

# Standard Seurat preprocessing: normalize, pick 2000 variable genes (vst),
# scale all genes while regressing out nCount_RNA and percent.mito, run PCA on
# the variable genes, then build the neighbor graph on PCs 1-30 and cluster at
# resolution 0.8.
VTA_LH <- NormalizeData(object = VTA_LH, verbose = FALSE)
VTA_LH <- FindVariableFeatures(
  object = VTA_LH,
  selection.method = "vst",
  nfeatures = 2000,
  verbose = FALSE
)
VTA_LH <- ScaleData(
  object = VTA_LH,
  features = rownames(x = VTA_LH),
  vars.to.regress = c("nCount_RNA", "percent.mito")
)
VTA_LH <- RunPCA(
  object = VTA_LH,
  features = VariableFeatures(object = VTA_LH),
  verbose = FALSE
)
VTA_LH <- FindNeighbors(object = VTA_LH, dims = 1:30)
VTA_LH <- FindClusters(object = VTA_LH, resolution = 0.8)

# Checkpoint the clustered object to disk.
saveRDS(
  VTA_LH,
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_LH"
)

In [None]:
# Restore the clustered LH object from its RDS checkpoint.
VTA_LH <- readRDS("/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_LH")

In [None]:
# QC filter for the NAc sample: 800 < nCount_RNA < 25000 and a mitochondrial
# fraction below 0.01 (percent.mito is a fraction, so 0.01 means 1%).
VTA_NAc <- subset(
  x = VTA_NAc,
  subset = nCount_RNA > 800 & nCount_RNA < 25000 & percent.mito < 0.01
)

# Standard Seurat preprocessing: normalize, pick 2000 variable genes (vst),
# scale all genes while regressing out nCount_RNA and percent.mito, run PCA on
# the variable genes, then build the neighbor graph on PCs 1-30 and cluster at
# resolution 0.8.
VTA_NAc <- NormalizeData(object = VTA_NAc, verbose = FALSE)
VTA_NAc <- FindVariableFeatures(
  object = VTA_NAc,
  selection.method = "vst",
  nfeatures = 2000,
  verbose = FALSE
)
VTA_NAc <- ScaleData(
  object = VTA_NAc,
  features = rownames(x = VTA_NAc),
  vars.to.regress = c("nCount_RNA", "percent.mito")
)
VTA_NAc <- RunPCA(
  object = VTA_NAc,
  features = VariableFeatures(object = VTA_NAc),
  verbose = FALSE
)
VTA_NAc <- FindNeighbors(object = VTA_NAc, dims = 1:30)
VTA_NAc <- FindClusters(object = VTA_NAc, resolution = 0.8)

# Checkpoint the clustered object to disk.
saveRDS(
  VTA_NAc,
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_NAc"
)

In [None]:
# Restore the clustered NAc object from its RDS checkpoint.
VTA_NAc <- readRDS("/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_NAc")

In [None]:
# QC filter for the PFC sample: 900 < nCount_RNA < 25000 and a mitochondrial
# fraction below 0.01. percent.mito is stored as a fraction, so 0.01 means 1%;
# adjust the cutoffs here if needed.
VTA_PFC <- subset(
  x = VTA_PFC,
  subset = nCount_RNA > 900 & nCount_RNA < 25000 & percent.mito < 0.01
)
# Inspect the structure of the filtered object.
str(object = VTA_PFC)

In [None]:
# Standard Seurat preprocessing for the PFC sample: normalize, pick 2000
# variable genes (vst), scale all genes while regressing out nCount_RNA and
# percent.mito, run PCA on the variable genes, then build the neighbor graph
# on PCs 1-30 and cluster at resolution 0.8.
VTA_PFC <- NormalizeData(object = VTA_PFC, verbose = FALSE)
VTA_PFC <- FindVariableFeatures(
  object = VTA_PFC,
  selection.method = "vst",
  nfeatures = 2000,
  verbose = FALSE
)
VTA_PFC <- ScaleData(
  object = VTA_PFC,
  features = rownames(x = VTA_PFC),
  vars.to.regress = c("nCount_RNA", "percent.mito")
)
VTA_PFC <- RunPCA(
  object = VTA_PFC,
  features = VariableFeatures(object = VTA_PFC),
  verbose = FALSE
)
VTA_PFC <- FindNeighbors(object = VTA_PFC, dims = 1:30)
VTA_PFC <- FindClusters(object = VTA_PFC, resolution = 0.8)

# Checkpoint the clustered object to disk.
saveRDS(
  VTA_PFC,
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_PFC"
)

In [None]:
# Restore the clustered PFC object from its RDS checkpoint.
VTA_PFC <- readRDS("/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_PFC")

Run UMAP on each sample separately

In [None]:
# UMAP embedding of the eYFP sample from PCs 1-30.
VTA_YFP <- RunUMAP(object = VTA_YFP, dims = 1:30, reduction = "pca")

In [None]:
# UMAP embedding of the LH sample from PCs 1-30.
VTA_LH <- RunUMAP(object = VTA_LH, dims = 1:30, reduction = "pca")

In [None]:
# UMAP embedding of the PFC sample from PCs 1-30.
VTA_PFC <- RunUMAP(object = VTA_PFC, dims = 1:30, reduction = "pca")

In [None]:
# UMAP embedding of the NAc sample from PCs 1-30.
VTA_NAc <- RunUMAP(object = VTA_NAc, dims = 1:30, reduction = "pca")

In [None]:
# Inspect the structure of the PFC object.
str(object = VTA_PFC)

Re-import files if necessary

In [None]:
# Reload all four clustered objects from their RDS checkpoints. Anything added
# to the in-memory objects after the checkpoints were written is replaced by
# the saved state.
VTA_YFP <- readRDS("/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_YFP")
VTA_LH <- readRDS("/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_LH")
VTA_NAc <- readRDS("/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_NAc")
VTA_PFC <- readRDS("/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/VTA_PFC")

In [None]:
# Export the three text files read by DoubletDecon's Seurat_Pre_Process() for
# the eYFP control sample: expression matrix, per-cluster marker genes, and
# the cluster label of every cell.

# Expression values from the `data` slot of the RNA assay, written with the
# gene names in a leading "GENE" column.
counts <- as.matrix(VTA_YFP@assays$RNA@data)
write.table(
  data.frame("GENE" = rownames(counts), counts),
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/YFP/counts.txt",
  row.names = FALSE,
  sep = "\t"
)

markers <- FindAllMarkers(object = VTA_YFP, only.pos = TRUE, min.pct = 0.25)

# top_n() without `wt` ranks by the LAST column of its input, which for
# FindAllMarkers() output is the gene name, so the "top 50" would be an
# alphabetical cut. Rank explicitly by log fold-change instead; the column is
# `avg_logFC` in Seurat v3 and `avg_log2FC` from Seurat v4 on.
fc_col <- intersect(c("avg_log2FC", "avg_logFC"), colnames(markers))
stopifnot(length(fc_col) >= 1)
top_50 <- markers %>%
  group_by(cluster) %>%
  top_n(50, wt = .data[[fc_col[1]]])
write.table(
  data.frame("test" = as.character(rownames(top_50)), top_50),
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/YFP/Top50Genes.txt",
  row.names = FALSE,
  col.names = c("", colnames(top_50)),
  sep = "\t",
  eol = "\n"
)

# One row per cell: barcode and cluster identity. as.matrix() on the identity
# factor already yields a character matrix with the barcodes as row names, so
# no further conversion is needed.
cluster <- as.matrix(Idents(object = VTA_YFP))
cluster <- data.frame("x" = rownames(cluster), cluster)
write.table(
  cluster,
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/YFP/Cluster.txt",
  row.names = FALSE,
  col.names = c("", "x"),
  sep = "\t",
  eol = "\n"
)

In [None]:
# Run DoubletDecon on the eYFP control sample, using the counts / marker /
# cluster text files found in `location`.
library("DoubletDecon")

location <- "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/YFP/" #Update as needed
expressionFile <- paste0(location, "counts.txt")
genesFile <- paste0(location, "Top50Genes.txt")
clustersFile <- paste0(location, "Cluster.txt")

# Convert the Seurat exports into the inputs Main_Doublet_Decon() takes.
newFiles <- Seurat_Pre_Process(expressionFile, genesFile, clustersFile)

# Output files are written into `location` (write = TRUE) and tagged "cntl".
results <- Main_Doublet_Decon(
  rawDataFile = newFiles$newExpressionFile,
  groupsFile = newFiles$newGroupsFile,
  filename = "cntl",
  location = location,
  fullDataFile = NULL,
  useFull = FALSE,
  removeCC = FALSE,
  species = "mmu",
  rhop = 1.1,
  PMF = TRUE,
  centroids = TRUE,
  num_doubs = 100,
  only50 = TRUE,
  min_uniq = 4,
  heatmap = FALSE,
  write = TRUE
)

In [None]:
# Export the three text files read by DoubletDecon's Seurat_Pre_Process() for
# the LH sample: expression matrix, per-cluster marker genes, and the cluster
# label of every cell.

# Expression values from the `data` slot of the RNA assay, written with the
# gene names in a leading "GENE" column.
counts <- as.matrix(VTA_LH@assays$RNA@data)
write.table(
  data.frame("GENE" = rownames(counts), counts),
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/LH/counts.txt",
  row.names = FALSE,
  sep = "\t"
)

markers <- FindAllMarkers(object = VTA_LH, only.pos = TRUE, min.pct = 0.25)

# top_n() without `wt` ranks by the LAST column of its input, which for
# FindAllMarkers() output is the gene name, so the "top 50" would be an
# alphabetical cut. Rank explicitly by log fold-change instead; the column is
# `avg_logFC` in Seurat v3 and `avg_log2FC` from Seurat v4 on.
fc_col <- intersect(c("avg_log2FC", "avg_logFC"), colnames(markers))
stopifnot(length(fc_col) >= 1)
top_50 <- markers %>%
  group_by(cluster) %>%
  top_n(50, wt = .data[[fc_col[1]]])
write.table(
  data.frame("test" = as.character(rownames(top_50)), top_50),
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/LH/Top50Genes.txt",
  row.names = FALSE,
  col.names = c("", colnames(top_50)),
  sep = "\t",
  eol = "\n"
)

# One row per cell: barcode and cluster identity. as.matrix() on the identity
# factor already yields a character matrix with the barcodes as row names, so
# no further conversion is needed.
cluster <- as.matrix(Idents(object = VTA_LH))
cluster <- data.frame("x" = rownames(cluster), cluster)
write.table(
  cluster,
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/LH/Cluster.txt",
  row.names = FALSE,
  col.names = c("", "x"),
  sep = "\t",
  eol = "\n"
)

In [None]:
# Run DoubletDecon on the LH sample, using the counts / marker / cluster text
# files found in `location`.
library("DoubletDecon")

location <- "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/LH/" #Update as needed
expressionFile <- paste0(location, "counts.txt")
genesFile <- paste0(location, "Top50Genes.txt")
clustersFile <- paste0(location, "Cluster.txt")

# Convert the Seurat exports into the inputs Main_Doublet_Decon() takes.
newFiles <- Seurat_Pre_Process(expressionFile, genesFile, clustersFile)

# Output files are written into `location` (write = TRUE) and tagged "cntl",
# the same tag used for every sample in this notebook.
results <- Main_Doublet_Decon(
  rawDataFile = newFiles$newExpressionFile,
  groupsFile = newFiles$newGroupsFile,
  filename = "cntl",
  location = location,
  fullDataFile = NULL,
  useFull = FALSE,
  removeCC = FALSE,
  species = "mmu",
  rhop = 1.1,
  PMF = TRUE,
  centroids = TRUE,
  num_doubs = 100,
  only50 = TRUE,
  min_uniq = 4,
  heatmap = FALSE,
  write = TRUE
)

In [None]:
# Export the three text files read by DoubletDecon's Seurat_Pre_Process() for
# the NAc sample: expression matrix, per-cluster marker genes, and the cluster
# label of every cell.

# Expression values from the `data` slot of the RNA assay, written with the
# gene names in a leading "GENE" column.
counts <- as.matrix(VTA_NAc@assays$RNA@data)
write.table(
  data.frame("GENE" = rownames(counts), counts),
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/NAc/counts.txt",
  row.names = FALSE,
  sep = "\t"
)

markers <- FindAllMarkers(object = VTA_NAc, only.pos = TRUE, min.pct = 0.25)

# top_n() without `wt` ranks by the LAST column of its input, which for
# FindAllMarkers() output is the gene name, so the "top 50" would be an
# alphabetical cut. Rank explicitly by log fold-change instead; the column is
# `avg_logFC` in Seurat v3 and `avg_log2FC` from Seurat v4 on.
fc_col <- intersect(c("avg_log2FC", "avg_logFC"), colnames(markers))
stopifnot(length(fc_col) >= 1)
top_50 <- markers %>%
  group_by(cluster) %>%
  top_n(50, wt = .data[[fc_col[1]]])
write.table(
  data.frame("test" = as.character(rownames(top_50)), top_50),
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/NAc/Top50Genes.txt",
  row.names = FALSE,
  col.names = c("", colnames(top_50)),
  sep = "\t",
  eol = "\n"
)

# One row per cell: barcode and cluster identity. as.matrix() on the identity
# factor already yields a character matrix with the barcodes as row names, so
# no further conversion is needed.
cluster <- as.matrix(Idents(object = VTA_NAc))
cluster <- data.frame("x" = rownames(cluster), cluster)
write.table(
  cluster,
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/NAc/Cluster.txt",
  row.names = FALSE,
  col.names = c("", "x"),
  sep = "\t",
  eol = "\n"
)

In [None]:
# Run DoubletDecon on the NAc sample, using the counts / marker / cluster text
# files found in `location`.
library("DoubletDecon")

location <- "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/NAc/" #Update as needed
expressionFile <- paste0(location, "counts.txt")
genesFile <- paste0(location, "Top50Genes.txt")
clustersFile <- paste0(location, "Cluster.txt")

# Convert the Seurat exports into the inputs Main_Doublet_Decon() takes.
newFiles <- Seurat_Pre_Process(expressionFile, genesFile, clustersFile)

# Output files are written into `location` (write = TRUE) and tagged "cntl".
# NOTE(review): rhop is 1.5 for this sample, whereas the YFP, LH and PFC runs
# in this notebook use 1.1 -- confirm this is intentional.
results <- Main_Doublet_Decon(
  rawDataFile = newFiles$newExpressionFile,
  groupsFile = newFiles$newGroupsFile,
  filename = "cntl",
  location = location,
  fullDataFile = NULL,
  useFull = FALSE,
  removeCC = FALSE,
  species = "mmu",
  rhop = 1.5,
  PMF = TRUE,
  centroids = TRUE,
  num_doubs = 100,
  only50 = TRUE,
  min_uniq = 4,
  heatmap = FALSE,
  write = TRUE
)

In [None]:
# Export the three text files read by DoubletDecon's Seurat_Pre_Process() for
# the PFC sample: expression matrix, per-cluster marker genes, and the cluster
# label of every cell.

# Expression values from the `data` slot of the RNA assay, written with the
# gene names in a leading "GENE" column.
counts <- as.matrix(VTA_PFC@assays$RNA@data)
write.table(
  data.frame("GENE" = rownames(counts), counts),
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/PFC/counts.txt",
  row.names = FALSE,
  sep = "\t"
)

markers <- FindAllMarkers(object = VTA_PFC, only.pos = TRUE, min.pct = 0.25)

# top_n() without `wt` ranks by the LAST column of its input, which for
# FindAllMarkers() output is the gene name, so the "top 50" would be an
# alphabetical cut. Rank explicitly by log fold-change instead; the column is
# `avg_logFC` in Seurat v3 and `avg_log2FC` from Seurat v4 on.
fc_col <- intersect(c("avg_log2FC", "avg_logFC"), colnames(markers))
stopifnot(length(fc_col) >= 1)
top_50 <- markers %>%
  group_by(cluster) %>%
  top_n(50, wt = .data[[fc_col[1]]])
write.table(
  data.frame("test" = as.character(rownames(top_50)), top_50),
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/PFC/Top50Genes.txt",
  row.names = FALSE,
  col.names = c("", colnames(top_50)),
  sep = "\t",
  eol = "\n"
)

# One row per cell: barcode and cluster identity. as.matrix() on the identity
# factor already yields a character matrix with the barcodes as row names, so
# no further conversion is needed.
cluster <- as.matrix(Idents(object = VTA_PFC))
cluster <- data.frame("x" = rownames(cluster), cluster)
write.table(
  cluster,
  file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/PFC/Cluster.txt",
  row.names = FALSE,
  col.names = c("", "x"),
  sep = "\t",
  eol = "\n"
)

In [None]:
# Run DoubletDecon on the PFC sample, using the counts / marker / cluster text
# files found in `location`.
library("DoubletDecon")

location <- "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing/PFC/" #Update as needed
expressionFile <- paste0(location, "counts.txt")
genesFile <- paste0(location, "Top50Genes.txt")
clustersFile <- paste0(location, "Cluster.txt")

# Convert the Seurat exports into the inputs Main_Doublet_Decon() takes.
newFiles <- Seurat_Pre_Process(expressionFile, genesFile, clustersFile)

# Output files are written into `location` (write = TRUE) and tagged "cntl",
# the same tag used for every sample in this notebook.
results <- Main_Doublet_Decon(
  rawDataFile = newFiles$newExpressionFile,
  groupsFile = newFiles$newGroupsFile,
  filename = "cntl",
  location = location,
  fullDataFile = NULL,
  useFull = FALSE,
  removeCC = FALSE,
  species = "mmu",
  rhop = 1.1,
  PMF = TRUE,
  centroids = TRUE,
  num_doubs = 100,
  only50 = TRUE,
  min_uniq = 4,
  heatmap = FALSE,
  write = TRUE
)

## Checking estimated doublet rates

In [3]:
# Rebuild the eYFP object from the raw matrix (same barcode renaming as in the
# QC section; no count/mito filter is applied here).
VTA_YFP.data <- Read10X(
  data.dir = "D:/scRNAseq/30-453842648/01_analysis/cellranger_count/YFP/raw_feature_bc_matrix"
)
colnames(VTA_YFP.data) <- paste0(colnames(VTA_YFP.data), "VTA_YFP")
VTA_YFP <- CreateSeuratObject(
  counts = VTA_YFP.data,
  project = "VTA_seq",
  min.cells = 3,
  min.features = 200
)
new_barcodes <- gsub("-1", "", colnames(VTA_YFP))
VTA_YFP <- RenameCells(VTA_YFP, new.names = new_barcodes)
VTA_YFP@meta.data$stim <- "VTA_YFP"

# Barcodes DoubletDecon classified as singlets / doublets (row names of its
# "Final_*_groups" tables).
VTA_YFP_clean <- rownames(
  read.table(file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing_iter1/YFP/Final_nondoublets_groups_cntl.txt")
)
VTA_YFP_doublet <- rownames(
  read.table(file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing_iter1/YFP/Final_doublets_groups_cntl.txt")
)

# Estimated doublet rate in percent of all classified cells.
doubletrate_VTA_YFP <- 100 * length(VTA_YFP_doublet) /
  length(c(VTA_YFP_clean, VTA_YFP_doublet))
doubletrate_VTA_YFP

# Disabled leftover (refers to `AH_clean`, which is not defined in the visible
# cells): after DoubletDecon the "-" in the cell barcodes had turned into "."
# and had to be changed back to "-":
#AH_clean<-gsub("\\.","-",AH_clean)

# Keep only the singlets.
VTA_YFP <- subset(x = VTA_YFP, cells = VTA_YFP_clean)

In [5]:
# Rebuild the LH object from the raw matrix (same barcode renaming as in the
# QC section; no count/mito filter is applied here).
VTA_LH.data <- Read10X(
  data.dir = "D:/scRNAseq/30-573274809/01_analysis/cellranger_count/LH/raw_feature_bc_matrix"
)
colnames(VTA_LH.data) <- paste0(colnames(VTA_LH.data), "VTA_LH")
VTA_LH <- CreateSeuratObject(
  counts = VTA_LH.data,
  project = "VTA_seq",
  min.cells = 3,
  min.features = 200
)
new_barcodes <- gsub("-1", "", colnames(VTA_LH))
VTA_LH <- RenameCells(VTA_LH, new.names = new_barcodes)
VTA_LH@meta.data$stim <- "VTA_LH"

# Barcodes DoubletDecon classified as singlets / doublets (row names of its
# "Final_*_groups" tables).
VTA_LH_clean <- rownames(
  read.table(file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing_iter1/LH/Final_nondoublets_groups_cntl.txt")
)
VTA_LH_doublet <- rownames(
  read.table(file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing_iter1/LH/Final_doublets_groups_cntl.txt")
)

# Estimated doublet rate in percent of all classified cells.
doubletrate_VTA_LH <- 100 * length(VTA_LH_doublet) /
  length(c(VTA_LH_clean, VTA_LH_doublet))
doubletrate_VTA_LH

# Disabled leftover (refers to `AH_clean`, which is not defined in the visible
# cells): after DoubletDecon the "-" in the cell barcodes had turned into "."
# and had to be changed back to "-":
#AH_clean<-gsub("\\.","-",AH_clean)

# Keep only the singlets.
VTA_LH <- subset(x = VTA_LH, cells = VTA_LH_clean)

In [7]:
# Rebuild the NAc object from the raw matrix (same barcode renaming as in the
# QC section; no count/mito filter is applied here).
VTA_NAc.data <- Read10X(
  data.dir = "D:/scRNAseq/30-573274809/01_analysis/cellranger_count/NAc/raw_feature_bc_matrix"
)
colnames(VTA_NAc.data) <- paste0(colnames(VTA_NAc.data), "VTA_NAc")
VTA_NAc <- CreateSeuratObject(
  counts = VTA_NAc.data,
  project = "VTA_seq",
  min.cells = 3,
  min.features = 200
)
new_barcodes <- gsub("-1", "", colnames(VTA_NAc))
VTA_NAc <- RenameCells(VTA_NAc, new.names = new_barcodes)
VTA_NAc@meta.data$stim <- "VTA_NAc"

# Barcodes DoubletDecon classified as singlets / doublets (row names of its
# "Final_*_groups" tables).
VTA_NAc_clean <- rownames(
  read.table(file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing_iter1/NAc/Final_nondoublets_groups_cntl.txt")
)
VTA_NAc_doublet <- rownames(
  read.table(file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing_iter1/NAc/Final_doublets_groups_cntl.txt")
)

# Estimated doublet rate in percent of all classified cells.
doubletrate_VTA_NAc <- 100 * length(VTA_NAc_doublet) /
  length(c(VTA_NAc_clean, VTA_NAc_doublet))
doubletrate_VTA_NAc

# Disabled leftover (refers to `AH_clean`, which is not defined in the visible
# cells): after DoubletDecon the "-" in the cell barcodes had turned into "."
# and had to be changed back to "-":
#AH_clean<-gsub("\\.","-",AH_clean)

# Keep only the singlets.
VTA_NAc <- subset(x = VTA_NAc, cells = VTA_NAc_clean)

In [9]:
# Rebuild the PFC object from the raw matrix (same barcode renaming as in the
# QC section; no count/mito filter is applied here).
VTA_PFC.data <- Read10X(
  data.dir = "D:/scRNAseq/30-573274809/01_analysis/cellranger_count/PFC/raw_feature_bc_matrix"
)
colnames(VTA_PFC.data) <- paste0(colnames(VTA_PFC.data), "VTA_PFC")
VTA_PFC <- CreateSeuratObject(
  counts = VTA_PFC.data,
  project = "VTA_seq",
  min.cells = 3,
  min.features = 200
)
new_barcodes <- gsub("-1", "", colnames(VTA_PFC))
VTA_PFC <- RenameCells(VTA_PFC, new.names = new_barcodes)
VTA_PFC@meta.data$stim <- "VTA_PFC"

# Barcodes DoubletDecon classified as singlets / doublets (row names of its
# "Final_*_groups" tables).
VTA_PFC_clean <- rownames(
  read.table(file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing_iter1/PFC/Final_nondoublets_groups_cntl.txt")
)
VTA_PFC_doublet <- rownames(
  read.table(file = "/Users/stuberadmin/Documents/scRNAseq/Marta_VTA/Doublet_processing_iter1/PFC/Final_doublets_groups_cntl.txt")
)

# Estimated doublet rate in percent of all classified cells.
doubletrate_VTA_PFC <- 100 * length(VTA_PFC_doublet) /
  length(c(VTA_PFC_clean, VTA_PFC_doublet))
doubletrate_VTA_PFC

# Keep only the singlets.
VTA_PFC <- subset(x = VTA_PFC, cells = VTA_PFC_clean)