## Make SingleCellExperiment objects to use with scmap

In [6]:
library(scater)
library(SingleCellExperiment)
library(Matrix)

# MCA (Mouse Cell Atlas)

In [8]:
# Read the MCA count matrix (Matrix Market file) together with the tables
# holding its gene names and cell barcodes
molecules <- Matrix::readMM(file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/MCA/mca_mtx.mtx")
genenames <- read.table(file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/MCA/genes.tsv")
cellbarcodes <- read.table(file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/MCA/barcodes.tsv")

In [10]:
# Label the count matrix: cell barcodes on the columns, gene names on the rows
colnames(molecules) <- cellbarcodes[[1]]
rownames(molecules) <- genenames[[1]]

In [11]:
# Load the per-cell annotation table (tab-separated, no header row, so the
# columns are auto-named V1, V2, V3). V1 holds the cell barcode; V2 and V3 are
# used further down as cell type and tissue.
# `FALSE` is spelled out because `F` is an ordinary variable that can be
# reassigned.
ann <- read.csv(
  "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/MCA/annotation_for_r.tsv",
  header = FALSE,
  sep = "\t"
)

V1,V2,V3
Bladder_1.CCATCTAGCGAGTTTAGG,Stromal cell_Dpt high(Bladder),Bladder
Bladder_1.GAGGAGCGCTTGATACAG,Stromal cell_Car3 high(Bladder),Bladder
Bladder_1.CCAGACACAATAGAATTA,Vascular smooth muscle progenitor cell(Bladder),Bladder
Bladder_1.CCGACGGGACATATGGCG,Vascular endothelial cell(Bladder),Bladder
Bladder_1.TAGCATTCAAAGATTCCA,Urothelium(Bladder),Bladder
Bladder_1.CTCCATCCATCTTTTAGG,Smooth muscle cell(Bladder),Bladder


In [12]:
# Reorder the annotation rows so they follow the column (cell) order of the
# count matrix
ann_idx <- match(colnames(molecules), ann[, 1])
if (anyNA(ann_idx)) {
  # Barcodes missing from the annotation table would otherwise silently turn
  # into all-NA annotation rows; surface that without changing the result.
  warning(
    sum(is.na(ann_idx)),
    " cell barcode(s) have no entry in the annotation table",
    call. = FALSE
  )
}
ann_subset <- ann[ann_idx, ]
celltype <- ann_subset[, 2]
tissue <- ann_subset[, 3]

In [16]:
# Assemble the per-cell annotation table and key its rows by cell barcode
cell_anns <- data.frame(
  type = celltype,
  tissue = tissue
)
row.names(cell_anns) <- colnames(molecules)

In [17]:
# Preview the first rows of the annotation table (barcode row names, type, tissue)
head(cell_anns)

Unnamed: 0,type,tissue
Bladder_1.CCATCTAGCGAGTTTAGG,Stromal cell_Dpt high(Bladder),Bladder
Bladder_1.GAGGAGCGCTTGATACAG,Stromal cell_Car3 high(Bladder),Bladder
Bladder_1.CCAGACACAATAGAATTA,Vascular smooth muscle progenitor cell(Bladder),Bladder
Bladder_1.CCGACGGGACATATGGCG,Vascular endothelial cell(Bladder),Bladder
Bladder_1.TAGCATTCAAAGATTCCA,Urothelium(Bladder),Bladder
Bladder_1.CTCCATCCATCTTTTAGG,Smooth muscle cell(Bladder),Bladder


In [18]:
# Build the SingleCellExperiment for the MCA data.
# `molecules` is rebound to a dense base matrix here; it is converted only once,
# since calling as.matrix() again on an already dense matrix is redundant.
# NOTE(review): the dense matrix is large — confirm that downstream tools need
# a dense `counts` assay rather than the sparse Matrix object.
molecules <- as.matrix(molecules)
sce_mca <- SingleCellExperiment(
  assays = list(counts = molecules),
  colData = cell_anns
)

In [19]:
# Display the object summary (dimensions, assays, row/column names, colData names)
sce_mca

class: SingleCellExperiment 
dim: 39855 233994 
metadata(0):
assays(1): counts
rownames(39855): 0610007P14Rik 0610009B22Rik ... Krtap4-7 RP23-353P23.2
rowData names(0):
colnames(233994): Bladder_1.CCATCTAGCGAGTTTAGG
  Bladder_1.GAGGAGCGCTTGATACAG ... Uterus_2.AGTTTACCGACGGGGCGA
  Uterus_2.AATAAATGCGGAAGTTTA
colData names(2): type tissue
reducedDimNames(0):
spikeNames(0):

In [20]:
# Serialize the MCA SingleCellExperiment to an RDS file
saveRDS(
  object = sce_mca,
  file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/MCA/mca_sce.rds"
)

# TM (Tabula Muris) - 10X droplet

In [21]:
# Read the TM 10X (droplet) count matrix (Matrix Market file) together with the
# tables holding its gene names and cell barcodes
molecules <- Matrix::readMM(file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/TM/droplet/droplet_mtx.mtx")
genenames <- read.table(file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/TM/droplet/genes.tsv")
cellbarcodes <- read.table(file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/TM/droplet/barcodes.tsv")

In [23]:
# Label the count matrix: cell barcodes on the columns, gene names on the rows
colnames(molecules) <- cellbarcodes[[1]]
rownames(molecules) <- genenames[[1]]

In [24]:
# Load the per-cell annotation table (tab-separated, no header row, so the
# columns are auto-named V1, V2, V3). V1 holds the cell barcode; V2 and V3 are
# used further down as cell type and tissue.
# `FALSE` is spelled out because `F` is an ordinary variable that can be
# reassigned.
ann <- read.csv(
  "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/TM/droplet/annotation_for_r.tsv",
  header = FALSE,
  sep = "\t"
)

V1,V2,V3
10X_P4_0_AAACCTGAGATTACCC,basal cell of epidermis,Tongue
10X_P4_0_AAACCTGAGTGCCAGA,keratinocyte,Tongue
10X_P4_0_AAACCTGCAAATCCGT,keratinocyte,Tongue
10X_P4_0_AAACCTGGTAATCGTC,basal cell of epidermis,Tongue
10X_P4_0_AAACCTGGTCCAACTA,basal cell of epidermis,Tongue
10X_P4_0_AAACCTGGTGATAAAC,basal cell of epidermis,Tongue


In [25]:
# Reorder the annotation rows so they follow the column (cell) order of the
# count matrix
ann_idx <- match(colnames(molecules), ann[, 1])
if (anyNA(ann_idx)) {
  # Barcodes missing from the annotation table would otherwise silently turn
  # into all-NA annotation rows; surface that without changing the result.
  warning(
    sum(is.na(ann_idx)),
    " cell barcode(s) have no entry in the annotation table",
    call. = FALSE
  )
}
ann_subset <- ann[ann_idx, ]
celltype <- ann_subset[, 2]
tissue <- ann_subset[, 3]

In [27]:
# Assemble the per-cell annotation table and key its rows by cell barcode
cell_anns <- data.frame(
  type = celltype,
  tissue = tissue
)
row.names(cell_anns) <- colnames(molecules)

In [28]:
# Preview the first rows of the annotation table (barcode row names, type, tissue)
head(cell_anns)

Unnamed: 0,type,tissue
10X_P4_0_AAACCTGAGATTACCC,basal cell of epidermis,Tongue
10X_P4_0_AAACCTGAGTGCCAGA,keratinocyte,Tongue
10X_P4_0_AAACCTGCAAATCCGT,keratinocyte,Tongue
10X_P4_0_AAACCTGGTAATCGTC,basal cell of epidermis,Tongue
10X_P4_0_AAACCTGGTCCAACTA,basal cell of epidermis,Tongue
10X_P4_0_AAACCTGGTGATAAAC,basal cell of epidermis,Tongue


In [29]:
# Build the SingleCellExperiment for the TM 10X (droplet) data.
# `molecules` is rebound to a dense base matrix here; it is converted only once,
# since calling as.matrix() again on an already dense matrix is redundant.
# NOTE(review): the dense matrix is large — confirm that downstream tools need
# a dense `counts` assay rather than the sparse Matrix object.
molecules <- as.matrix(molecules)
sce_droplet <- SingleCellExperiment(
  assays = list(counts = molecules),
  colData = cell_anns
)

In [30]:
# Display the object summary (dimensions, assays, row/column names, colData names)
sce_droplet

class: SingleCellExperiment 
dim: 23433 70118 
metadata(0):
assays(1): counts
rownames(23433): 0610005C13Rik 0610007C21Rik ... l7Rn6
  zsGreen_transgene
rowData names(0):
colnames(70118): 10X_P4_0_AAACCTGAGATTACCC 10X_P4_0_AAACCTGAGTGCCAGA
  ... 10X_P8_15_TTTGTCATCTTACCGC 10X_P8_15_TTTGTCATCTTGTTTG
colData names(2): type tissue
reducedDimNames(0):
spikeNames(0):

In [31]:
# Serialize the TM 10X (droplet) SingleCellExperiment to an RDS file
saveRDS(
  object = sce_droplet,
  file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/TM/droplet/droplet_sce.rds"
)

# TM (Tabula Muris) - SS2 (Smart-seq2, FACS-sorted cells)

In [32]:
# Read the TM SS2 (facs) count matrix (Matrix Market file) together with the
# tables holding its gene names and cell barcodes
molecules <- Matrix::readMM(file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/TM/facs/facs_mtx.mtx")
genenames <- read.table(file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/TM/facs/genes.tsv")
cellbarcodes <- read.table(file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/TM/facs/barcodes.tsv")

In [34]:
# Label the count matrix: cell barcodes on the columns, gene names on the rows
colnames(molecules) <- cellbarcodes[[1]]
rownames(molecules) <- genenames[[1]]

In [35]:
# Load the per-cell annotation table (tab-separated, no header row, so the
# columns are auto-named V1, V2, V3). V1 holds the cell barcode; V2 and V3 are
# used further down as cell type and tissue.
# `FALSE` is spelled out because `F` is an ordinary variable that can be
# reassigned.
ann <- read.csv(
  "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/TM/facs/annotation_for_r.tsv",
  header = FALSE,
  sep = "\t"
)


V1,V2,V3
A1.B000126.3_39_F.1.1,epidermal cell,Skin
A1.B000127.3_38_F.1.1,endothelial cell,Fat
A1.B000167.3_56_F.1.1,basal cell,Mammary_Gland
A1.B000168.3_57_F.1.1,,Mammary_Gland
A1.B000412.3_56_F.1.1,endothelial cell,Heart
A1.B000610.3_56_F.1.1,bladder cell,Bladder


In [36]:
# Reorder the annotation rows so they follow the column (cell) order of the
# count matrix
ann_idx <- match(colnames(molecules), ann[, 1])
if (anyNA(ann_idx)) {
  # Barcodes missing from the annotation table would otherwise silently turn
  # into all-NA annotation rows; surface that without changing the result.
  warning(
    sum(is.na(ann_idx)),
    " cell barcode(s) have no entry in the annotation table",
    call. = FALSE
  )
}
ann_subset <- ann[ann_idx, ]
celltype <- ann_subset[, 2]
tissue <- ann_subset[, 3]

In [38]:
# Assemble the per-cell annotation table and key its rows by cell barcode
cell_anns <- data.frame(
  type = celltype,
  tissue = tissue
)
row.names(cell_anns) <- colnames(molecules)

In [39]:
# Preview the first rows of the annotation table (barcode row names, type, tissue)
head(cell_anns)

Unnamed: 0,type,tissue
A1.B000126.3_39_F.1.1,epidermal cell,Skin
A1.B000127.3_38_F.1.1,endothelial cell,Fat
A1.B000167.3_56_F.1.1,basal cell,Mammary_Gland
A1.B000168.3_57_F.1.1,,Mammary_Gland
A1.B000412.3_56_F.1.1,endothelial cell,Heart
A1.B000610.3_56_F.1.1,bladder cell,Bladder


In [40]:
# Build the SingleCellExperiment for the TM SS2 (facs) data.
# `molecules` is rebound to a dense base matrix here; it is converted only once,
# since calling as.matrix() again on an already dense matrix is redundant.
# NOTE(review): the dense matrix is large — confirm that downstream tools need
# a dense `counts` assay rather than the sparse Matrix object.
molecules <- as.matrix(molecules)
sce_facs <- SingleCellExperiment(
  assays = list(counts = molecules),
  colData = cell_anns
)

In [41]:
# Display the object summary (dimensions, assays, row/column names, colData names)
sce_facs

class: SingleCellExperiment 
dim: 23433 53760 
metadata(0):
assays(1): counts
rownames(23433): 0610005C13Rik 0610007C21Rik ... l7Rn6
  zsGreen_transgene
rowData names(0):
colnames(53760): A1.B000126.3_39_F.1.1 A1.B000127.3_38_F.1.1 ...
  P9.MAA001892.3_38_F.1.1 P9.MAA001894.3_39_F.1.1
colData names(2): type tissue
reducedDimNames(0):
spikeNames(0):

In [42]:
# Serialize the TM SS2 (facs) SingleCellExperiment to an RDS file
saveRDS(
  object = sce_facs,
  file = "/gpfs/gss1/work/sduknn/Andreas/TM_MCA/TM/facs/facs_sce.rds"
)