##### Steps for reading in dataset (following download), initial QC, dim reduction/clustering and saving out the myeloid cluster for **GSE184880**

File previously downloaded:
GSE184880_RAW.tar

The archive was extracted using:
``` bash
tar -xvf GSE184880_RAW.tar
```

This gives the following files: 
* GSM5599220_Norm1.barcodes.tsv.gz
* GSM5599220_Norm1.genes.tsv.gz
* GSM5599220_Norm1.matrix.mtx.gz
* GSM5599221_Norm2.barcodes.tsv.gz
* GSM5599221_Norm2.genes.tsv.gz
* GSM5599221_Norm2.matrix.mtx.gz
* GSM5599222_Norm3.barcodes.tsv.gz
* GSM5599222_Norm3.genes.tsv.gz
* GSM5599222_Norm3.matrix.mtx.gz
* GSM5599223_Norm4.barcodes.tsv.gz
* GSM5599223_Norm4.genes.tsv.gz
* GSM5599223_Norm4.matrix.mtx.gz
* GSM5599224_Norm5.barcodes.tsv.gz
* GSM5599224_Norm5.genes.tsv.gz
* GSM5599224_Norm5.matrix.mtx.gz
* GSM5599225_Cancer1.barcodes.tsv.gz
* GSM5599225_Cancer1.genes.tsv.gz
* GSM5599225_Cancer1.matrix.mtx.gz
* GSM5599226_Cancer2.barcodes.tsv.gz
* GSM5599226_Cancer2.genes.tsv.gz
* GSM5599226_Cancer2.matrix.mtx.gz
* GSM5599227_Cancer3.barcodes.tsv.gz
* GSM5599227_Cancer3.genes.tsv.gz
* GSM5599227_Cancer3.matrix.mtx.gz
* GSM5599228_Cancer4.barcodes.tsv.gz
* GSM5599228_Cancer4.genes.tsv.gz
* GSM5599228_Cancer4.matrix.mtx.gz
* GSM5599229_Cancer5.barcodes.tsv.gz
* GSM5599229_Cancer5.genes.tsv.gz
* GSM5599229_Cancer5.matrix.mtx.gz
* GSM5599230_Cancer6.barcodes.tsv.gz
* GSM5599230_Cancer6.genes.tsv.gz
* GSM5599230_Cancer6.matrix.mtx.gz
* GSM5599231_Cancer7.barcodes.tsv.gz
* GSM5599231_Cancer7.genes.tsv.gz
* GSM5599231_Cancer7.matrix.mtx.gz

Files were then organised into separate folders, one per sample, and renamed to the standard 10x file names (barcodes.tsv.gz, genes.tsv.gz, matrix.mtx.gz).

In [1]:
# Set the working directory to the GSE184880 data folder.
# getwd() is called before and after so the change is visible in the output.
getwd()
setwd("/scratch/user/s4436039/scdata/GSE184880")
getwd()

In [2]:
#Load packages
library(dplyr)
library(Seurat)
library(patchwork)


Attaching package: ‘dplyr’


The following objects are masked from ‘package:stats’:

    filter, lag


The following objects are masked from ‘package:base’:

    intersect, setdiff, setequal, union


“package ‘Seurat’ was built under R version 4.3.2”
Loading required package: SeuratObject

Loading required package: sp

“package ‘sp’ was built under R version 4.3.2”

Attaching package: ‘SeuratObject’


The following object is masked from ‘package:base’:

    intersect


“package ‘patchwork’ was built under R version 4.3.2”


In [5]:
#load all datasets
# Each sample is read with Seurat's Read10X() from its own sub-folder of the
# dataset directory. The directory is defined once so that moving the data
# only requires changing a single line.
gse184880_dir <- "/scratch/user/s4436039/scdata/GSE184880"

# Cancer1-Cancer7 samples
OC_Cancer1.data <- Read10X(data.dir = file.path(gse184880_dir, "Cancer1"))
OC_Cancer2.data <- Read10X(data.dir = file.path(gse184880_dir, "Cancer2"))
OC_Cancer3.data <- Read10X(data.dir = file.path(gse184880_dir, "Cancer3"))
OC_Cancer4.data <- Read10X(data.dir = file.path(gse184880_dir, "Cancer4"))
OC_Cancer5.data <- Read10X(data.dir = file.path(gse184880_dir, "Cancer5"))
OC_Cancer6.data <- Read10X(data.dir = file.path(gse184880_dir, "Cancer6"))
OC_Cancer7.data <- Read10X(data.dir = file.path(gse184880_dir, "Cancer7"))

# Norm1-Norm5 samples
OC_Norm1.data <- Read10X(data.dir = file.path(gse184880_dir, "Norm1"))
OC_Norm2.data <- Read10X(data.dir = file.path(gse184880_dir, "Norm2"))
OC_Norm3.data <- Read10X(data.dir = file.path(gse184880_dir, "Norm3"))
OC_Norm4.data <- Read10X(data.dir = file.path(gse184880_dir, "Norm4"))
OC_Norm5.data <- Read10X(data.dir = file.path(gse184880_dir, "Norm5"))

In [9]:
# Show the first six column names of the Cancer1 data as loaded,
# i.e. before any dataset/sample prefix is added.
head(colnames(OC_Cancer1.data), n = 6L)

In [11]:
#Add dataset info to colnames
# Every column name is prefixed with "<dataset>_<sample>_" so that names stay
# unique and traceable once the samples are combined.

# Return `counts` with `prefix` prepended to each column name.
#
# counts: object with character column names (here, the Read10X() output).
# prefix: single string to prepend, e.g. "GSE184880_Cancer1_".
#
# Names that already start with `prefix` are left untouched, so re-running
# this notebook cell does not stack the prefix a second time.
add_sample_prefix <- function(counts, prefix) {
  barcodes <- colnames(counts)
  if (!is.character(barcodes)) {
    stop("`counts` has no column names to prefix", call. = FALSE)
  }
  # is.na() keeps the mask free of NA so it is safe to use for indexing.
  needs_prefix <- is.na(barcodes) | !startsWith(barcodes, prefix)
  if (any(needs_prefix)) {
    barcodes[needs_prefix] <- paste0(prefix, barcodes[needs_prefix])
    colnames(counts) <- barcodes
  }
  counts
}

OC_Cancer1.data <- add_sample_prefix(OC_Cancer1.data, "GSE184880_Cancer1_")
OC_Cancer2.data <- add_sample_prefix(OC_Cancer2.data, "GSE184880_Cancer2_")
OC_Cancer3.data <- add_sample_prefix(OC_Cancer3.data, "GSE184880_Cancer3_")
OC_Cancer4.data <- add_sample_prefix(OC_Cancer4.data, "GSE184880_Cancer4_")
OC_Cancer5.data <- add_sample_prefix(OC_Cancer5.data, "GSE184880_Cancer5_")
OC_Cancer6.data <- add_sample_prefix(OC_Cancer6.data, "GSE184880_Cancer6_")
OC_Cancer7.data <- add_sample_prefix(OC_Cancer7.data, "GSE184880_Cancer7_")
OC_Norm1.data <- add_sample_prefix(OC_Norm1.data, "GSE184880_Norm1_")
OC_Norm2.data <- add_sample_prefix(OC_Norm2.data, "GSE184880_Norm2_")
OC_Norm3.data <- add_sample_prefix(OC_Norm3.data, "GSE184880_Norm3_")
OC_Norm4.data <- add_sample_prefix(OC_Norm4.data, "GSE184880_Norm4_")
OC_Norm5.data <- add_sample_prefix(OC_Norm5.data, "GSE184880_Norm5_")

In [12]:
# Show the first six column names of every sample to check the names.
# Kept as separate top-level expressions so each result is auto-printed.

# Cancer1-Cancer7 samples
head(colnames(OC_Cancer1.data), n = 6L)
head(colnames(OC_Cancer2.data), n = 6L)
head(colnames(OC_Cancer3.data), n = 6L)
head(colnames(OC_Cancer4.data), n = 6L)
head(colnames(OC_Cancer5.data), n = 6L)
head(colnames(OC_Cancer6.data), n = 6L)
head(colnames(OC_Cancer7.data), n = 6L)

# Norm1-Norm5 samples
head(colnames(OC_Norm1.data), n = 6L)
head(colnames(OC_Norm2.data), n = 6L)
head(colnames(OC_Norm3.data), n = 6L)
head(colnames(OC_Norm4.data), n = 6L)
head(colnames(OC_Norm5.data), n = 6L)