# RNA-sequencing Data Visualisation

*Science Park Study Group (07/05/19)* 
<span style="font-size:smaller;"><span style="font-size:smaller;">Fred White &amp; Susanne Wilken</span></span>

In [None]:
# Install the packages this notebook needs, skipping any already available so
# that re-running the cell does not reinstall everything.
cran_packages <- c("ggplot2", "pheatmap")
missing_cran <- cran_packages[
  !vapply(cran_packages, requireNamespace, logical(1), quietly = TRUE)
]
if (length(missing_cran) > 0) {
  # An explicit mirror avoids the "no CRAN mirror set" failure in
  # non-interactive kernels.
  install.packages(missing_cran, repos = "https://cloud.r-project.org/")
}

# DESeq2 lives on Bioconductor. The old biocLite.R installer script was
# retired with Bioconductor 3.8; BiocManager is its replacement.
if (!requireNamespace("BiocManager", quietly = TRUE)) {
  install.packages("BiocManager", repos = "https://cloud.r-project.org/")
}
if (!requireNamespace("DESeq2", quietly = TRUE)) {
  BiocManager::install("DESeq2")
}

## Part 1 Preprocessing

In [None]:
# Attach the plotting and differential-expression packages.
library(ggplot2)
# DESeq2 prints many start-up messages from its dependencies; silence them.
suppressMessages(library(DESeq2, quietly = TRUE))

In [None]:
# Read the tab-separated count table (first row is the header).
# Local alternative:
#counts <- read.table("C:/Users/world/RNAvis/counts.txt", header = TRUE)
counts <- read.table(
  "https://raw.githubusercontent.com/Fred-White94/RNAseqDataVis/master/data/counts.txt",
  sep = "\t",
  header = TRUE
)


In [None]:
# Peek at the top-left 5 x 5 corner of the count table.
counts[seq_len(5), seq_len(5)]

In [None]:
# Number of rows and columns in the count table.
dim(counts)

In [None]:
# First rows of the count table, all columns.
head(counts)

In [None]:
# Sample sheet: three control and three drought libraries. The row order
# matters because SampleName is later used to label the count columns.
conditions <- c("Control", "Drought")
sampleinfo <- data.frame(
  SampleName = paste(rep(conditions, each = 3), 1:3, sep = "_"),
  Condition = rep(conditions, each = 3),
  stringsAsFactors = FALSE
)
rm(conditions)

In [None]:
# Display the sample sheet.
sampleinfo

## Part 2 DESeq2 and PCA plot

### PCA

In [None]:
# Take columns 7 to 12 of the count table as the six per-sample count columns
# and label them with the sample names from the sample sheet.
counts4DE <- setNames(counts[, 7:12], sampleinfo[["SampleName"]])

In [None]:
# First rows of the per-sample count matrix.
head(counts4DE)

In [None]:
# PCA with samples as observations (hence the transpose) and genes as
# variables; each gene is centred but not scaled.
# NOTE(review): this runs on raw counts, so highly expressed genes dominate
# the components - consider a log or variance-stabilised matrix instead.
PCD <- prcomp(t(counts4DE), center = TRUE)

In [None]:
# Scatter of the first two principal components, one filled point per sample,
# coloured by condition.
plot(
  x = PCD$x,
  pch = 20,
  col = factor(sampleinfo$Condition)
)

In [None]:
# Bundle the count matrix, the sample sheet and the design (expression
# modelled as a function of Condition) into a DESeq2 data set.
DES <- DESeqDataSetFromMatrix(
  countData = counts4DE,
  colData = sampleinfo,
  design = ~ Condition
)

In [None]:
# Display a summary of the DESeq2 data set.
DES

In [None]:
# Run the DESeq2 pipeline (size factors, dispersion estimates, model fit and
# testing). parallel = TRUE hands the work to the registered BiocParallel
# backend.
DES <- DESeq(DES, parallel = TRUE)

In [None]:
# Extract the results table for the Condition factor. The contrast is
# c(factor, numerator, denominator), so log2 fold changes are Control
# relative to Drought (positive = higher in Control).
res <- results(
  object = DES,
  contrast = c("Condition", "Control", "Drought")
)

In [None]:
# Display the results table.
res

In [None]:
# Number of genes that received an adjusted p-value (padj is not NA).
sum(!is.na(res$padj))

In [None]:
# Diagnostic plot of the dispersion estimates from the fitted data set.
plotDispEsts(DES)

In [None]:
# MA plot of the Control vs Drought results, with a descriptive title.
plotMA(res, main = "Control and Drought Differences in Gene Expression")

In [None]:
# Prepend the gene identifiers to the results table. The new column is
# referred to by later cells as `counts$Geneid` (the text of the argument),
# so that name must not change. This relies on the rows of res being in the
# same order as the rows of counts, which holds because res was derived from
# counts[, 7:12] without any reordering.
# NOTE: re-running this cell adds another identifier column each time.
res <- cbind(counts$Geneid, res)

In [None]:
# Sort genes by adjusted p-value, smallest first; rows with an NA padj are
# placed at the end. Then show the top of the sorted table.
resordered <- res[order(res$padj, na.last = TRUE), ]
head(resordered, n = 6L)



**_Remove all genes whose adjusted p-value is NA_**

In [None]:
# Keep only the rows that have an adjusted p-value, then report how many
# genes (rows) and columns remain.
resordered <- resordered[complete.cases(resordered$padj), ]
dim(resordered)

In [None]:
# Install pheatmap from CRAN only if it is not already available, so that
# re-running the notebook does not reinstall it every time.
if (!requireNamespace("pheatmap", quietly = TRUE)) {
  install.packages("pheatmap", repos = "https://cloud.r-project.org/")
}

In [None]:
# Attach pheatmap for the clustered heatmap drawn at the end.
library(pheatmap)

In [None]:
# Size of the count table restricted to genes that have an adjusted p-value.
dim(counts[counts$Geneid %in% resordered[["counts$Geneid"]], ])

In [None]:
# Rows of the count table for genes that have an adjusted p-value, followed
# by the dimensions of that subset.
FC <- counts[counts$Geneid %in% resordered[["counts$Geneid"]], ]
dim(FC)

In [None]:
# First rows of the filtered count table.
head(FC)

In [None]:
# Display the sorted, NA-free results table.
resordered


In [None]:
# Count-table rows for the 25 genes with the smallest adjusted p-values
# (resordered is sorted by padj). Rows stay in the order they have in counts.
FCf <- counts[counts$Geneid %in% resordered[1:25, ][["counts$Geneid"]], ]
dim(FCf)

In [None]:
# FCf still carries every column of `counts`, whose six per-sample count
# columns are 7 to 12 (the same columns used to build counts4DE). The heatmap
# cells below read columns 2:7, so first reduce FCf to the gene identifier
# followed by those six count columns; otherwise columns 2:7 would be
# whatever annotation columns sit between the identifier and the counts.
# NOTE(review): assumes counts.txt keeps its sample counts in columns 7:12 -
# confirm against the file.
# The width check makes the cell safe to re-run after FCf has been reduced.
if (ncol(FCf) >= 12) {
  FCf <- cbind(FCf["Geneid"], FCf[, 7:12])
}
colnames(FCf)[2:7] <- sampleinfo$SampleName
head(FCf)

In [None]:
# Use the gene identifiers as row names so they label the heatmap rows.
row.names(FCf) <- FCf[["Geneid"]]

In [None]:
# Z-score each gene across samples: scale() works column-wise, so transpose
# to put genes in columns, centre and scale them, then transpose back to
# genes x samples.
ScaledCounts <- t(scale(t(FCf[, 2:7]), scale = TRUE))

In [None]:
# Clustered heatmap of the per-gene scaled counts (genes in rows, samples in
# columns).
pheatmap(ScaledCounts)