# Shotgun

In [3]:
# Libraries
library(tidyverse)
library(ROBITools)
library(reshape2)
library(vegan)
library(ggalt)
library(ggpubr)
library(ggrepel)

In [4]:
# Datasets
# Read the tab-delimited LCA count table, then keep the rows whose
# superkingdom is "Eukaryota" as a separate table.
shotgun_taxa_count <- read.delim("GenomeDK_LCA/counts.lca.rarefy.tsv")
shotgun_eu <- filter(shotgun_taxa_count, superkingdom == "Eukaryota")

In [None]:
# Plot palette: five colours, each repeated three times in a row (15 entries).
# NOTE(review): presumably five sample groups of three replicates -- confirm
# against the order of the count columns.
col <- rep(
  c("#F8766D", "#B79F00", "#00BF7D", "#00B0F6", "#E76BF3"),
  each = 3
)

**Rarefaction**

In [None]:
# All identified taxa rarecurve
# Columns 9-23 are used as the count columns (presumably one per sample --
# confirm against the input table). After transposing, those columns become
# the rows and every row of the input table becomes a column.
sc <- t(shotgun_taxa_count[, 9:23])
# Give the columns synthetic names tax1..taxN. seq_len() keeps the assignment
# valid even when the input table has no rows (1:0 would yield two names).
colnames(sc) <- paste0("tax", seq_len(ncol(sc)))

In [None]:
# Rarefaction curves over every identified taxon, written to a PNG file.
# Caveat: this plot is only meaningful if the taxonomic identifications
# themselves can be trusted.
png(
  filename = "GenomeDK_LCA/rarefied_curve.all.png",
  width = 2000,
  height = 2000,
  res = 300
)
rarecurve(sc, step = 20, col = col, cex = 0.6)
dev.off()

In [None]:
# Phylum rarecurve
# Build a count matrix with one row per count column (columns 9-23) and one
# column per phylum: counts of all rows sharing a phylum are summed, and rows
# with a missing phylum are discarded.
sc_phyl <- shotgun_taxa_count[, c(3, 9:23)] %>%
  # Name the id column explicitly instead of letting melt() guess it.
  melt(id.vars = "phylum") %>%
  group_by(phylum, variable) %>%
  summarise(value = sum(value)) %>%
  # summarise() leaves the result grouped by phylum; drop the grouping
  # before reshaping.
  ungroup() %>%
  drop_na(phylum) %>%
  # Name the value column explicitly instead of letting dcast() guess it.
  dcast(variable ~ phylum, value.var = "value")
# Move the former column names into the row names, then drop that column.
rownames(sc_phyl) <- sc_phyl$variable
# drop = FALSE keeps a data frame (with its row and column names) even when
# only a single phylum column remains.
sc_phyl <- as.matrix(sc_phyl[, -1, drop = FALSE])

In [None]:
# Rarefaction curves computed on the phylum-level count matrix (rows with a
# missing phylum were already removed), written to a PNG file.
png(
  filename = "GenomeDK_LCA/rarefied_curve.phyla_noNA.png",
  width = 2000,
  height = 2000,
  res = 300
)
rarecurve(sc_phyl, step = 20, col = col, cex = 0.6, ylab = "Phylum")
dev.off()

**Accumulation**

In [None]:
# Phylum
# Accumulation of phyla over samples, computed two ways on the same matrix:
# the "exact" result is drawn as a line with a filled confidence polygon and
# the "random" result is overlaid on the same axes as boxplots.
accum <- specaccum(
  sc_phyl,
  method = "exact",
  permutations = 100,
  conditioned = TRUE,
  gamma = "jack1",
  w = NULL
)
# NOTE(review): no seed is set in this cell, so the "random" result (and the
# boxplots drawn from it) may differ between runs -- confirm whether a seed
# is set elsewhere.
accum2 <- specaccum(sc_phyl, method = "random")

png(
  filename = "GenomeDK_LCA/accum_curve.phyla_noNA.png",
  width = 2000,
  height = 2000,
  res = 300
)
plot(
  accum,
  ci.type = "poly",
  col = "black",
  lwd = 2,
  ci.lty = 0,
  ci.col = "royalblue",
  xlab = "No. of samples",
  ylab = "No. of Phyla",
  main = "Shotgun"
)
boxplot(accum2, col = "gray", add = TRUE, pch = "+")
dev.off()