In [None]:
library(ggplot2)
library(nlme)

In [None]:
# Load the per-strain table (tab-separated, with a header row).
df <- read.table(file = "cellsize_genomesize.Rin", header = TRUE, sep = "\t")
# Alternative ploidy level ordering, kept for reference:
#df$ploidy <- factor(df$ploidy, levels=c('haploid','unknown low het', 'diploid', 'diploid high het','polyploid'))
# Fix the level order of `type`; any value outside these four levels becomes NA.
df[["type"]] <- factor(df[["type"]], levels = c("A", "B", "C", "Unknown"))
# Three-column subset (strain, type, mbp) of the table.
typedf <- df[, c("strain", "type", "mbp")]
head(df)

In [None]:
# Scatter plot of `mbp` against `median`, one facet per `type`, with a
# per-facet linear fit and the strain name printed on each point.
gg <- ggplot(data = df, aes(x = median, y = mbp, color = type)) +
  geom_point(size = 7) +
  # `formula` is spelled out (it is the default for method = "lm") so the fit
  # is explicit and ggplot2 does not print its "using formula" message.
  geom_smooth(method = "lm", formula = y ~ x, alpha = 0.15, aes(fill = type)) +
  # The label is mapped through aes() so each label is taken from the same
  # row as its point, instead of relying on the row order of an external
  # vector (df$strain) matching the layer data after faceting.
  geom_text(aes(label = strain), size = 4, color = "#000000") +
  facet_grid(. ~ type, scales = "free") +
  theme_classic() +
  # color and fill both encode `type`; giving them the same title lets
  # ggplot2 merge them into one legend. The former `shape` label and
  # scale_shape_manual() were dropped because no layer maps shape.
  labs(
    x = "Cell volume (um^3)",
    y = "DNA content (Mbp)",
    color = "Prymnesin type",
    fill = "Prymnesin type"
  ) +
  theme(text = element_text(size = 20)) +
  scale_color_manual(values = c("#d95f02", "#7570b3", "#1b9e77", "#000000")) +
  scale_fill_manual(values = c("#d95f02", "#7570b3", "#1b9e77", "#000000"))
# Optional tweaks, disabled:
# gg <- gg + scale_y_continuous(breaks = seq(0, 900, 100))
# gg <- gg + xlim(50, 140)
# gg <- gg + theme(legend.key.size = unit(0.2, "cm"))
# gg <- gg + theme(legend.key.width = unit(0.3, "cm"))
gg

In [None]:
# Save a 10 x 4 inch PDF; no `plot` is given, so ggsave() writes the last plot.
ggsave(
  filename = "cellsize_genomesize_type.pdf",
  device = "pdf",
  width = 10,
  height = 4,
  units = "in"
)

In [None]:
# Keep only rows whose ploidy is below 3 (subset() also drops rows where the
# comparison is NA). NOTE(review): assumes `ploidy` is numeric -- confirm.
subdf <- subset(df, ploidy < 3)

# Scatter plot of `mbp` against `median`, one facet per ploidy value, with a
# per-facet linear fit and the strain name printed on each point.
gg <- ggplot(data = subdf, aes(x = median, y = mbp, color = factor(ploidy))) +
  geom_point(size = 7) +
  # `formula` is spelled out (it is the default for method = "lm") so the fit
  # is explicit and ggplot2 does not print its "using formula" message.
  geom_smooth(method = "lm", formula = y ~ x, alpha = 0.15) +
  # The label is mapped through aes() so each label is taken from the same
  # row as its point, instead of relying on the row order of an external
  # vector (subdf$strain) matching the layer data after faceting.
  geom_text(aes(label = strain), size = 4, color = "#000000") +
  facet_grid(. ~ factor(ploidy), scales = "free") +
  theme_classic() +
  # Colour encodes ploidy here, so the legend is titled accordingly (it was
  # previously titled "Prymnesin type"). The `shape` label and the fill/shape
  # manual scales were dropped because no layer maps fill or shape.
  labs(
    x = "Cell volume (um^3)",
    y = "DNA content (Mbp)",
    color = "Proposed ploidy"
  ) +
  theme(text = element_text(size = 20)) +
  scale_color_manual(values = c("#d95f02", "#7570b3", "#1b9e77", "#000000"))
# Optional tweaks, disabled:
# gg <- gg + scale_y_continuous(breaks = seq(0, 900, 100))
# gg <- gg + xlim(50, 140)
# gg <- gg + theme(legend.key.size = unit(0.2, "cm"))
# gg <- gg + theme(legend.key.width = unit(0.3, "cm"))
gg

In [None]:
# Save a 10 x 4 inch PDF; no `plot` is given, so ggsave() writes the last plot.
ggsave(
  filename = "cellsize_genomesize_ploidy.pdf",
  device = "pdf",
  width = 10,
  height = 4,
  units = "in"
)

In [None]:
# Load the cell-volume table (tab-separated, with a header row).
bigdf <- read.table(
  file = "../../../figshare/cell_size/cell_volume.txt",
  header = TRUE,
  sep = "\t"
)
# Impose an explicit strain order; strains not listed here become NA.
bigdf[["strain"]] <- factor(
  bigdf[["strain"]],
  levels = c(
    "12B1", "UTEX2797", "CCMP3037", "12A1", "CCMP2941",
    "RCC3703", "K0081", "K0374", "RCC3426", "KAC39",
    "K0252", "RCC191", "RCC1433", "UTEX995", "RCC1436"
  )
)
# Disabled factor orderings, kept for reference:
# df$ploidy <- factor(df$ploidy, levels=c('haploid','diploid low het','diploid high het','polyploid'))
# df$type <- factor(df$type, levels=c('A','B','C'))

head(bigdf)

In [None]:
# Left-join the columns of typedf onto bigdf by strain. all.x = TRUE keeps
# rows of bigdf that have no match in typedf (their added columns are NA);
# sort = FALSE skips sorting the result on the key.
# TRUE/FALSE are spelled out because T and F are ordinary variables that can
# be reassigned.
bigdf <- merge(bigdf, typedf, by = "strain", all.x = TRUE, sort = FALSE)
head(bigdf)

In [None]:
# Show the last six rows of the merged table (six is tail()'s default).
tail(bigdf, n = 6L)

In [None]:
# Per-strain box plots of `vol`, coloured by `type`, with the individual
# measurements overlaid as jittered points.
gg <- ggplot(data = bigdf, aes(x = strain, y = vol, color = type)) +
  # Outlier glyphs are hidden because every observation is drawn by the
  # jitter layer below.
  geom_boxplot(outlier.shape = NA) +
  # height = 0 restricts the jitter to the x direction so the plotted
  # volumes are not perturbed; the fixed seed makes the figure reproducible.
  geom_jitter(
    position = position_jitter(width = 0.25, height = 0, seed = 1),
    alpha = 0.5
  ) +
  theme_classic() +
  labs(x = NULL, y = "Cell volume (um^3)", color = "Prymnesin type") +
  theme(axis.text.x = element_text(angle = 90, vjust = 0.5, hjust = 1)) +
  theme(text = element_text(size = 20)) +
  scale_color_manual(values = c("#d95f02", "#7570b3", "#1b9e77", "#000000"))
# Optional tweaks, disabled:
# gg <- gg + geom_violin()
# gg <- gg + stat_summary(fun = median, geom = "point", size = 2, color = "red")
# gg <- gg + scale_y_continuous(breaks = seq(0, 900, 100))

gg

In [None]:
# Save a 10 x 4 inch PDF; no `plot` is given, so ggsave() writes the last plot.
ggsave(
  filename = "cellsize_distribution.pdf",
  device = "pdf",
  width = 10,
  height = 4,
  units = "in"
)