# Purpose

Compare genes of Total and Unique counts 

# Steps


1) import data from various CSV files created
2) Scatterplot between Total vs Unique counts of FDR,Mean,Coefficients

# Conclusions

1) Interesting Patterns especially in heat shock and can treatments 
2) Unique counts FDR values inflated


In [1]:
# NOTEBOOK

In [2]:
#Required Packages 

In [5]:
suppressMessages(require(reshape))
suppressMessages(library(gridExtra))
suppressMessages(library(RColorBrewer))
options(repr.plot.width=5, repr.plot.height=5)
suppressMessages(library(ggpubr))
suppressMessages(library(tidyverse))
library("IRdisplay")
library("egg")
library("grid")
library("OCplus")

In [6]:
TC_files <- list.files("../../reports/production1_2_3_4_5//mid//TC_fdr_csv",pattern='*effect.csv',full.names = TRUE)
UC_files <- list.files("../../reports/production1_2_3_4_5//mid//UC_fdr_csv",pattern='*effect.csv',full.names = TRUE)

In [7]:
length(TC_files)

In [8]:
for (i in 1:length(TC_files))
{
    tryCatch({
condition <- tail(str_split(TC_files,"/|.csv")[[i]],n=2)
tdf <-  read.table(TC_files[i],header=T,sep=",")%>%dplyr::select(fdr,log2_coefficient,locus_tag,mean,controlmean)
udf <- read.table(UC_files[i],header=T,sep=",")%>%dplyr::select(fdr,log2_coefficient,locus_tag,mean,controlmean)
df <- na.omit(merge(tdf, udf, by = "locus_tag", all = TRUE))
colnames(df)<- c("locus_tag","Total.fdr","Total.coefficient","Total.mean","Total.Control.Mean","Unique.fdr","Unique.coefficient","Unique.mean","Unique.Control.Mean")
dfplot1<- df%>%mutate(fdr = case_when(Unique.fdr  < 0.05  ~ "Unique_sig" ))
dfplot2<- df%>%mutate(fdr = case_when(Total.fdr < 0.05  ~ "Total_sig" ))
dfplot3<- df%>%mutate(fdr = case_when(Total.fdr > 0.05 & Unique.fdr  > 0.05  ~ "ns" ))
dfplot <- rbind(dfplot1,dfplot2,dfplot3)%>%drop_na()
dfplot <- dfplot%>%mutate(pointsize = case_when(fdr == "ns" | fdr == "ns"~ "1" ,fdr == "Total_sig" | fdr == "Unique_sig"~ "1"))
p <- ggplot(dfplot,aes(Total.coefficient,Unique.coefficient))+ geom_point(aes(shape=fdr, color=fdr,size=pointsize))+xlab("Total Counts Coefficient")+ylab("Unique Counts Coefficient")+theme_bw()+theme(axis.line = element_line(colour = "black"),
    panel.grid.major = element_blank(),
    panel.grid.minor = element_blank(),
    panel.border = element_blank(),
    panel.background = element_blank())+ggtitle(condition)+scale_shape_manual(labels = c("Not Significant","Unique Significant", "Total Significant"),values = c("ns" = 16,"Unique_sig"=6,"Total_sig"=2))+scale_color_manual(labels = c("Not Significant","Unique Significant", "Total Significant"),values = c("ns" = "azure3","Unique_sig"="darkblue","Total_sig"="darkred"))+guides(size = FALSE)+xlim(-5,5)+ylim(-5,5)+theme(legend.title=element_blank())+ theme(legend.justification = "top")+theme(plot.title = element_text(size=24))+theme(legend.text=element_text(size=18))+theme(axis.text=element_text(size=18),axis.title.y = element_text(size =1, angle = 90))+
theme(aspect.ratio=1)+theme_article()+theme(panel.border = element_blank(),axis.line    = element_line(color='black'))
write_csv(dfplot2%>%filter(fdr=="Total_sig"),paste0("../../reports/production1_2_3//mid/sig_locus/total_sig/TC_",condition, "_sig.csv")[1])
write_csv(dfplot1%>%filter(fdr=="Unique_sig"),paste0("../../reports/production1_2_3//mid/sig_locus/unique_sig/UC_",condition, "_sig.csv")[1])
dfb<- arrange(df%>%filter(Unique.fdr  < 0.05 & Total.fdr < 0.05),Total.fdr,Unique.fdr)
write_csv(dfb,paste0("../../reports/production1_2_3_4_5///mid/sig_locus/both_sig/",condition, "_sig.csv")[1])
ggsave(filename = paste0("../../reports/production1_2_3_4_5///mid/sig_locus/both_sig/",condition, "_figure.pdf")[1], device = "pdf",  plot = p, width = 7, height = 7, dpi = 300, units = "in")
}, error=function(e){})
}



"`guides(<scale> = FALSE)` is deprecated. Please use `guides(<scale> = "none")` instead."
"Using size for a discrete variable is not advised."
"`guides(<scale> = FALSE)` is deprecated. Please use `guides(<scale> = "none")` instead."
"Using size for a discrete variable is not advised."
"`guides(<scale> = FALSE)` is deprecated. Please use `guides(<scale> = "none")` instead."
"Using size for a discrete variable is not advised."
"`guides(<scale> = FALSE)` is deprecated. Please use `guides(<scale> = "none")` instead."
"Using size for a discrete variable is not advised."
"`guides(<scale> = FALSE)` is deprecated. Please use `guides(<scale> = "none")` instead."
"Using size for a discrete variable is not advised."
"Removed 1 rows containing missing values (geom_point)."
"`guides(<scale> = FALSE)` is deprecated. Please use `guides(<scale> = "none")` instead."
"Using size for a discrete variable is not advised."
"Removed 1 rows containing missing values (geom_point)."
"`guides(<scale> = FALSE)` i