# Question: How many upregulated and downregulated genes are in the DESeq2 output from Galaxy?
## Only Retina Data was run on Galaxy.

In [12]:
def extract_significant_genes(filename, output_prefix, p_value_threshold, log2_fc_threshold):
    """Write the significant gene IDs of a DESeq2 result table to three lists.

    Each line of ``filename`` is split on whitespace. Field 0 is used as the
    gene ID, field 2 as the log fold change and field 6 as the adjusted
    p-value (presumably the Galaxy DESeq2 column layout -- confirm against
    the tool output).

    A gene is kept when its adjusted p-value is strictly below
    ``p_value_threshold`` and its log fold change is either
    ``>= log2_fc_threshold`` (upregulated) or ``<= -log2_fc_threshold``
    (downregulated). With a threshold of 0, a fold change of exactly 0 is
    counted as upregulated because that branch is tested first.

    Output files (overwritten on every call), one gene ID per line:
        ``<output_prefix>_upregulated.txt``
        ``<output_prefix>_downregulated.txt``
        ``<output_prefix>_all.txt``  (union of the two, in input order)

    Lines are skipped when they have fewer than 7 fields (e.g. blank
    lines), when either value is the literal ``NA``, or when either value is
    not numeric (e.g. a header row).

    Returns None.
    """
    # `with` guarantees all four handles are closed even if a line raises.
    with open(filename, "r") as inputfile, \
            open(output_prefix + "_upregulated.txt", "w") as upreg_genes, \
            open(output_prefix + "_downregulated.txt", "w") as downreg_genes, \
            open(output_prefix + "_all.txt", "w") as all_significant_genes:

        for line in inputfile:
            fields = line.split()

            # Blank or truncated lines do not reach the adjusted p-value column.
            if len(fields) < 7:
                continue

            gene_id = fields[0]
            logFC = fields[2]
            p_val_adj = fields[6]

            # Skip line if it doesn't have values
            if logFC == "NA" or p_val_adj == "NA":
                continue

            try:
                logFC = float(logFC)
                p_val_adj = float(p_val_adj)
            except ValueError:
                # Non-numeric text in the numeric columns, e.g. a header row.
                continue

            if p_val_adj < p_value_threshold:
                if logFC >= log2_fc_threshold:
                    upreg_genes.write(gene_id + "\n")
                    all_significant_genes.write(gene_id + "\n")
                elif logFC <= -log2_fc_threshold:
                    downreg_genes.write(gene_id + "\n")
                    all_significant_genes.write(gene_id + "\n")
        

In [22]:
def quantify_results(glds):
    """Print the number of gene IDs in each result list for one comparison.

    ``glds`` is the output prefix; the files ``<glds>_all.txt``,
    ``<glds>_upregulated.txt`` and ``<glds>_downregulated.txt`` are read and
    their line counts printed (one gene ID per line, as written by
    ``extract_significant_genes``).

    The counts are computed in Python instead of shelling out to ``wc -l``
    so the function works outside IPython and with prefixes that contain
    spaces or shell metacharacters. Each count is printed as
    ``"%8d %s" % (count, filename)``, the layout of the earlier ``wc -l``
    output.

    Raises IOError/OSError if one of the three files does not exist.
    Returns None.
    """
    # File Names, paired with the heading printed above each count.
    labelled_files = [
        ("Number of DE Genes: ", glds + "_all.txt"),
        ("Number of Upregulated Genes: ", glds + "_upregulated.txt"),
        ("Number of Downregulated Genes: ", glds + "_downregulated.txt"),
    ]

    # Single-argument print(...) behaves the same on Python 2 and Python 3.
    print("~~~DESeq2 Results~~~")
    for label, path in labelled_files:
        print(label)
        with open(path, "r") as handle:
            line_count = sum(1 for _ in handle)
        print("%8d %s" % (line_count, path))
    print("")
    

In [40]:
# Thresholds handed to extract_significant_genes by every comparison cell below.
# log_fc: fold-change cutoff; at 0 every significant gene is kept and only split by sign.
log_fc = 0
# p_value: genes are kept when their adjusted p-value is strictly below this.
p_value = 0.05

## 7 days, Retina, Galaxy

In [41]:
# 7-day retina comparisons: (output prefix, Galaxy DESeq2 result file).
# Each pair is extracted and summarised in turn, in the listed order.
for prefix, inputfile in [
    ("7day_radiation_retina_galaxy",
     "../../DESeq2_Output/Retina/7day/Galaxy22-[DESeq2_result_file_on_Radiation1_vs_Control1].tabular"),
    ("7day_unloaded_retina_galaxy",
     "../../DESeq2_Output/Retina/7day/Galaxy25-[DESeq2_result_file_on_Unloaded1_vs_Control1].tabular"),
    ("7day_combination_retina_galaxy",
     "../../DESeq2_Output/Retina/7day/Galaxy28-[DESeq2_result_file_on_Combination1_vs_Control1].tabular"),
]:
    extract_significant_genes(inputfile, prefix, p_value, log_fc)
    quantify_results(prefix)

~~~DESeq2 Results~~~
Number of DE Genes: 
     769 7day_radiation_retina_galaxy_all.txt
Number of Upregulated Genes: 
     332 7day_radiation_retina_galaxy_upregulated.txt
Number of Downregulated Genes: 
     437 7day_radiation_retina_galaxy_downregulated.txt

~~~DESeq2 Results~~~
Number of DE Genes: 
     230 7day_unloaded_retina_galaxy_all.txt
Number of Upregulated Genes: 
     112 7day_unloaded_retina_galaxy_upregulated.txt
Number of Downregulated Genes: 
     118 7day_unloaded_retina_galaxy_downregulated.txt

~~~DESeq2 Results~~~
Number of DE Genes: 
       0 7day_combination_retina_galaxy_all.txt
Number of Upregulated Genes: 
       0 7day_combination_retina_galaxy_upregulated.txt
Number of Downregulated Genes: 
       0 7day_combination_retina_galaxy_downregulated.txt



## 1 Month, Retina, Galaxy

In [32]:
# 1-month retina comparisons: (output prefix, Galaxy DESeq2 result file).
# Each pair is extracted and summarised in turn, in the listed order.
for prefix, inputfile in [
    ("1month_radiation_retina_galaxy",
     "../../DESeq2_Output/Retina/1month/Galaxy21-[DESeq2_result_file_on_Radiation2_vs_Control2].tabular"),
    ("1month_unloaded_retina_galaxy",
     "../../DESeq2_Output/Retina/1month/Galaxy24-[DESeq2_result_file_on_Unloaded2_vs_Control2].tabular"),
    ("1month_combination_retina_galaxy",
     "../../DESeq2_Output/Retina/1month/Galaxy27-[DESeq2_result_file_on_Combination2_vs_Control2].tabular"),
]:
    extract_significant_genes(inputfile, prefix, p_value, log_fc)
    quantify_results(prefix)

~~~DESeq2 Results~~~
Number of DE Genes: 
      27 1month_radiation_retina_galaxy_all.txt
Number of Upregulated Genes: 
      15 1month_radiation_retina_galaxy_upregulated.txt
Number of Downregulated Genes: 
      12 1month_radiation_retina_galaxy_downregulated.txt

~~~DESeq2 Results~~~
Number of DE Genes: 
      13 1month_unloaded_retina_galaxy_all.txt
Number of Upregulated Genes: 
       8 1month_unloaded_retina_galaxy_upregulated.txt
Number of Downregulated Genes: 
       5 1month_unloaded_retina_galaxy_downregulated.txt

~~~DESeq2 Results~~~
Number of DE Genes: 
      70 1month_combination_retina_galaxy_all.txt
Number of Upregulated Genes: 
      49 1month_combination_retina_galaxy_upregulated.txt
Number of Downregulated Genes: 
      21 1month_combination_retina_galaxy_downregulated.txt



## 4 Month, Retina, Galaxy

In [33]:
# 4-month retina comparisons: (output prefix, Galaxy DESeq2 result file).
# Each pair is extracted and summarised in turn, in the listed order.
for prefix, inputfile in [
    ("4month_radiation_retina_galaxy",
     "../../DESeq2_Output/Retina/4month/Galaxy19-[DESeq2_result_file_on_Radiation3_vs_Control3].tabular"),
    ("4month_unloaded_retina_galaxy",
     "../../DESeq2_Output/Retina/4month/Galaxy22-[DESeq2_result_file_on_Unloaded3_vs_Control3].tabular"),
    ("4month_combination_retina_galaxy",
     "../../DESeq2_Output/Retina/4month/Galaxy25-[DESeq2_result_file_on_Combination3_vs_Control3].tabular"),
]:
    extract_significant_genes(inputfile, prefix, p_value, log_fc)
    quantify_results(prefix)

~~~DESeq2 Results~~~
Number of DE Genes: 
       3 4month_radiation_retina_galaxy_all.txt
Number of Upregulated Genes: 
       1 4month_radiation_retina_galaxy_upregulated.txt
Number of Downregulated Genes: 
       2 4month_radiation_retina_galaxy_downregulated.txt

~~~DESeq2 Results~~~
Number of DE Genes: 
       1 4month_unloaded_retina_galaxy_all.txt
Number of Upregulated Genes: 
       0 4month_unloaded_retina_galaxy_upregulated.txt
Number of Downregulated Genes: 
       1 4month_unloaded_retina_galaxy_downregulated.txt

~~~DESeq2 Results~~~
Number of DE Genes: 
       2 4month_combination_retina_galaxy_all.txt
Number of Upregulated Genes: 
       0 4month_combination_retina_galaxy_upregulated.txt
Number of Downregulated Genes: 
       2 4month_combination_retina_galaxy_downregulated.txt



### Including a log2 fold-change (LFC) requirement eliminates almost all genes from all comparisons. LFC thresholds of 2, 1, and 0.5 were tested.