# Determine DEGs in Deseq2 Data

### 1. Import Required Packages
### 2. Import Data
### 3. Determine DEGs for each celltype and time


## <br> 1. Import Required Packages

In [1]:
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import seaborn as sns

Set figure parameters.

In [2]:
%config InlineBackend.print_figure_kwargs={'facecolor' : "w"}
%config InlineBackend.figure_format='retina'
pd.options.display.max_colwidth = 200
#plt.rcParams['font.sans-serif']=['Arial']
plt.rcParams['pdf.fonttype'] = 'truetype'

## <br> 2. Import Deseq2 Data

In [3]:
Deseq2_Master = pd.read_csv('./Results/Deseq2_Master_Wald.txt', delimiter = '\t', index_col=0)

Deseq2_Master['Time'] = Deseq2_Master['Time'].astype('category')
Deseq2_Master['Time'] = Deseq2_Master['Time'].cat.reorder_categories([2,4,8,12,18,24,72])

In [4]:
Deseq2_Master

Unnamed: 0,Gene,baseMean,log2FoldChange,lfcSE,stat,pvalue,padj,Celltype,Time,Fold-Change
0,Gm42418,9721.280933,0.090394,0.450800,0.200520,0.841074,0.998335,B_Cell,2,1.064661
1,Malat1,3845.002291,-0.101792,0.159584,-0.637858,0.523566,0.998335,B_Cell,2,0.931875
2,Cmss1,1590.724138,0.309259,0.446208,0.693083,0.488257,0.998335,B_Cell,2,1.239071
3,Foxp1,795.056702,-0.041252,0.180903,-0.228032,0.819622,0.998335,B_Cell,2,0.971811
4,Camk1d,746.328996,0.123394,0.308227,0.400334,0.688911,0.998335,B_Cell,2,1.089294
...,...,...,...,...,...,...,...,...,...,...
626194,Tfpi,1.631608,-0.321517,1.136329,-0.282943,0.777220,0.999076,T_Cell,72,0.800228
626195,Tmem128,1.647822,-1.621279,1.074936,-1.508257,0.131489,0.999076,T_Cell,72,0.325047
626196,Wbp1,1.682889,-0.317524,1.098354,-0.289091,0.772512,0.999076,T_Cell,72,0.802446
626197,Zfp324,1.478046,-0.332261,1.205061,-0.275721,0.782762,0.999076,T_Cell,72,0.794291


## <br> 3. Determine DEGs for each celltype and time

In [5]:
##############
# All DEGs
##############
Hepatocyte_DEGs_All_Unique = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Hepatocyte') &
                                           ((Deseq2_Master['Fold-Change'] >= 1.5) | (Deseq2_Master['Fold-Change'] <= 1/1.5)) &
                                           (Deseq2_Master['padj'] <= 0.05)]

Hepatocyte_DEGs_All_Unique_List = Hepatocyte_DEGs_All_Unique[['Gene']].drop_duplicates(keep='first').copy()
Hepatocyte_DEGs_All_Unique_List.sort_values(by='Gene', inplace=True)
Hepatocyte_DEGs_All_Unique_List.to_csv('./Results/04b_All_DEGs/Hepatocyte.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced Only
############################
Hepatocyte_DEGs_Induced = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Hepatocyte') &
                               (Deseq2_Master['Fold-Change'] >= 1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]

Hepatocyte_DEGs_Induced_Counts = Hepatocyte_DEGs_Induced.groupby('Time').size().reset_index(name='Induced')
Hepatocyte_Induced_DEGs_list = Hepatocyte_DEGs_Induced['Gene'].drop_duplicates(keep='first').sort_values()
Hepatocyte_Induced_DEGs_list.to_csv('./Results/04b_All_DEGs/Hepatocyte_Induced.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced in All 7 time points
############################
Hepatocyte_Induced_All_counts = Hepatocyte_DEGs_Induced['Gene'].value_counts()
Hepatocyte_Induced_All_Results = Hepatocyte_Induced_All_counts[Hepatocyte_Induced_All_counts == 7]
Hepatocyte_Induced_All_Results_List = pd.DataFrame(sorted(Hepatocyte_Induced_All_Results.reset_index()['Gene']))
Hepatocyte_Induced_All_Results_List.to_csv('./Results/04b_All_DEGs/Hepatocyte_Induced_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed Only
############################
Hepatocyte_DEGs_Repressed = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Hepatocyte') &
                               (Deseq2_Master['Fold-Change'] <= 1/1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]                                                                      

Hepatocyte_DEGs_Repressed_Counts = Hepatocyte_DEGs_Repressed.groupby('Time').size().reset_index(name='Repressed')   
Hepatocyte_DEGs_Repressed_list = Hepatocyte_DEGs_Repressed['Gene'].drop_duplicates(keep='first').sort_values()
Hepatocyte_DEGs_Repressed_list.to_csv('./Results/04b_All_DEGs/Hepatocyte_Repressed.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed in All 7 time points
############################
Hepatocyte_Repressed_All_counts = Hepatocyte_DEGs_Repressed['Gene'].value_counts()
Hepatocyte_Repressed_All_Results = Hepatocyte_Repressed_All_counts[Hepatocyte_Repressed_All_counts == 7]
Hepatocyte_Repressed_All_Results_List = pd.DataFrame(sorted(Hepatocyte_Repressed_All_Results.reset_index()['Gene']))
Hepatocyte_Repressed_All_Results_List.to_csv('./Results/04b_All_DEGs/Hepatocyte_Repressed_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)



############################
## Make All DEG count Table
############################
Hepatocyte_Counts = pd.concat([Hepatocyte_DEGs_Induced_Counts, Hepatocyte_DEGs_Repressed_Counts], axis=1)
Hepatocyte_Counts = Hepatocyte_Counts[['Time','Induced', 'Repressed']]


############################
#All Genes in Celltype(Background)
############################
Hepatocyte_All_Genes = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Hepatocyte')]

Hepatocyte_All_All_Genes = pd.DataFrame(Hepatocyte_All_Genes['Gene'].drop_duplicates(keep='first').tolist())
Hepatocyte_All_All_Genes.to_csv('./Results/04b_All_Genes_In_Celltype/Hepatocyte_All_Genes.txt', sep='\t', index=False, header=False)



print("Hepatocyte")
print("----------------------------")
print("Induced in all time points:", len(Hepatocyte_Induced_All_Results))
print()
print("Repressed in all time points:", len(Hepatocyte_Repressed_All_Results))
print()
print("Total number of DEGs:", len(Hepatocyte_DEGs_All_Unique_List))
print("--- Induced:", len(Hepatocyte_Induced_DEGs_list))
print("--- Repressed:", len(Hepatocyte_DEGs_Repressed_list))
print()
print("All Genes in Celltype:",len(Hepatocyte_All_All_Genes))
print()
print(Hepatocyte_Counts)

Hepatocyte
----------------------------
Induced in all time points: 77

Repressed in all time points: 1

Total number of DEGs: 4785
--- Induced: 2360
--- Repressed: 2728

All Genes in Celltype: 17250

  Time Time  Induced  Repressed
0    2    2      503        239
1    4    4     1006        940
2    8    8      291        155
3   12   12      722        760
4   18   18      433        542
5   24   24      292        282
6   72   72      882        907


In [6]:
##############
# All DEGs
##############
LSEC_DEGs_All_Unique = Deseq2_Master[(Deseq2_Master['Celltype'] == 'EC') &
                                           ((Deseq2_Master['Fold-Change'] >= 1.5) | (Deseq2_Master['Fold-Change'] <= 1/1.5)) &
                                           (Deseq2_Master['padj'] <= 0.05)]

LSEC_DEGs_All_Unique_List = LSEC_DEGs_All_Unique[['Gene']].drop_duplicates(keep='first').copy()
LSEC_DEGs_All_Unique_List.sort_values(by='Gene', inplace=True)
LSEC_DEGs_All_Unique_List.to_csv('./Results/04b_All_DEGs/EC.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced Only
############################
LSEC_DEGs_Induced = Deseq2_Master[(Deseq2_Master['Celltype'] == 'EC') &
                               (Deseq2_Master['Fold-Change'] >= 1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]

LSEC_DEGs_Induced_Counts = LSEC_DEGs_Induced.groupby('Time').size().reset_index(name='Induced')
LSEC_Induced_DEGs_list = LSEC_DEGs_Induced['Gene'].drop_duplicates(keep='first').sort_values()
LSEC_Induced_DEGs_list.to_csv('./Results/04b_All_DEGs/EC_Induced.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced in All 7 time points
############################
LSEC_Induced_All_counts = LSEC_DEGs_Induced['Gene'].value_counts()
LSEC_Induced_All_Results = LSEC_Induced_All_counts[LSEC_Induced_All_counts == 7]
LSEC_Induced_All_Results_List = pd.DataFrame(sorted(LSEC_Induced_All_Results.reset_index()['Gene']))
LSEC_Induced_All_Results_List.to_csv('./Results/04b_All_DEGs/EC_Induced_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed Only
############################
LSEC_DEGs_Repressed = Deseq2_Master[(Deseq2_Master['Celltype'] == 'EC') &
                               (Deseq2_Master['Fold-Change'] <= 1/1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]                                                                      

LSEC_DEGs_Repressed_Counts = LSEC_DEGs_Repressed.groupby('Time').size().reset_index(name='Repressed')   
LSEC_DEGs_Repressed_list = LSEC_DEGs_Repressed['Gene'].drop_duplicates(keep='first').sort_values()
LSEC_DEGs_Repressed_list.to_csv('./Results/04b_All_DEGs/EC_Repressed.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed in All 7 time points
############################
LSEC_Repressed_All_counts = LSEC_DEGs_Repressed['Gene'].value_counts()
LSEC_Repressed_All_Results = LSEC_Repressed_All_counts[LSEC_Repressed_All_counts == 7]
LSEC_Repressed_All_Results_List = pd.DataFrame(sorted(LSEC_Repressed_All_Results.reset_index()['Gene']))
LSEC_Repressed_All_Results_List.to_csv('./Results/04b_All_DEGs/EC_Repressed_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)



############################
## Make All DEG count Table
############################
LSEC_Counts = pd.concat([LSEC_DEGs_Induced_Counts, LSEC_DEGs_Repressed_Counts], axis=1)
LSEC_Counts = LSEC_Counts[['Time','Induced', 'Repressed']]


############################
#All Genes in Celltype(Background)
############################
LSEC_All_Genes = Deseq2_Master[(Deseq2_Master['Celltype'] == 'EC')]

LSEC_All_All_Genes = pd.DataFrame(LSEC_All_Genes['Gene'].drop_duplicates(keep='first').tolist())
LSEC_All_All_Genes.to_csv('./Results/04b_All_Genes_In_Celltype/EC_All_Genes.txt', sep='\t', index=False, header=False)



print("LSEC")
print("----------------------------")
print("Induced in all time points:", len(LSEC_Induced_All_Results))
print()
print("Repressed in all time points:", len(LSEC_Repressed_All_Results))
print()
print("Total number of DEGs:", len(LSEC_DEGs_All_Unique_List))
print("--- Induced:", len(LSEC_Induced_DEGs_list))
print("--- Repressed:", len(LSEC_DEGs_Repressed_list))
print()
print("All Genes in Celltype:",len(LSEC_All_All_Genes))
print()
print(LSEC_Counts)

LSEC
----------------------------
Induced in all time points: 16

Repressed in all time points: 0

Total number of DEGs: 710
--- Induced: 446
--- Repressed: 267

All Genes in Celltype: 13426

  Time Time  Induced  Repressed
0    2    2      247         79
1    4    4      159         38
2    8    8       57         13
3   12   12      100         68
4   18   18       54         12
5   24   24       45          6
6   72   72      130         90


In [7]:
##############
# All DEGs
##############
HSC_DEGs_All_Unique = Deseq2_Master[(Deseq2_Master['Celltype'] == 'HSC') &
                                           ((Deseq2_Master['Fold-Change'] >= 1.5) | (Deseq2_Master['Fold-Change'] <= 1/1.5)) &
                                           (Deseq2_Master['padj'] <= 0.05)]

HSC_DEGs_All_Unique_List = HSC_DEGs_All_Unique[['Gene']].drop_duplicates(keep='first').copy()
HSC_DEGs_All_Unique_List.sort_values(by='Gene', inplace=True)
HSC_DEGs_All_Unique_List.to_csv('./Results/04b_All_DEGs/HSC.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced Only
############################
HSC_DEGs_Induced = Deseq2_Master[(Deseq2_Master['Celltype'] == 'HSC') &
                               (Deseq2_Master['Fold-Change'] >= 1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]

HSC_DEGs_Induced_Counts = HSC_DEGs_Induced.groupby('Time').size().reset_index(name='Induced')
HSC_Induced_DEGs_list = HSC_DEGs_Induced['Gene'].drop_duplicates(keep='first').sort_values()
HSC_Induced_DEGs_list.to_csv('./Results/04b_All_DEGs/HSC_Induced.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced in All 7 time points
############################
HSC_Induced_All_counts = HSC_DEGs_Induced['Gene'].value_counts()
HSC_Induced_All_Results = HSC_Induced_All_counts[HSC_Induced_All_counts == 7]
HSC_Induced_All_Results_List = pd.DataFrame(sorted(HSC_Induced_All_Results.reset_index()['Gene']))
HSC_Induced_All_Results_List.to_csv('./Results/04b_All_DEGs/HSC_Induced_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed Only
############################
HSC_DEGs_Repressed = Deseq2_Master[(Deseq2_Master['Celltype'] == 'HSC') &
                               (Deseq2_Master['Fold-Change'] <= 1/1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]                                                                      

HSC_DEGs_Repressed_Counts = HSC_DEGs_Repressed.groupby('Time').size().reset_index(name='Repressed')   
HSC_DEGs_Repressed_list = HSC_DEGs_Repressed['Gene'].drop_duplicates(keep='first').sort_values()
HSC_DEGs_Repressed_list.to_csv('./Results/04b_All_DEGs/HSC_Repressed.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed in All 7 time points
############################
HSC_Repressed_All_counts = HSC_DEGs_Repressed['Gene'].value_counts()
HSC_Repressed_All_Results = HSC_Repressed_All_counts[HSC_Repressed_All_counts == 7]
HSC_Repressed_All_Results_List = pd.DataFrame(sorted(HSC_Repressed_All_Results.reset_index()['Gene']))
HSC_Repressed_All_Results_List.to_csv('./Results/04b_All_DEGs/HSC_Repressed_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)



############################
## Make All DEG count Table
############################
HSC_Counts = pd.concat([HSC_DEGs_Induced_Counts, HSC_DEGs_Repressed_Counts], axis=1)
HSC_Counts = HSC_Counts[['Time','Induced', 'Repressed']]


############################
#All Genes in Celltype(Background)
############################
HSC_All_Genes = Deseq2_Master[(Deseq2_Master['Celltype'] == 'HSC')]

HSC_All_All_Genes = pd.DataFrame(HSC_All_Genes['Gene'].drop_duplicates(keep='first').tolist())
HSC_All_All_Genes.to_csv('./Results/04b_All_Genes_In_Celltype/HSC_All_Genes.txt', sep='\t', index=False, header=False)



print("HSC")
print("----------------------------")
print("Induced in all time points:", len(HSC_Induced_All_Results))
print()
print("Repressed in all time points:", len(HSC_Repressed_All_Results))
print()
print("Total number of DEGs:", len(HSC_DEGs_All_Unique_List))
print("--- Induced:", len(HSC_Induced_DEGs_list))
print("--- Repressed:", len(HSC_DEGs_Repressed_list))
print()
print("All Genes in Celltype:",len(HSC_All_All_Genes))
print()
print(HSC_Counts)

HSC
----------------------------
Induced in all time points: 9

Repressed in all time points: 0

Total number of DEGs: 373
--- Induced: 239
--- Repressed: 136

All Genes in Celltype: 12232

  Time Time  Induced  Repressed
0    2    2       39          6
1    4    4       89         16
2    8    8       28          5
3   12   12       56         27
4   18   18      118         54
5   24   24       34          8
6   72   72       57         36


In [8]:
##############
# All DEGs
##############
Macrophage_DEGs_All_Unique = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Macrophage') &
                                           ((Deseq2_Master['Fold-Change'] >= 1.5) | (Deseq2_Master['Fold-Change'] <= 1/1.5)) &
                                           (Deseq2_Master['padj'] <= 0.05)]

Macrophage_DEGs_All_Unique_List = Macrophage_DEGs_All_Unique[['Gene']].drop_duplicates(keep='first').copy()
Macrophage_DEGs_All_Unique_List.sort_values(by='Gene', inplace=True)
Macrophage_DEGs_All_Unique_List.to_csv('./Results/04b_All_DEGs/Macrophage.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced Only
############################
Macrophage_DEGs_Induced = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Macrophage') &
                               (Deseq2_Master['Fold-Change'] >= 1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]

Macrophage_DEGs_Induced_Counts = Macrophage_DEGs_Induced.groupby('Time').size().reset_index(name='Induced')
Macrophage_Induced_DEGs_list = Macrophage_DEGs_Induced['Gene'].drop_duplicates(keep='first').sort_values()
Macrophage_Induced_DEGs_list.to_csv('./Results/04b_All_DEGs/Macrophage_Induced.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced in All 7 time points
############################
Macrophage_Induced_All_counts = Macrophage_DEGs_Induced['Gene'].value_counts()
Macrophage_Induced_All_Results = Macrophage_Induced_All_counts[Macrophage_Induced_All_counts == 7]
Macrophage_Induced_All_Results_List = pd.DataFrame(sorted(Macrophage_Induced_All_Results.reset_index()['Gene']))
Macrophage_Induced_All_Results_List.to_csv('./Results/04b_All_DEGs/Macrophage_Induced_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed Only
############################
Macrophage_DEGs_Repressed = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Macrophage') &
                               (Deseq2_Master['Fold-Change'] <= 1/1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]                                                                      

Macrophage_DEGs_Repressed_Counts = Macrophage_DEGs_Repressed.groupby('Time').size().reset_index(name='Repressed')   
Macrophage_DEGs_Repressed_list = Macrophage_DEGs_Repressed['Gene'].drop_duplicates(keep='first').sort_values()
Macrophage_DEGs_Repressed_list.to_csv('./Results/04b_All_DEGs/Macrophage_Repressed.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed in All 7 time points
############################
Macrophage_Repressed_All_counts = Macrophage_DEGs_Repressed['Gene'].value_counts()
Macrophage_Repressed_All_Results = Macrophage_Repressed_All_counts[Macrophage_Repressed_All_counts == 7]
Macrophage_Repressed_All_Results_List = pd.DataFrame(sorted(Macrophage_Repressed_All_Results.reset_index()['Gene']))
Macrophage_Repressed_All_Results_List.to_csv('./Results/04b_All_DEGs/Macrophage_Repressed_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)



############################
## Make All DEG count Table
############################
Macrophage_Counts = pd.concat([Macrophage_DEGs_Induced_Counts, Macrophage_DEGs_Repressed_Counts], axis=1)
Macrophage_Counts = Macrophage_Counts[['Time','Induced', 'Repressed']]


############################
#All Genes in Celltype(Background)
############################
Macrophage_All_Genes = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Macrophage')]

Macrophage_All_All_Genes = pd.DataFrame(Macrophage_All_Genes['Gene'].drop_duplicates(keep='first').tolist())
Macrophage_All_All_Genes.to_csv('./Results/04b_All_Genes_In_Celltype/Macrophage_All_Genes.txt', sep='\t', index=False, header=False)



print("Macrophage")
print("----------------------------")
print("Induced in all time points:", len(Macrophage_Induced_All_Results))
print()
print("Repressed in all time points:", len(Macrophage_Repressed_All_Results))
print()
print("Total number of DEGs:", len(Macrophage_DEGs_All_Unique_List))
print("--- Induced:", len(Macrophage_Induced_DEGs_list))
print("--- Repressed:", len(Macrophage_DEGs_Repressed_list))
print()
print("All Genes in Celltype:",len(Macrophage_All_All_Genes))
print()
print(Macrophage_Counts)

Macrophage
----------------------------
Induced in all time points: 5

Repressed in all time points: 0

Total number of DEGs: 161
--- Induced: 93
--- Repressed: 68

All Genes in Celltype: 11242

  Time Time  Induced  Repressed
0    2    2       33          5
1    4    4       62         24
2    8    8       16          1
3   12   12       27          8
4   18   18       18          0
5   24   24       13          2
6   72   72       23         31


In [9]:
##############
# All DEGs
##############
B_Cell_DEGs_All_Unique = Deseq2_Master[(Deseq2_Master['Celltype'] == 'B_Cell') &
                                           ((Deseq2_Master['Fold-Change'] >= 1.5) | (Deseq2_Master['Fold-Change'] <= 1/1.5)) &
                                           (Deseq2_Master['padj'] <= 0.05)]

B_Cell_DEGs_All_Unique_List = B_Cell_DEGs_All_Unique[['Gene']].drop_duplicates(keep='first').copy()
B_Cell_DEGs_All_Unique_List.sort_values(by='Gene', inplace=True)
B_Cell_DEGs_All_Unique_List.to_csv('./Results/04b_All_DEGs/B_Cell.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced Only
############################
B_Cell_DEGs_Induced = Deseq2_Master[(Deseq2_Master['Celltype'] == 'B_Cell') &
                               (Deseq2_Master['Fold-Change'] >= 1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]

B_Cell_DEGs_Induced_Counts = B_Cell_DEGs_Induced.groupby('Time').size().reset_index(name='Induced')
B_Cell_Induced_DEGs_list = B_Cell_DEGs_Induced['Gene'].drop_duplicates(keep='first').sort_values()
B_Cell_Induced_DEGs_list.to_csv('./Results/04b_All_DEGs/B_Cell_Induced.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced in All 7 time points
############################
B_Cell_Induced_All_counts = B_Cell_DEGs_Induced['Gene'].value_counts()
B_Cell_Induced_All_Results = B_Cell_Induced_All_counts[B_Cell_Induced_All_counts == 7]
B_Cell_Induced_All_Results_List = pd.DataFrame(sorted(B_Cell_Induced_All_Results.reset_index()['Gene']))
B_Cell_Induced_All_Results_List.to_csv('./Results/04b_All_DEGs/B_Cell_Induced_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed Only
############################
B_Cell_DEGs_Repressed = Deseq2_Master[(Deseq2_Master['Celltype'] == 'B_Cell') &
                               (Deseq2_Master['Fold-Change'] <= 1/1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]                                                                      

B_Cell_DEGs_Repressed_Counts = B_Cell_DEGs_Repressed.groupby('Time').size().reset_index(name='Repressed')   
B_Cell_DEGs_Repressed_list = B_Cell_DEGs_Repressed['Gene'].drop_duplicates(keep='first').sort_values()
B_Cell_DEGs_Repressed_list.to_csv('./Results/04b_All_DEGs/B_Cell_Repressed.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed in All 7 time points
############################
B_Cell_Repressed_All_counts = B_Cell_DEGs_Repressed['Gene'].value_counts()
B_Cell_Repressed_All_Results = B_Cell_Repressed_All_counts[B_Cell_Repressed_All_counts == 7]
B_Cell_Repressed_All_Results_List = pd.DataFrame(sorted(B_Cell_Repressed_All_Results.reset_index()['Gene']))
B_Cell_Repressed_All_Results_List.to_csv('./Results/04b_All_DEGs/B_Cell_Repressed_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)



############################
## Make All DEG count Table
############################
B_Cell_Counts = pd.concat([B_Cell_DEGs_Induced_Counts, B_Cell_DEGs_Repressed_Counts], axis=1)
B_Cell_Counts = B_Cell_Counts[['Time','Induced', 'Repressed']]


############################
#All Genes in Celltype(Background)
############################
B_Cell_All_Genes = Deseq2_Master[(Deseq2_Master['Celltype'] == 'B_Cell')]

B_Cell_All_All_Genes = pd.DataFrame(B_Cell_All_Genes['Gene'].drop_duplicates(keep='first').tolist())
B_Cell_All_All_Genes.to_csv('./Results/04b_All_Genes_In_Celltype/B_Cell_All_Genes.txt', sep='\t', index=False, header=False)



print("B_Cell")
print("----------------------------")
print("Induced in all time points:", len(B_Cell_Induced_All_Results))
print()
print("Repressed in all time points:", len(B_Cell_Repressed_All_Results))
print()
print("Total number of DEGs:", len(B_Cell_DEGs_All_Unique_List))
print("--- Induced:", len(B_Cell_Induced_DEGs_list))
print("--- Repressed:", len(B_Cell_DEGs_Repressed_list))
print()
print("All Genes in Celltype:",len(B_Cell_All_All_Genes))
print()
print(B_Cell_Counts)

B_Cell
----------------------------
Induced in all time points: 4

Repressed in all time points: 0

Total number of DEGs: 128
--- Induced: 86
--- Repressed: 43

All Genes in Celltype: 9128

  Time Time  Induced  Repressed
0    2    2       24          4
1    4    4       39         10
2    8    8        9          1
3   12   12        6         16
4   18   18       48          3
5   24   24       11          2
6   72   72       18          8


In [10]:
##############
# All DEGs
##############
T_Cell_DEGs_All_Unique = Deseq2_Master[(Deseq2_Master['Celltype'] == 'T_Cell') &
                                           ((Deseq2_Master['Fold-Change'] >= 1.5) | (Deseq2_Master['Fold-Change'] <= 1/1.5)) &
                                           (Deseq2_Master['padj'] <= 0.05)]

T_Cell_DEGs_All_Unique_List = T_Cell_DEGs_All_Unique[['Gene']].drop_duplicates(keep='first').copy()
T_Cell_DEGs_All_Unique_List.sort_values(by='Gene', inplace=True)
T_Cell_DEGs_All_Unique_List.to_csv('./Results/04b_All_DEGs/T_Cell.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced Only
############################
T_Cell_DEGs_Induced = Deseq2_Master[(Deseq2_Master['Celltype'] == 'T_Cell') &
                               (Deseq2_Master['Fold-Change'] >= 1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]

T_Cell_DEGs_Induced_Counts = T_Cell_DEGs_Induced.groupby('Time').size().reset_index(name='Induced')
T_Cell_Induced_DEGs_list = T_Cell_DEGs_Induced['Gene'].drop_duplicates(keep='first').sort_values()
T_Cell_Induced_DEGs_list.to_csv('./Results/04b_All_DEGs/T_Cell_Induced.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced in All 7 time points
############################
T_Cell_Induced_All_counts = T_Cell_DEGs_Induced['Gene'].value_counts()
T_Cell_Induced_All_Results = T_Cell_Induced_All_counts[T_Cell_Induced_All_counts == 7]
T_Cell_Induced_All_Results_List = pd.DataFrame(sorted(T_Cell_Induced_All_Results.reset_index()['Gene']))
T_Cell_Induced_All_Results_List.to_csv('./Results/04b_All_DEGs/T_Cell_Induced_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed Only
############################
T_Cell_DEGs_Repressed = Deseq2_Master[(Deseq2_Master['Celltype'] == 'T_Cell') &
                               (Deseq2_Master['Fold-Change'] <= 1/1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]                                                                      

T_Cell_DEGs_Repressed_Counts = T_Cell_DEGs_Repressed.groupby('Time').size().reset_index(name='Repressed')   
T_Cell_DEGs_Repressed_list = T_Cell_DEGs_Repressed['Gene'].drop_duplicates(keep='first').sort_values()
T_Cell_DEGs_Repressed_list.to_csv('./Results/04b_All_DEGs/T_Cell_Repressed.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed in All 7 time points
############################
T_Cell_Repressed_All_counts = T_Cell_DEGs_Repressed['Gene'].value_counts()
T_Cell_Repressed_All_Results = T_Cell_Repressed_All_counts[T_Cell_Repressed_All_counts == 7]
T_Cell_Repressed_All_Results_List = pd.DataFrame(sorted(T_Cell_Repressed_All_Results.reset_index()['Gene']))
T_Cell_Repressed_All_Results_List.to_csv('./Results/04b_All_DEGs/T_Cell_Repressed_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)



############################
## Make All DEG count Table
############################
T_Cell_Counts = pd.concat([T_Cell_DEGs_Induced_Counts, T_Cell_DEGs_Repressed_Counts], axis=1)
T_Cell_Counts = T_Cell_Counts[['Time','Induced', 'Repressed']]


############################
#All Genes in Celltype(Background)
############################
T_Cell_All_Genes = Deseq2_Master[(Deseq2_Master['Celltype'] == 'T_Cell')]

T_Cell_All_All_Genes = pd.DataFrame(T_Cell_All_Genes['Gene'].drop_duplicates(keep='first').tolist())
T_Cell_All_All_Genes.to_csv('./Results/04b_All_Genes_In_Celltype/T_Cell_All_Genes.txt', sep='\t', index=False, header=False)



print("T_Cell")
print("----------------------------")
print("Induced in all time points:", len(T_Cell_Induced_All_Results))
print()
print("Repressed in all time points:", len(T_Cell_Repressed_All_Results))
print()
print("Total number of DEGs:", len(T_Cell_DEGs_All_Unique_List))
print("--- Induced:", len(T_Cell_Induced_DEGs_list))
print("--- Repressed:", len(T_Cell_DEGs_Repressed_list))
print()
print("All Genes in Celltype:",len(T_Cell_All_All_Genes))
print()
print(T_Cell_Counts)

T_Cell
----------------------------
Induced in all time points: 5

Repressed in all time points: 0

Total number of DEGs: 140
--- Induced: 114
--- Repressed: 26

All Genes in Celltype: 9533

  Time Time  Induced  Repressed
0    2    2       42          3
1    4    4       67          7
2    8    8       11          3
3   12   12       36          3
4   18   18       33          1
5   24   24       18          1
6   72   72       18          9


In [11]:
##############
# All DEGs
##############
PF_DEGs_All_Unique = Deseq2_Master[(Deseq2_Master['Celltype'] == 'PF') &
                                           ((Deseq2_Master['Fold-Change'] >= 1.5) | (Deseq2_Master['Fold-Change'] <= 1/1.5)) &
                                           (Deseq2_Master['padj'] <= 0.05)]

PF_DEGs_All_Unique_List = PF_DEGs_All_Unique[['Gene']].drop_duplicates(keep='first').copy()
PF_DEGs_All_Unique_List.sort_values(by='Gene', inplace=True)
PF_DEGs_All_Unique_List.to_csv('./Results/04b_All_DEGs/PF.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced Only
############################
PF_DEGs_Induced = Deseq2_Master[(Deseq2_Master['Celltype'] == 'PF') &
                               (Deseq2_Master['Fold-Change'] >= 1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]

PF_DEGs_Induced_Counts = PF_DEGs_Induced.groupby('Time').size().reset_index(name='Induced')
PF_Induced_DEGs_list = PF_DEGs_Induced['Gene'].drop_duplicates(keep='first').sort_values()
PF_Induced_DEGs_list.to_csv('./Results/04b_All_DEGs/PF_Induced.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced in All 7 time points
############################
PF_Induced_All_counts = PF_DEGs_Induced['Gene'].value_counts()
PF_Induced_All_Results = PF_Induced_All_counts[PF_Induced_All_counts == 7]
PF_Induced_All_Results_List = pd.DataFrame(sorted(PF_Induced_All_Results.reset_index()['Gene']))
PF_Induced_All_Results_List.to_csv('./Results/04b_All_DEGs/PF_Induced_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed Only
############################
PF_DEGs_Repressed = Deseq2_Master[(Deseq2_Master['Celltype'] == 'PF') &
                               (Deseq2_Master['Fold-Change'] <= 1/1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]                                                                      

PF_DEGs_Repressed_Counts = PF_DEGs_Repressed.groupby('Time').size().reset_index(name='Repressed')   
PF_DEGs_Repressed_list = PF_DEGs_Repressed['Gene'].drop_duplicates(keep='first').sort_values()
PF_DEGs_Repressed_list.to_csv('./Results/04b_All_DEGs/PF_Repressed.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed in All 7 time points
############################
PF_Repressed_All_counts = PF_DEGs_Repressed['Gene'].value_counts()
PF_Repressed_All_Results = PF_Repressed_All_counts[PF_Repressed_All_counts == 7]
PF_Repressed_All_Results_List = pd.DataFrame(sorted(PF_Repressed_All_Results.reset_index()['Gene']))
PF_Repressed_All_Results_List.to_csv('./Results/04b_All_DEGs/PF_Repressed_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)



############################
## Make All DEG count Table
############################
PF_Counts = pd.concat([PF_DEGs_Induced_Counts, PF_DEGs_Repressed_Counts], axis=1)
PF_Counts = PF_Counts[['Time','Induced', 'Repressed']]


############################
#All Genes in Celltype(Background)
############################
PF_All_Genes = Deseq2_Master[(Deseq2_Master['Celltype'] == 'PF')]

PF_All_All_Genes = pd.DataFrame(PF_All_Genes['Gene'].drop_duplicates(keep='first').tolist())
PF_All_All_Genes.to_csv('./Results/04b_All_Genes_In_Celltype/PF_All_Genes.txt', sep='\t', index=False, header=False)



print("PF")
print("----------------------------")
print("Induced in all time points:", len(PF_Induced_All_Results))
print()
print("Repressed in all time points:", len(PF_Repressed_All_Results))
print()
print("Total number of DEGs:", len(PF_DEGs_All_Unique_List))
print("--- Induced:", len(PF_Induced_DEGs_list))
print("--- Repressed:", len(PF_DEGs_Repressed_list))
print()
print("All Genes in Celltype:",len(PF_All_All_Genes))
print()
print(PF_Counts)

PF
----------------------------
Induced in all time points: 1

Repressed in all time points: 0

Total number of DEGs: 33
--- Induced: 30
--- Repressed: 3

All Genes in Celltype: 6374

  Time Time  Induced  Repressed
0    2    2       10          0
1    4    4       18          2
2    8    8        4          1
3   12   12        2          0
4   18   18        4          0
5   24   24        7          0
6   72   72        1          0


In [12]:
##############
# All DEGs
##############
Cholangiocyte_DEGs_All_Unique = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Cholangiocyte') &
                                           ((Deseq2_Master['Fold-Change'] >= 1.5) | (Deseq2_Master['Fold-Change'] <= 1/1.5)) &
                                           (Deseq2_Master['padj'] <= 0.05)]

Cholangiocyte_DEGs_All_Unique_List = Cholangiocyte_DEGs_All_Unique[['Gene']].drop_duplicates(keep='first').copy()
Cholangiocyte_DEGs_All_Unique_List.sort_values(by='Gene', inplace=True)
Cholangiocyte_DEGs_All_Unique_List.to_csv('./Results/04b_All_DEGs/Cholangiocyte.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced Only
############################
Cholangiocyte_DEGs_Induced = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Cholangiocyte') &
                               (Deseq2_Master['Fold-Change'] >= 1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]

Cholangiocyte_DEGs_Induced_Counts = Cholangiocyte_DEGs_Induced.groupby('Time').size().reset_index(name='Induced')
Cholangiocyte_Induced_DEGs_list = Cholangiocyte_DEGs_Induced['Gene'].drop_duplicates(keep='first').sort_values()
Cholangiocyte_Induced_DEGs_list.to_csv('./Results/04b_All_DEGs/Cholangiocyte_Induced.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced in All 7 time points
############################
Cholangiocyte_Induced_All_counts = Cholangiocyte_DEGs_Induced['Gene'].value_counts()
Cholangiocyte_Induced_All_Results = Cholangiocyte_Induced_All_counts[Cholangiocyte_Induced_All_counts == 7]
Cholangiocyte_Induced_All_Results_List = pd.DataFrame(sorted(Cholangiocyte_Induced_All_Results.reset_index()['Gene']))
Cholangiocyte_Induced_All_Results_List.to_csv('./Results/04b_All_DEGs/Cholangiocyte_Induced_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed Only
############################
Cholangiocyte_DEGs_Repressed = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Cholangiocyte') &
                               (Deseq2_Master['Fold-Change'] <= 1/1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]                                                                      

Cholangiocyte_DEGs_Repressed_Counts = Cholangiocyte_DEGs_Repressed.groupby('Time').size().reset_index(name='Repressed')   
Cholangiocyte_DEGs_Repressed_list = Cholangiocyte_DEGs_Repressed['Gene'].drop_duplicates(keep='first').sort_values()
Cholangiocyte_DEGs_Repressed_list.to_csv('./Results/04b_All_DEGs/Cholangiocyte_Repressed.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed in All 7 time points
############################
Cholangiocyte_Repressed_All_counts = Cholangiocyte_DEGs_Repressed['Gene'].value_counts()
Cholangiocyte_Repressed_All_Results = Cholangiocyte_Repressed_All_counts[Cholangiocyte_Repressed_All_counts == 7]
Cholangiocyte_Repressed_All_Results_List = pd.DataFrame(sorted(Cholangiocyte_Repressed_All_Results.reset_index()['Gene']))
Cholangiocyte_Repressed_All_Results_List.to_csv('./Results/04b_All_DEGs/Cholangiocyte_Repressed_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)



############################
## Make All DEG count Table
############################
Cholangiocyte_Counts = pd.concat([Cholangiocyte_DEGs_Induced_Counts, Cholangiocyte_DEGs_Repressed_Counts], axis=1)
Cholangiocyte_Counts = Cholangiocyte_Counts[['Time','Induced', 'Repressed']]


############################
#All Genes in Celltype(Background)
############################
Cholangiocyte_All_Genes = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Cholangiocyte')]

Cholangiocyte_All_All_Genes = pd.DataFrame(Cholangiocyte_All_Genes['Gene'].drop_duplicates(keep='first').tolist())
Cholangiocyte_All_All_Genes.to_csv('./Results/04b_All_Genes_In_Celltype/Cholangiocyte_All_Genes.txt', sep='\t', index=False, header=False)



print("Cholangiocyte")
print("----------------------------")
print("Induced in all time points:", len(Cholangiocyte_Induced_All_Results))
print()
print("Repressed in all time points:", len(Cholangiocyte_Repressed_All_Results))
print()
print("Total number of DEGs:", len(Cholangiocyte_DEGs_All_Unique_List))
print("--- Induced:", len(Cholangiocyte_Induced_DEGs_list))
print("--- Repressed:", len(Cholangiocyte_DEGs_Repressed_list))
print()
print("All Genes in Celltype:",len(Cholangiocyte_All_All_Genes))
print()
print(Cholangiocyte_Counts)

Cholangiocyte
----------------------------
Induced in all time points: 0

Repressed in all time points: 0

Total number of DEGs: 14
--- Induced: 12
--- Repressed: 2

All Genes in Celltype: 5574

  Time Time  Induced  Repressed
0    2    2        1          0
1    4    4       10          2
2    8    8        0          0
3   12   12        3          0
4   18   18        5          0
5   24   24        1          0
6   72   72        2          0


In [13]:
##############
# All DEGs
##############
pDC_DEGs_All_Unique = Deseq2_Master[(Deseq2_Master['Celltype'] == 'pDC') &
                                           ((Deseq2_Master['Fold-Change'] >= 1.5) | (Deseq2_Master['Fold-Change'] <= 1/1.5)) &
                                           (Deseq2_Master['padj'] <= 0.05)]

pDC_DEGs_All_Unique_List = pDC_DEGs_All_Unique[['Gene']].drop_duplicates(keep='first').copy()
pDC_DEGs_All_Unique_List.sort_values(by='Gene', inplace=True)
pDC_DEGs_All_Unique_List.to_csv('./Results/04b_All_DEGs/pDC.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced Only
############################
pDC_DEGs_Induced = Deseq2_Master[(Deseq2_Master['Celltype'] == 'pDC') &
                               (Deseq2_Master['Fold-Change'] >= 1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]

pDC_DEGs_Induced_Counts = pDC_DEGs_Induced.groupby('Time').size().reset_index(name='Induced')
pDC_Induced_DEGs_list = pDC_DEGs_Induced['Gene'].drop_duplicates(keep='first').sort_values()
pDC_Induced_DEGs_list.to_csv('./Results/04b_All_DEGs/pDC_Induced.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced in All 7 time points
############################
pDC_Induced_All_counts = pDC_DEGs_Induced['Gene'].value_counts()
pDC_Induced_All_Results = pDC_Induced_All_counts[pDC_Induced_All_counts == 7]
pDC_Induced_All_Results_List = pd.DataFrame(sorted(pDC_Induced_All_Results.reset_index()['Gene']))
pDC_Induced_All_Results_List.to_csv('./Results/04b_All_DEGs/pDC_Induced_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed Only
############################
pDC_DEGs_Repressed = Deseq2_Master[(Deseq2_Master['Celltype'] == 'pDC') &
                               (Deseq2_Master['Fold-Change'] <= 1/1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]                                                                      

pDC_DEGs_Repressed_Counts = pDC_DEGs_Repressed.groupby('Time').size().reset_index(name='Repressed')   
pDC_DEGs_Repressed_list = pDC_DEGs_Repressed['Gene'].drop_duplicates(keep='first').sort_values()
pDC_DEGs_Repressed_list.to_csv('./Results/04b_All_DEGs/pDC_Repressed.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed in All 7 time points
############################
pDC_Repressed_All_counts = pDC_DEGs_Repressed['Gene'].value_counts()
pDC_Repressed_All_Results = pDC_Repressed_All_counts[pDC_Repressed_All_counts == 7]
pDC_Repressed_All_Results_List = pd.DataFrame(sorted(pDC_Repressed_All_Results.reset_index()['Gene']))
pDC_Repressed_All_Results_List.to_csv('./Results/04b_All_DEGs/pDC_Repressed_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)



############################
## Make All DEG count Table
############################
pDC_Counts = pd.concat([pDC_DEGs_Induced_Counts, pDC_DEGs_Repressed_Counts], axis=1)
pDC_Counts = pDC_Counts[['Time','Induced', 'Repressed']]


############################
#All Genes in Celltype(Background)
############################
pDC_All_Genes = Deseq2_Master[(Deseq2_Master['Celltype'] == 'pDC')]

pDC_All_All_Genes = pd.DataFrame(pDC_All_Genes['Gene'].drop_duplicates(keep='first').tolist())
pDC_All_All_Genes.to_csv('./Results/04b_All_Genes_In_Celltype/pDC_All_Genes.txt', sep='\t', index=False, header=False)



print("pDC")
print("----------------------------")
print("Induced in all time points:", len(pDC_Induced_All_Results))
print()
print("Repressed in all time points:", len(pDC_Repressed_All_Results))
print()
print("Total number of DEGs:", len(pDC_DEGs_All_Unique_List))
print("--- Induced:", len(pDC_Induced_DEGs_list))
print("--- Repressed:", len(pDC_DEGs_Repressed_list))
print()
print("All Genes in Celltype:",len(pDC_All_All_Genes))
print()
print(pDC_Counts)

pDC
----------------------------
Induced in all time points: 0

Repressed in all time points: 0

Total number of DEGs: 5
--- Induced: 2
--- Repressed: 3

All Genes in Celltype: 3049

  Time Time  Induced  Repressed
0    2    2        0          0
1    4    4        1          0
2    8    8        1          0
3   12   12        1          3
4   18   18        1          0
5   24   24        0          0
6   72   72        0          0


In [14]:
##############
# All DEGs
##############
Neutrophil_DEGs_All_Unique = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Neutrophil') &
                                           ((Deseq2_Master['Fold-Change'] >= 1.5) | (Deseq2_Master['Fold-Change'] <= 1/1.5)) &
                                           (Deseq2_Master['padj'] <= 0.05)]

Neutrophil_DEGs_All_Unique_List = Neutrophil_DEGs_All_Unique[['Gene']].drop_duplicates(keep='first').copy()
Neutrophil_DEGs_All_Unique_List.sort_values(by='Gene', inplace=True)
Neutrophil_DEGs_All_Unique_List.to_csv('./Results/04b_All_DEGs/Neutrophil.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced Only
############################
Neutrophil_DEGs_Induced = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Neutrophil') &
                               (Deseq2_Master['Fold-Change'] >= 1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]

Neutrophil_DEGs_Induced_Counts = Neutrophil_DEGs_Induced.groupby('Time').size().reset_index(name='Induced')
Neutrophil_Induced_DEGs_list = Neutrophil_DEGs_Induced['Gene'].drop_duplicates(keep='first').sort_values()
Neutrophil_Induced_DEGs_list.to_csv('./Results/04b_All_DEGs/Neutrophil_Induced.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Induced in All 7 time points
############################
Neutrophil_Induced_All_counts = Neutrophil_DEGs_Induced['Gene'].value_counts()
Neutrophil_Induced_All_Results = Neutrophil_Induced_All_counts[Neutrophil_Induced_All_counts == 7]
Neutrophil_Induced_All_Results_List = pd.DataFrame(sorted(Neutrophil_Induced_All_Results.reset_index()['Gene']))
Neutrophil_Induced_All_Results_List.to_csv('./Results/04b_All_DEGs/Neutrophil_Induced_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed Only
############################
Neutrophil_DEGs_Repressed = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Neutrophil') &
                               (Deseq2_Master['Fold-Change'] <= 1/1.5) &
                               (Deseq2_Master['padj'] <= 0.05)]                                                                      

Neutrophil_DEGs_Repressed_Counts = Neutrophil_DEGs_Repressed.groupby('Time').size().reset_index(name='Repressed')   
Neutrophil_DEGs_Repressed_list = Neutrophil_DEGs_Repressed['Gene'].drop_duplicates(keep='first').sort_values()
Neutrophil_DEGs_Repressed_list.to_csv('./Results/04b_All_DEGs/Neutrophil_Repressed.txt', sep='\t', index=False, header=False)


############################
## All DEGs - Repressed in All 7 time points
############################
Neutrophil_Repressed_All_counts = Neutrophil_DEGs_Repressed['Gene'].value_counts()
Neutrophil_Repressed_All_Results = Neutrophil_Repressed_All_counts[Neutrophil_Repressed_All_counts == 7]
Neutrophil_Repressed_All_Results_List = pd.DataFrame(sorted(Neutrophil_Repressed_All_Results.reset_index()['Gene']))
Neutrophil_Repressed_All_Results_List.to_csv('./Results/04b_All_DEGs/Neutrophil_Repressed_In_All_7_Timepoints.txt', sep='\t', index=False, header=False)



############################
## Make All DEG count Table
############################
Neutrophil_Counts = pd.concat([Neutrophil_DEGs_Induced_Counts, Neutrophil_DEGs_Repressed_Counts], axis=1)
Neutrophil_Counts = Neutrophil_Counts[['Time','Induced', 'Repressed']]


############################
#All Genes in Celltype(Background)
############################
Neutrophil_All_Genes = Deseq2_Master[(Deseq2_Master['Celltype'] == 'Neutrophil')]

Neutrophil_All_All_Genes = pd.DataFrame(Neutrophil_All_Genes['Gene'].drop_duplicates(keep='first').tolist())
Neutrophil_All_All_Genes.to_csv('./Results/04b_All_Genes_In_Celltype/Neutrophil_All_Genes.txt', sep='\t', index=False, header=False)



print("Neutrophil")
print("----------------------------")
print("Induced in all time points:", len(Neutrophil_Induced_All_Results))
print()
print("Repressed in all time points:", len(Neutrophil_Repressed_All_Results))
print()
print("Total number of DEGs:", len(Neutrophil_DEGs_All_Unique_List))
print("--- Induced:", len(Neutrophil_Induced_DEGs_list))
print("--- Repressed:", len(Neutrophil_DEGs_Repressed_list))
print()
print("All Genes in Celltype:",len(Neutrophil_All_All_Genes))
print()
print(Neutrophil_Counts)

Neutrophil
----------------------------
Induced in all time points: 0

Repressed in all time points: 0

Total number of DEGs: 0
--- Induced: 0
--- Repressed: 0

All Genes in Celltype: 1649

  Time Time  Induced  Repressed
0    2    2        0          0
1    4    4        0          0
2    8    8        0          0
3   12   12        0          0
4   18   18        0          0
5   24   24        0          0
6   72   72        0          0
