# Determine DEGs in Deseq2 Data

### 1. Import Required Packages
### 2. Import Deseq2 Data
### 3. Import DRE and AHR Chip Data


## <br> 1. Import Required Packages

In [1]:
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import seaborn as sns

## <br> 2. Import Deseq2 Data

In [2]:
# Load the tab-separated DESeq2 results table; the file's first column becomes the index.
Deseq2_Master = pd.read_csv('./Results/Deseq2_Master_Wald.txt', sep='\t', index_col=0)

# Store Time as a categorical whose categories are listed in this explicit order.
Deseq2_Master['Time'] = (
    Deseq2_Master['Time']
    .astype('category')
    .cat.reorder_categories([2, 4, 8, 12, 18, 24, 72])
)

# Largest fold-change first.
Deseq2_Master = Deseq2_Master.sort_values(by='Fold-Change', ascending=False)

Deseq2_Master

Unnamed: 0,Gene,baseMean,log2FoldChange,lfcSE,stat,pvalue,padj,Celltype,Time,Fold-Change
136318,H19,11.489521,26.047240,7.733220,3.368227,,,Hepatocyte,4,6.934266e+07
151979,Xlr4a,11.669872,19.768937,2.478349,7.976657,1.503501e-15,9.393988e-13,Hepatocyte,8,8.933937e+05
119068,H19,11.489521,14.665253,7.759227,1.890041,,,Hepatocyte,2,2.598251e+04
194509,Ahrr,727.122219,12.474705,1.214853,10.268490,9.772195e-25,1.443175e-21,Hepatocyte,24,5.691943e+03
132154,Ecel1,53.945408,12.276662,1.283328,9.566272,1.108296e-21,4.806595e-19,Hepatocyte,4,4.961847e+03
...,...,...,...,...,...,...,...,...,...,...
134791,Ugt2b38,9.733622,-7.592916,2.388217,-3.179324,1.476191e-03,1.644815e-02,Hepatocyte,4,5.179700e-03
168588,Gm32468,17.316963,-7.881576,2.381834,-3.309036,9.361779e-04,1.379215e-02,Hepatocyte,12,4.240424e-03
134312,Gm45282,14.413738,-7.998759,1.412182,-5.664112,1.477876e-08,1.120933e-06,Hepatocyte,4,3.909610e-03
283399,Cxcl10,4.489016,-17.397751,2.027937,-8.579041,9.566707e-18,,HSC,18,5.791019e-06


## <br> 3. Import DRE and AHR Chip Data

In [3]:
# Tab-separated table with one row per gene and a DRE flag column.
pDREs_Master = pd.read_csv('./Data/pDREs.txt', sep='\t')

pDREs_Master

Unnamed: 0,Gene,DRE
0,Xkr4,1
1,Rp1,1
2,Mrpl15,1
3,Lypla1,1
4,Tcea1,1
...,...,...
16811,Gm21704,1
16812,Gm21708,1
16813,Gm20857,1
16814,Gm20858,1


In [4]:
# Tab-separated table with one row per gene and an AhR flag column.
AHR_Master = pd.read_csv('./Data/AHR.txt', sep='\t')

AHR_Master

Unnamed: 0,Gene,AhR
0,Marchf2,1
1,Marchf4,1
2,Marchf10,1
3,Marchf11,1
4,Septin2,1
...,...,...
6624,Zw10,1
6625,Zwint,1
6626,Zyg11a,1
6627,Zyg11b,1


## <br> 4. Determine DEGs for Each Celltype (All Time Points Combined)

In [5]:
# Hepatocyte rows that pass the significance cut-off (padj <= 0.05) and change
# by at least 1.5-fold in either direction. Rows with a missing padj fail the
# comparison and are therefore excluded.
Hepatocyte_DEGs_All_Unique = Deseq2_Master.loc[
    Deseq2_Master['Celltype'].eq('Hepatocyte')
    & Deseq2_Master['padj'].le(0.05)
    & (Deseq2_Master['Fold-Change'].ge(1.5) | Deseq2_Master['Fold-Change'].le(1/1.5))
]

# One row per gene: keep the first occurrence in the current row order.
Hepatocyte_DEGs_All_Unique_List = (
    Hepatocyte_DEGs_All_Unique
    .drop_duplicates(subset='Gene', keep='first')[['Gene']]
    .copy()
)


In [6]:
# Rows labelled 'EC' that pass the significance cut-off (padj <= 0.05) and
# change by at least 1.5-fold in either direction. Rows with a missing padj
# fail the comparison and are therefore excluded.
LSEC_DEGs_All_Unique = Deseq2_Master.loc[
    Deseq2_Master['Celltype'].eq('EC')
    & Deseq2_Master['padj'].le(0.05)
    & (Deseq2_Master['Fold-Change'].ge(1.5) | Deseq2_Master['Fold-Change'].le(1/1.5))
]

# One row per gene: keep the first occurrence in the current row order.
LSEC_DEGs_All_Unique_List = (
    LSEC_DEGs_All_Unique
    .drop_duplicates(subset='Gene', keep='first')[['Gene']]
    .copy()
)


In [7]:
# HSC rows that pass the significance cut-off (padj <= 0.05) and change by at
# least 1.5-fold in either direction. Rows with a missing padj fail the
# comparison and are therefore excluded.
HSC_DEGs_All_Unique = Deseq2_Master.loc[
    Deseq2_Master['Celltype'].eq('HSC')
    & Deseq2_Master['padj'].le(0.05)
    & (Deseq2_Master['Fold-Change'].ge(1.5) | Deseq2_Master['Fold-Change'].le(1/1.5))
]

# One row per gene: keep the first occurrence in the current row order.
HSC_DEGs_All_Unique_List = (
    HSC_DEGs_All_Unique
    .drop_duplicates(subset='Gene', keep='first')[['Gene']]
    .copy()
)


In [8]:
# Macrophage rows that pass the significance cut-off (padj <= 0.05) and change
# by at least 1.5-fold in either direction. Rows with a missing padj fail the
# comparison and are therefore excluded.
Macrophage_DEGs_All_Unique = Deseq2_Master.loc[
    Deseq2_Master['Celltype'].eq('Macrophage')
    & Deseq2_Master['padj'].le(0.05)
    & (Deseq2_Master['Fold-Change'].ge(1.5) | Deseq2_Master['Fold-Change'].le(1/1.5))
]

# One row per gene: keep the first occurrence in the current row order.
Macrophage_DEGs_All_Unique_List = (
    Macrophage_DEGs_All_Unique
    .drop_duplicates(subset='Gene', keep='first')[['Gene']]
    .copy()
)


In [9]:
# B_Cell rows that pass the significance cut-off (padj <= 0.05) and change by
# at least 1.5-fold in either direction. Rows with a missing padj fail the
# comparison and are therefore excluded.
B_Cell_DEGs_All_Unique = Deseq2_Master.loc[
    Deseq2_Master['Celltype'].eq('B_Cell')
    & Deseq2_Master['padj'].le(0.05)
    & (Deseq2_Master['Fold-Change'].ge(1.5) | Deseq2_Master['Fold-Change'].le(1/1.5))
]

# One row per gene: keep the first occurrence in the current row order.
B_Cell_DEGs_All_Unique_List = (
    B_Cell_DEGs_All_Unique
    .drop_duplicates(subset='Gene', keep='first')[['Gene']]
    .copy()
)


In [10]:
# T_Cell rows that pass the significance cut-off (padj <= 0.05) and change by
# at least 1.5-fold in either direction. Rows with a missing padj fail the
# comparison and are therefore excluded.
T_Cell_DEGs_All_Unique = Deseq2_Master.loc[
    Deseq2_Master['Celltype'].eq('T_Cell')
    & Deseq2_Master['padj'].le(0.05)
    & (Deseq2_Master['Fold-Change'].ge(1.5) | Deseq2_Master['Fold-Change'].le(1/1.5))
]

# One row per gene: keep the first occurrence in the current row order.
T_Cell_DEGs_All_Unique_List = (
    T_Cell_DEGs_All_Unique
    .drop_duplicates(subset='Gene', keep='first')[['Gene']]
    .copy()
)


In [11]:
# PF rows that pass the significance cut-off (padj <= 0.05) and change by at
# least 1.5-fold in either direction. Rows with a missing padj fail the
# comparison and are therefore excluded.
PF_DEGs_All_Unique = Deseq2_Master.loc[
    Deseq2_Master['Celltype'].eq('PF')
    & Deseq2_Master['padj'].le(0.05)
    & (Deseq2_Master['Fold-Change'].ge(1.5) | Deseq2_Master['Fold-Change'].le(1/1.5))
]

# One row per gene: keep the first occurrence in the current row order.
PF_DEGs_All_Unique_List = (
    PF_DEGs_All_Unique
    .drop_duplicates(subset='Gene', keep='first')[['Gene']]
    .copy()
)


In [12]:
# Cholangiocyte rows that pass the significance cut-off (padj <= 0.05) and
# change by at least 1.5-fold in either direction. Rows with a missing padj
# fail the comparison and are therefore excluded.
Cholangiocyte_DEGs_All_Unique = Deseq2_Master.loc[
    Deseq2_Master['Celltype'].eq('Cholangiocyte')
    & Deseq2_Master['padj'].le(0.05)
    & (Deseq2_Master['Fold-Change'].ge(1.5) | Deseq2_Master['Fold-Change'].le(1/1.5))
]

# One row per gene: keep the first occurrence in the current row order.
Cholangiocyte_DEGs_All_Unique_List = (
    Cholangiocyte_DEGs_All_Unique
    .drop_duplicates(subset='Gene', keep='first')[['Gene']]
    .copy()
)


In [13]:
# pDC rows that pass the significance cut-off (padj <= 0.05) and change by at
# least 1.5-fold in either direction. Rows with a missing padj fail the
# comparison and are therefore excluded.
pDC_DEGs_All_Unique = Deseq2_Master.loc[
    Deseq2_Master['Celltype'].eq('pDC')
    & Deseq2_Master['padj'].le(0.05)
    & (Deseq2_Master['Fold-Change'].ge(1.5) | Deseq2_Master['Fold-Change'].le(1/1.5))
]

# One row per gene: keep the first occurrence in the current row order.
pDC_DEGs_All_Unique_List = (
    pDC_DEGs_All_Unique
    .drop_duplicates(subset='Gene', keep='first')[['Gene']]
    .copy()
)


In [14]:
# Neutrophil rows that pass the significance cut-off (padj <= 0.05) and change
# by at least 1.5-fold in either direction. Rows with a missing padj fail the
# comparison and are therefore excluded.
Neutrophil_DEGs_All_Unique = Deseq2_Master.loc[
    Deseq2_Master['Celltype'].eq('Neutrophil')
    & Deseq2_Master['padj'].le(0.05)
    & (Deseq2_Master['Fold-Change'].ge(1.5) | Deseq2_Master['Fold-Change'].le(1/1.5))
]

# One row per gene: keep the first occurrence in the current row order.
Neutrophil_DEGs_All_Unique_List = (
    Neutrophil_DEGs_All_Unique
    .drop_duplicates(subset='Gene', keep='first')[['Gene']]
    .copy()
)


## <br> 5. Find Unique DEGs to Each Celltype

In [15]:
# Genes that are DEGs in Hepatocyte and in none of the other nine cell types.
# The other lists are pooled so a single membership test replaces nine
# sequential filters; a gene is removed if it appears in any of them.
filtered_df = Hepatocyte_DEGs_All_Unique_List.copy()
filtered_df = filtered_df[~filtered_df['Gene'].isin(pd.concat([
    LSEC_DEGs_All_Unique_List['Gene'],
    HSC_DEGs_All_Unique_List['Gene'],
    Macrophage_DEGs_All_Unique_List['Gene'],
    B_Cell_DEGs_All_Unique_List['Gene'],
    T_Cell_DEGs_All_Unique_List['Gene'],
    PF_DEGs_All_Unique_List['Gene'],
    Cholangiocyte_DEGs_All_Unique_List['Gene'],
    Neutrophil_DEGs_All_Unique_List['Gene'],
    pDC_DEGs_All_Unique_List['Gene'],
]))]

filtered_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs/Unique_to_Hepatocyte.txt', sep='\t', index=False, header=False)

# Subset of the unique genes that are listed in pDREs_Master. A membership
# filter is used instead of an inner merge so that a gene listed more than once
# in the annotation table cannot be written twice or inflate the printed count.
merged_df = filtered_df[filtered_df['Gene'].isin(pDREs_Master['Gene'])].reset_index(drop=True)
merged_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_DREs/Unique_with_DREs_to_Hepatocyte.txt', sep='\t', index=False, header=False)

# Same membership filter against the genes listed in AHR_Master.
merged_df2 = filtered_df[filtered_df['Gene'].isin(AHR_Master['Gene'])].reset_index(drop=True)
merged_df2.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_AHR/Unique_with_AHR_Binding_to_Hepatocyte.txt', sep='\t', index=False, header=False)


print("Hepatocyte")
print("----------------------------")
print("All DEGs:", len(Hepatocyte_DEGs_All_Unique_List))
print()
print("Unique DEGs:", len(filtered_df))
print()
print("Unique DEGs with DRE:", len(merged_df))
print()
print("Unique DEGs with AHR Binding:", len(merged_df2))
print()

Hepatocyte
----------------------------
All DEGs: 4785

Unique DEGs: 4071

Unique DEGs with DRE: 2916

Unique DEGs with AHR Binding: 1550



In [16]:
# Display whatever `filtered_df` currently holds. When the notebook is run top
# to bottom this is the Hepatocyte-unique gene list from the preceding cell;
# later cells reassign the same name.
filtered_df

Unnamed: 0,Gene
151979,Xlr4a
132154,Ecel1
164262,Nptx1
220393,4930503O07Rik
134423,Smcp
...,...
168033,2310034O05Rik
132513,Sult3a1
170400,Sult2a4
134791,Ugt2b38


In [17]:
# Genes that are DEGs in EC (LSEC) and in none of the other nine cell types.
# The other lists are pooled so a single membership test replaces nine
# sequential filters; a gene is removed if it appears in any of them.
filtered_df = LSEC_DEGs_All_Unique_List.copy()
filtered_df = filtered_df[~filtered_df['Gene'].isin(pd.concat([
    Hepatocyte_DEGs_All_Unique_List['Gene'],
    HSC_DEGs_All_Unique_List['Gene'],
    Macrophage_DEGs_All_Unique_List['Gene'],
    B_Cell_DEGs_All_Unique_List['Gene'],
    T_Cell_DEGs_All_Unique_List['Gene'],
    PF_DEGs_All_Unique_List['Gene'],
    Cholangiocyte_DEGs_All_Unique_List['Gene'],
    Neutrophil_DEGs_All_Unique_List['Gene'],
    pDC_DEGs_All_Unique_List['Gene'],
]))]

filtered_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs/Unique_to_EC.txt', sep='\t', index=False, header=False)

# Subset of the unique genes that are listed in pDREs_Master. A membership
# filter is used instead of an inner merge so that a gene listed more than once
# in the annotation table cannot be written twice or inflate the printed count.
merged_df = filtered_df[filtered_df['Gene'].isin(pDREs_Master['Gene'])].reset_index(drop=True)
merged_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_DREs/Unique_with_DREs_to_EC.txt', sep='\t', index=False, header=False)

# Same membership filter against the genes listed in AHR_Master.
merged_df2 = filtered_df[filtered_df['Gene'].isin(AHR_Master['Gene'])].reset_index(drop=True)
merged_df2.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_AHR/Unique_with_AHR_Binding_to_EC.txt', sep='\t', index=False, header=False)


print("EC")
print("----------------------------")
print("All DEGs:", len(LSEC_DEGs_All_Unique_List))
print()
print("Unique DEGs:", len(filtered_df))
print()
print("Unique DEGs with DRE:", len(merged_df))
print()
print("Unique DEGs with AHR Binding:", len(merged_df2))
print()

EC
----------------------------
All DEGs: 710

Unique DEGs: 226

Unique DEGs with DRE: 183

Unique DEGs with AHR Binding: 102



In [18]:
# Genes that are DEGs in HSC and in none of the other nine cell types.
# The other lists are pooled so a single membership test replaces nine
# sequential filters; a gene is removed if it appears in any of them.
filtered_df = HSC_DEGs_All_Unique_List.copy()
filtered_df = filtered_df[~filtered_df['Gene'].isin(pd.concat([
    Hepatocyte_DEGs_All_Unique_List['Gene'],
    LSEC_DEGs_All_Unique_List['Gene'],
    Macrophage_DEGs_All_Unique_List['Gene'],
    B_Cell_DEGs_All_Unique_List['Gene'],
    T_Cell_DEGs_All_Unique_List['Gene'],
    PF_DEGs_All_Unique_List['Gene'],
    Cholangiocyte_DEGs_All_Unique_List['Gene'],
    Neutrophil_DEGs_All_Unique_List['Gene'],
    pDC_DEGs_All_Unique_List['Gene'],
]))]

filtered_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs/Unique_to_HSC.txt', sep='\t', index=False, header=False)

# Subset of the unique genes that are listed in pDREs_Master. A membership
# filter is used instead of an inner merge so that a gene listed more than once
# in the annotation table cannot be written twice or inflate the printed count.
merged_df = filtered_df[filtered_df['Gene'].isin(pDREs_Master['Gene'])].reset_index(drop=True)
merged_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_DREs/Unique_with_DREs_to_HSC.txt', sep='\t', index=False, header=False)

# Same membership filter against the genes listed in AHR_Master.
merged_df2 = filtered_df[filtered_df['Gene'].isin(AHR_Master['Gene'])].reset_index(drop=True)
merged_df2.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_AHR/Unique_with_AHR_Binding_to_HSC.txt', sep='\t', index=False, header=False)


print("HSC")
print("----------------------------")
print("All DEGs:", len(HSC_DEGs_All_Unique_List))
print()
print("Unique DEGs:", len(filtered_df))
print()
print("Unique DEGs with DRE:", len(merged_df))
print()
print("Unique DEGs with AHR Binding:", len(merged_df2))
print()

HSC
----------------------------
All DEGs: 373

Unique DEGs: 86

Unique DEGs with DRE: 79

Unique DEGs with AHR Binding: 40



In [19]:
# Genes that are DEGs in Macrophage and in none of the other nine cell types.
# The other lists are pooled so a single membership test replaces nine
# sequential filters; a gene is removed if it appears in any of them.
filtered_df = Macrophage_DEGs_All_Unique_List.copy()
filtered_df = filtered_df[~filtered_df['Gene'].isin(pd.concat([
    Hepatocyte_DEGs_All_Unique_List['Gene'],
    LSEC_DEGs_All_Unique_List['Gene'],
    HSC_DEGs_All_Unique_List['Gene'],
    B_Cell_DEGs_All_Unique_List['Gene'],
    T_Cell_DEGs_All_Unique_List['Gene'],
    PF_DEGs_All_Unique_List['Gene'],
    Cholangiocyte_DEGs_All_Unique_List['Gene'],
    Neutrophil_DEGs_All_Unique_List['Gene'],
    pDC_DEGs_All_Unique_List['Gene'],
]))]

filtered_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs/Unique_to_Macrophage.txt', sep='\t', index=False, header=False)

# Subset of the unique genes that are listed in pDREs_Master. A membership
# filter is used instead of an inner merge so that a gene listed more than once
# in the annotation table cannot be written twice or inflate the printed count.
merged_df = filtered_df[filtered_df['Gene'].isin(pDREs_Master['Gene'])].reset_index(drop=True)
merged_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_DREs/Unique_with_DREs_to_Macrophage.txt', sep='\t', index=False, header=False)

# Same membership filter against the genes listed in AHR_Master.
merged_df2 = filtered_df[filtered_df['Gene'].isin(AHR_Master['Gene'])].reset_index(drop=True)
merged_df2.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_AHR/Unique_with_AHR_Binding_to_Macrophage.txt', sep='\t', index=False, header=False)


print("Macrophage")
print("----------------------------")
print("All DEGs:", len(Macrophage_DEGs_All_Unique_List))
print()
print("Unique DEGs:", len(filtered_df))
print()
print("Unique DEGs with DRE:", len(merged_df))
print()
print("Unique DEGs with AHR Binding:", len(merged_df2))
print()

Macrophage
----------------------------
All DEGs: 161

Unique DEGs: 6

Unique DEGs with DRE: 6

Unique DEGs with AHR Binding: 2



In [20]:
# Genes that are DEGs in B_Cell and in none of the other nine cell types.
# The other lists are pooled so a single membership test replaces nine
# sequential filters; a gene is removed if it appears in any of them.
filtered_df = B_Cell_DEGs_All_Unique_List.copy()
filtered_df = filtered_df[~filtered_df['Gene'].isin(pd.concat([
    Hepatocyte_DEGs_All_Unique_List['Gene'],
    LSEC_DEGs_All_Unique_List['Gene'],
    HSC_DEGs_All_Unique_List['Gene'],
    Macrophage_DEGs_All_Unique_List['Gene'],
    T_Cell_DEGs_All_Unique_List['Gene'],
    PF_DEGs_All_Unique_List['Gene'],
    Cholangiocyte_DEGs_All_Unique_List['Gene'],
    Neutrophil_DEGs_All_Unique_List['Gene'],
    pDC_DEGs_All_Unique_List['Gene'],
]))]

filtered_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs/Unique_to_B_Cell.txt', sep='\t', index=False, header=False)

# Subset of the unique genes that are listed in pDREs_Master. A membership
# filter is used instead of an inner merge so that a gene listed more than once
# in the annotation table cannot be written twice or inflate the printed count.
merged_df = filtered_df[filtered_df['Gene'].isin(pDREs_Master['Gene'])].reset_index(drop=True)
merged_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_DREs/Unique_with_DREs_to_B_Cell.txt', sep='\t', index=False, header=False)

# Same membership filter against the genes listed in AHR_Master.
merged_df2 = filtered_df[filtered_df['Gene'].isin(AHR_Master['Gene'])].reset_index(drop=True)
merged_df2.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_AHR/Unique_with_AHR_Binding_to_B_Cell.txt', sep='\t', index=False, header=False)


print("B_Cell")
print("----------------------------")
print("All DEGs:", len(B_Cell_DEGs_All_Unique_List))
print()
print("Unique DEGs:", len(filtered_df))
print()
print("Unique DEGs with DRE:", len(merged_df))
print()
print("Unique DEGs with AHR Binding:", len(merged_df2))
print()

B_Cell
----------------------------
All DEGs: 128

Unique DEGs: 5

Unique DEGs with DRE: 5

Unique DEGs with AHR Binding: 5



In [21]:
# Genes that are DEGs in T_Cell and in none of the other nine cell types.
# The other lists are pooled so a single membership test replaces nine
# sequential filters; a gene is removed if it appears in any of them.
filtered_df = T_Cell_DEGs_All_Unique_List.copy()
filtered_df = filtered_df[~filtered_df['Gene'].isin(pd.concat([
    Hepatocyte_DEGs_All_Unique_List['Gene'],
    LSEC_DEGs_All_Unique_List['Gene'],
    HSC_DEGs_All_Unique_List['Gene'],
    Macrophage_DEGs_All_Unique_List['Gene'],
    B_Cell_DEGs_All_Unique_List['Gene'],
    PF_DEGs_All_Unique_List['Gene'],
    Cholangiocyte_DEGs_All_Unique_List['Gene'],
    Neutrophil_DEGs_All_Unique_List['Gene'],
    pDC_DEGs_All_Unique_List['Gene'],
]))]

filtered_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs/Unique_to_T_Cell.txt', sep='\t', index=False, header=False)

# Subset of the unique genes that are listed in pDREs_Master. A membership
# filter is used instead of an inner merge so that a gene listed more than once
# in the annotation table cannot be written twice or inflate the printed count.
merged_df = filtered_df[filtered_df['Gene'].isin(pDREs_Master['Gene'])].reset_index(drop=True)
merged_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_DREs/Unique_with_DREs_to_T_Cell.txt', sep='\t', index=False, header=False)

# Same membership filter against the genes listed in AHR_Master.
merged_df2 = filtered_df[filtered_df['Gene'].isin(AHR_Master['Gene'])].reset_index(drop=True)
merged_df2.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_AHR/Unique_with_AHR_Binding_to_T_Cell.txt', sep='\t', index=False, header=False)


print("T_Cell")
print("----------------------------")
print("All DEGs:", len(T_Cell_DEGs_All_Unique_List))
print()
print("Unique DEGs:", len(filtered_df))
print()
print("Unique DEGs with DRE:", len(merged_df))
print()
print("Unique DEGs with AHR Binding:", len(merged_df2))
print()

T_Cell
----------------------------
All DEGs: 140

Unique DEGs: 9

Unique DEGs with DRE: 9

Unique DEGs with AHR Binding: 5



In [22]:
# Genes that are DEGs in PF and in none of the other nine cell types.
# The other lists are pooled so a single membership test replaces nine
# sequential filters; a gene is removed if it appears in any of them.
filtered_df = PF_DEGs_All_Unique_List.copy()
filtered_df = filtered_df[~filtered_df['Gene'].isin(pd.concat([
    Hepatocyte_DEGs_All_Unique_List['Gene'],
    LSEC_DEGs_All_Unique_List['Gene'],
    HSC_DEGs_All_Unique_List['Gene'],
    Macrophage_DEGs_All_Unique_List['Gene'],
    B_Cell_DEGs_All_Unique_List['Gene'],
    T_Cell_DEGs_All_Unique_List['Gene'],
    Cholangiocyte_DEGs_All_Unique_List['Gene'],
    Neutrophil_DEGs_All_Unique_List['Gene'],
    pDC_DEGs_All_Unique_List['Gene'],
]))]

filtered_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs/Unique_to_PF.txt', sep='\t', index=False, header=False)

# Subset of the unique genes that are listed in pDREs_Master. A membership
# filter is used instead of an inner merge so that a gene listed more than once
# in the annotation table cannot be written twice or inflate the printed count.
merged_df = filtered_df[filtered_df['Gene'].isin(pDREs_Master['Gene'])].reset_index(drop=True)
merged_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_DREs/Unique_with_DREs_to_PF.txt', sep='\t', index=False, header=False)

# Same membership filter against the genes listed in AHR_Master.
merged_df2 = filtered_df[filtered_df['Gene'].isin(AHR_Master['Gene'])].reset_index(drop=True)
merged_df2.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_AHR/Unique_with_AHR_Binding_to_PF.txt', sep='\t', index=False, header=False)


print("PF")
print("----------------------------")
print("All DEGs:", len(PF_DEGs_All_Unique_List))
print()
print("Unique DEGs:", len(filtered_df))
print()
print("Unique DEGs with DRE:", len(merged_df))
print()
print("Unique DEGs with AHR Binding:", len(merged_df2))
print()

PF
----------------------------
All DEGs: 33

Unique DEGs: 7

Unique DEGs with DRE: 4

Unique DEGs with AHR Binding: 3



In [23]:
# Genes that are DEGs in Cholangiocyte and in none of the other nine cell types.
# The other lists are pooled so a single membership test replaces nine
# sequential filters; a gene is removed if it appears in any of them.
filtered_df = Cholangiocyte_DEGs_All_Unique_List.copy()
filtered_df = filtered_df[~filtered_df['Gene'].isin(pd.concat([
    Hepatocyte_DEGs_All_Unique_List['Gene'],
    LSEC_DEGs_All_Unique_List['Gene'],
    HSC_DEGs_All_Unique_List['Gene'],
    Macrophage_DEGs_All_Unique_List['Gene'],
    B_Cell_DEGs_All_Unique_List['Gene'],
    T_Cell_DEGs_All_Unique_List['Gene'],
    PF_DEGs_All_Unique_List['Gene'],
    Neutrophil_DEGs_All_Unique_List['Gene'],
    pDC_DEGs_All_Unique_List['Gene'],
]))]

filtered_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs/Unique_to_Cholangiocyte.txt', sep='\t', index=False, header=False)

# Subset of the unique genes that are listed in pDREs_Master. A membership
# filter is used instead of an inner merge so that a gene listed more than once
# in the annotation table cannot be written twice or inflate the printed count.
merged_df = filtered_df[filtered_df['Gene'].isin(pDREs_Master['Gene'])].reset_index(drop=True)
merged_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_DREs/Unique_with_DREs_to_Cholangiocyte.txt', sep='\t', index=False, header=False)

# Same membership filter against the genes listed in AHR_Master.
merged_df2 = filtered_df[filtered_df['Gene'].isin(AHR_Master['Gene'])].reset_index(drop=True)
merged_df2.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_AHR/Unique_with_AHR_Binding_to_Cholangiocyte.txt', sep='\t', index=False, header=False)


print("Cholangiocyte")
print("----------------------------")
print("All DEGs:", len(Cholangiocyte_DEGs_All_Unique_List))
print()
print("Unique DEGs:", len(filtered_df))
print()
print("Unique DEGs with DRE:", len(merged_df))
print()
print("Unique DEGs with AHR Binding:", len(merged_df2))
print()

Cholangiocyte
----------------------------
All DEGs: 14

Unique DEGs: 2

Unique DEGs with DRE: 2

Unique DEGs with AHR Binding: 1



In [24]:
# Genes that are DEGs in pDC and in none of the other nine cell types.
# The other lists are pooled so a single membership test replaces nine
# sequential filters; a gene is removed if it appears in any of them.
filtered_df = pDC_DEGs_All_Unique_List.copy()
filtered_df = filtered_df[~filtered_df['Gene'].isin(pd.concat([
    Hepatocyte_DEGs_All_Unique_List['Gene'],
    LSEC_DEGs_All_Unique_List['Gene'],
    HSC_DEGs_All_Unique_List['Gene'],
    Macrophage_DEGs_All_Unique_List['Gene'],
    B_Cell_DEGs_All_Unique_List['Gene'],
    T_Cell_DEGs_All_Unique_List['Gene'],
    PF_DEGs_All_Unique_List['Gene'],
    Cholangiocyte_DEGs_All_Unique_List['Gene'],
    Neutrophil_DEGs_All_Unique_List['Gene'],
]))]

filtered_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs/Unique_to_pDC.txt', sep='\t', index=False, header=False)

# Subset of the unique genes that are listed in pDREs_Master. A membership
# filter is used instead of an inner merge so that a gene listed more than once
# in the annotation table cannot be written twice or inflate the printed count.
merged_df = filtered_df[filtered_df['Gene'].isin(pDREs_Master['Gene'])].reset_index(drop=True)
merged_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_DREs/Unique_with_DREs_to_pDC.txt', sep='\t', index=False, header=False)

# Same membership filter against the genes listed in AHR_Master.
merged_df2 = filtered_df[filtered_df['Gene'].isin(AHR_Master['Gene'])].reset_index(drop=True)
merged_df2.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_AHR/Unique_with_AHR_Binding_to_pDC.txt', sep='\t', index=False, header=False)


print("pDC")
print("----------------------------")
print("All DEGs:", len(pDC_DEGs_All_Unique_List))
print()
print("Unique DEGs:", len(filtered_df))
print()
print("Unique DEGs with DRE:", len(merged_df))
print()
print("Unique DEGs with AHR Binding:", len(merged_df2))
print()

pDC
----------------------------
All DEGs: 5

Unique DEGs: 0

Unique DEGs with DRE: 0

Unique DEGs with AHR Binding: 0



In [25]:
# Genes that are DEGs in Neutrophil and in none of the other nine cell types.
# The other lists are pooled so a single membership test replaces nine
# sequential filters; a gene is removed if it appears in any of them.
filtered_df = Neutrophil_DEGs_All_Unique_List.copy()
filtered_df = filtered_df[~filtered_df['Gene'].isin(pd.concat([
    Hepatocyte_DEGs_All_Unique_List['Gene'],
    LSEC_DEGs_All_Unique_List['Gene'],
    HSC_DEGs_All_Unique_List['Gene'],
    Macrophage_DEGs_All_Unique_List['Gene'],
    B_Cell_DEGs_All_Unique_List['Gene'],
    T_Cell_DEGs_All_Unique_List['Gene'],
    PF_DEGs_All_Unique_List['Gene'],
    Cholangiocyte_DEGs_All_Unique_List['Gene'],
    pDC_DEGs_All_Unique_List['Gene'],
]))]

filtered_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs/Unique_to_Neutrophil.txt', sep='\t', index=False, header=False)

# Subset of the unique genes that are listed in pDREs_Master. A membership
# filter is used instead of an inner merge so that a gene listed more than once
# in the annotation table cannot be written twice or inflate the printed count.
merged_df = filtered_df[filtered_df['Gene'].isin(pDREs_Master['Gene'])].reset_index(drop=True)
merged_df.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_DREs/Unique_with_DREs_to_Neutrophil.txt', sep='\t', index=False, header=False)

# Same membership filter against the genes listed in AHR_Master.
merged_df2 = filtered_df[filtered_df['Gene'].isin(AHR_Master['Gene'])].reset_index(drop=True)
merged_df2.to_csv('./Results/04d_Unique_to_Celltypes_DEGs_with_AHR/Unique_with_AHR_Binding_to_Neutrophil.txt', sep='\t', index=False, header=False)


print("Neutrophil")
print("----------------------------")
print("All DEGs:", len(Neutrophil_DEGs_All_Unique_List))
print()
print("Unique DEGs:", len(filtered_df))
print()
print("Unique DEGs with DRE:", len(merged_df))
print()
print("Unique DEGs with AHR Binding:", len(merged_df2))
print()

Neutrophil
----------------------------
All DEGs: 0

Unique DEGs: 0

Unique DEGs with DRE: 0

Unique DEGs with AHR Binding: 0

