In [None]:
# import library
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

In [None]:
# setting
# Global matplotlib defaults for every figure drawn below:
# sans-serif text resolved to Arial, 18 pt font size, 200 dpi figures.
plt.rcParams.update({
    'font.family': 'sans-serif',
    'font.sans-serif': ['Arial'],
    'font.size': 18,
    "figure.dpi": 200,
})

In [None]:
# data
# Three tab-separated ChIP-seq tables (file names indicate RPKM values).
# The first column of each file becomes the DataFrame index.
file_path1 = "../data/ChIP-seq/ChIP_H3K4me2_H2A.Z_H2Aub_H3K27me3_WT_jmj_clf.rpkm.tsv"
file_path2 = "../data/ChIP-seq/ChIP_H3K4me2_H2A.Z_WT_arp6_pie1.rpkm.tsv"
file_path3 = "../data/ChIP-seq/ChIP_H3K4me2_H2A.Z_H2Aub_WT_bmi1abc.rpkm.tsv"

# Read the tables in order with identical parser settings.
df_chip1, df_chip2, df_chip3 = (
    pd.read_csv(tsv_path, sep="\t", index_col=0)
    for tsv_path in (file_path1, file_path2, file_path3)
)

In [None]:
# target genes
def _read_bed_fourth_column(bed_path):
    """Read a headerless, tab-separated file and return its fourth column.

    The column at position 3 is returned as a pandas Series
    (presumably the gene identifier field of the BED record -- confirm
    against the files).
    """
    bed_table = pd.read_csv(bed_path, sep="\t", header=None)
    return bed_table.iloc[:, 3]


# One Series of target identifiers per factor.
jmj_target = _read_bed_fourth_column("../data/list_of_target_genes/JMJ-target(n=2160).bed")
clf_target = _read_bed_fourth_column("../data/list_of_target_genes/CLF-target(n=3048).bed")
swr1_target = _read_bed_fourth_column("../data/list_of_target_genes/SWR1-C-target(n=6096).bed")
bmi1_target = _read_bed_fourth_column("../data/list_of_target_genes/BMI1-target(n=4982).bed")

In [None]:
# Fig. 4a,c,e,g
# 4 x 2 grid of scatter plots, one row per mutant genotype.
# Each panel plots the WT rep1 column (x) against the mutant rep1 column (y):
#   left column  -> the mark listed for that row in hm_list
#   right column -> H3K4me2 from the same table
# Rows whose index is in the row's target list are drawn in colour on top of
# the remaining rows, which are drawn in grey.
fig, ax = plt.subplots(4,2,figsize=(9,20),gridspec_kw={"hspace":0.5,"wspace":0.1})

# Parallel per-row settings (index k of every list describes grid row k).
hm_list = ["H3K27me3","H3K27me3","H2A.Z","H2Aub"]
df_list = [df_chip1,df_chip1,df_chip2,df_chip3]
gt_list = ["jmj","clf","pie1","bmi1abc"]
target_list = [jmj_target,clf_target,swr1_target,bmi1_target]
color_list = ["tab:red","blue","blue","blue"]

for i, (df, gt, targets, color) in enumerate(
        zip(df_list, gt_list, target_list, color_list)):
    # Target membership depends only on the row, so compute the mask and
    # the two subsets once and reuse them for both panels of the row.
    mask = df.index.isin(targets)
    df_target = df[mask]
    df_other = df[~mask]

    for j, hm in enumerate((hm_list[i], "H3K4me2")):
        panel = ax[i][j]
        x_col = f"{hm}_WT_rep1"
        y_col = f"{hm}_{gt}_rep1"

        # plot
        # non target genes (drawn first so they sit underneath)
        sns.scatterplot(data=df_other,
                        x=x_col,
                        y=y_col,
                        s=2,alpha=0.5,ax=panel,color="tab:grey")
        # target genes
        sns.scatterplot(data=df_target,
                        x=x_col,
                        y=y_col,
                        s=2,alpha=0.5,ax=panel,color=color)

        # format figure
        # Both axes share one upper limit: the 99th percentile of the WT
        # column. nanpercentile ignores missing values; plain percentile
        # would return NaN if any value were missing, and NaN axis limits
        # are rejected by matplotlib.
        upper = np.nanpercentile(df[x_col], 99)
        panel.set_xlim(0, upper)
        panel.set_ylim(0, upper)
        panel.set_title(hm)
        panel.set_xlabel("")
        panel.set_ylabel("")
        panel.set_aspect('equal', adjustable='box')