# Motifs that were enriched in categorized fragments responding to the depletion

In [1]:
import os
import numpy as np
import pandas as pd

In [2]:
def get_homer_top_motifs(filename, ntop=10):
    """Return the first ``ntop`` values of the "Motif Name" column of a HOMER table.

    The file is read as a tab-separated table with a header row, and rows are
    taken in file order (no re-sorting is done here).

    Parameters
    ----------
    filename : str or path-like
        Path to the tab-separated HOMER results file.
    ntop : int, default 10
        Number of motif names to return.

    Returns
    -------
    list
        Exactly ``ntop`` entries. If the file does not exist, every entry is
        ``np.nan``; if the table has fewer than ``ntop`` rows, the missing
        tail is filled with ``np.nan`` so callers always receive lists of the
        same length.

    Raises
    ------
    KeyError
        If the table has no "Motif Name" column.
    """
    try:
        homer_df = pd.read_csv(filename, sep="\t")
    except FileNotFoundError:
        # A missing results file is reported as an all-NaN column rather
        # than an error.
        return [np.nan] * ntop

    # Positional slice: the first ``ntop`` rows in file order.
    top_motifs = homer_df["Motif Name"].iloc[:max(ntop, 0)].to_list()
    # Pad short tables so the length matches the missing-file branch.
    top_motifs.extend([np.nan] * (ntop - len(top_motifs)))
    return top_motifs


def get_meme_top_motifs(filename, ntop=10):
    """Return the first ``ntop`` values of the "motif_ID" column of a MEME table.

    The file is read as a tab-separated table with a header row, and rows are
    taken in file order (no re-sorting is done here).

    Parameters
    ----------
    filename : str or path-like
        Path to the tab-separated MEME results file.
    ntop : int, default 10
        Number of motif identifiers to return.

    Returns
    -------
    list
        Exactly ``ntop`` entries. If the file does not exist, every entry is
        ``np.nan`` (the same convention ``get_homer_top_motifs`` uses); if the
        table has fewer than ``ntop`` rows, the missing tail is filled with
        ``np.nan`` so callers always receive lists of the same length.

    Raises
    ------
    KeyError
        If the table has no "motif_ID" column.
    """
    try:
        meme_df = pd.read_csv(filename, sep="\t")
    except FileNotFoundError:
        # A missing results file is reported as an all-NaN column rather
        # than an error.
        return [np.nan] * ntop

    # Positional slice: the first ``ntop`` rows in file order.
    top_motifs = meme_df["motif_ID"].iloc[:max(ntop, 0)].to_list()
    # Pad short tables so every column of the summary has the same length.
    top_motifs.extend([np.nan] * (ntop - len(top_motifs)))
    return top_motifs

# Top 10 motifs for each KO line, by enhancer category

In [3]:
# Comparison names; each one is used as a sub-directory name when the HOMER
# and MEME result paths are built.
categories = [
    "peaks_vs_notpeaks",
    "responsive_vs_nonresponsive",
    "induced_vs_repressed",
    "repressed_vs_induced",
]

# Line identifiers; each one is a directory name directly under `store_dir`.
ko_lines = [
    "ATF2",
    "CTCF",
    "FOXA1",
    "LEF1",
    "SCRT1",
    "TCF7L2",
    "16P12_1",
]

# Root directory holding one sub-directory per line (relative path).
store_dir = "../data/"

def get_homer_file(store_dir, ko, cat):
    """Build the path ``<store_dir>/<ko>/homer/<cat>/knownResults.txt``.

    Only the path string is assembled; the file is not opened or checked
    for existence.
    """
    path_parts = (store_dir, ko, "homer", cat, "knownResults.txt")
    return os.path.join(*path_parts)

def get_meme_file(store_dir, ko, cat):
    """Build the path ``<store_dir>/<ko>/meme/<cat>/ame.tsv``.

    Only the path string is assembled; the file is not opened or checked
    for existence.
    """
    path_parts = (store_dir, ko, "meme", cat, "ame.tsv")
    return os.path.join(*path_parts)

def create_ko_specific_df(store_dir, ko, categories):
    """Assemble the top HOMER and MEME motifs of one line into a single table.

    For every category, the HOMER and MEME result files of ``ko`` are located
    with ``get_homer_file`` / ``get_meme_file`` and their top motifs are read
    with ``get_homer_top_motifs`` / ``get_meme_top_motifs`` (using those
    helpers' default number of motifs).

    Parameters
    ----------
    store_dir : str
        Root directory containing one sub-directory per line.
    ko : str
        Name of the line, i.e. the sub-directory of ``store_dir`` to read.
    categories : iterable of str
        Category names; each contributes two columns.

    Returns
    -------
    pandas.DataFrame
        One row per motif rank, with columns ``<category>_homer`` and
        ``<category>_meme`` in the order the categories were given.
    """
    motif_columns = {}
    for cat in categories:
        homer_motifs = get_homer_top_motifs(get_homer_file(store_dir, ko, cat))
        meme_motifs = get_meme_top_motifs(get_meme_file(store_dir, ko, cat))
        # Wrapping each list in a Series lets pandas align columns on the row
        # index, so lists of different lengths are padded with NaN instead of
        # making the DataFrame constructor raise ValueError.
        motif_columns[f"{cat}_homer"] = pd.Series(homer_motifs)
        motif_columns[f"{cat}_meme"] = pd.Series(meme_motifs)
    # Dict insertion order already gives homer/meme pairs per category.
    return pd.DataFrame(motif_columns)




# ATF2

In [4]:
# Motif table for the ATF2 line (ko_lines[0]).
atf2_df = create_ko_specific_df(store_dir=store_dir, ko=ko_lines[0], categories=categories)

In [5]:
# Show the ATF2 motif table as the cell output.
atf2_df

Unnamed: 0,peaks_vs_notpeaks_homer,peaks_vs_notpeaks_meme,responsive_vs_nonresponsive_homer,responsive_vs_nonresponsive_meme,induced_vs_repressed_homer,induced_vs_repressed_meme,repressed_vs_induced_homer,repressed_vs_induced_meme
0,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P53_HUMAN.H11MO.0.A,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P53_HUMAN.H11MO.0.A,Klf9(Zf)/GBM-Klf9-ChIP-Seq(GSE62211)/Homer,TBX3_HUMAN.H11MO.0.C,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P53_HUMAN.H11MO.0.A
1,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P63_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P63_HUMAN.H11MO.0.A,Rbpj1(?)/Panc1-Rbpj1-ChIP-Seq(GSE47459)/Homer,TBX21_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P73_HUMAN.H11MO.0.A
2,p53(p53)/Saos-p53-ChIP-Seq/Homer,P73_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq/Homer,P73_HUMAN.H11MO.0.A,KLF10(Zf)/HEK293-KLF10.GFP-ChIP-Seq(GSE58341)/...,SUH_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq/Homer,P63_HUMAN.H11MO.0.A
3,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,TYY1_HUMAN.H11MO.0.A,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,ATF4_HUMAN.H11MO.0.A,KLF6(Zf)/PDAC-KLF6-ChIP-Seq(GSE64557)/Homer,KLF5_HUMAN.H11MO.0.A,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,ATF4_HUMAN.H11MO.0.A
4,YY1(Zf)/Promoter/Homer,CEBPG_HUMAN.H11MO.0.B,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,CEBPG_HUMAN.H11MO.0.B,Sp1(Zf)/Promoter/Homer,KLF1_HUMAN.H11MO.0.A,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,CEBPG_HUMAN.H11MO.0.B
5,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,ATF4_HUMAN.H11MO.0.A,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,ZIC1_HUMAN.H11MO.0.B,Klf4(Zf)/mES-Klf4-ChIP-Seq(GSE11431)/Homer,SALL4_HUMAN.H11MO.0.B,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,SRY_HUMAN.H11MO.0.B
6,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,FOS_HUMAN.H11MO.0.A,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,FEV_HUMAN.H11MO.0.B,Sp2(Zf)/HEK293-Sp2.eGFP-ChIP-Seq(Encode)/Homer,EGR2_HUMAN.H11MO.0.A,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,DBP_HUMAN.H11MO.0.B
7,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,JUNB_HUMAN.H11MO.0.A,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,SMAD3_HUMAN.H11MO.0.B,VRN1(ABI3VP1)/col-VRN1-DAP-Seq(GSE60143)/Homer,KLF9_HUMAN.H11MO.0.C,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,CDX1_HUMAN.H11MO.0.C
8,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,FOSB_HUMAN.H11MO.0.A,CEBP:AP1(bZIP)/ThioMac-CEBPb-ChIP-Seq(GSE21512...,KLF6_HUMAN.H11MO.0.A,KLF1(Zf)/HUDEP2-KLF1-CutnRun(GSE136251)/Homer,KLF6_HUMAN.H11MO.0.A,ZFX(Zf)/mES-Zfx-ChIP-Seq(GSE11431)/Homer,FOXO4_HUMAN.H11MO.0.C
9,Atf1(bZIP)/K562-ATF1-ChIP-Seq(GSE31477)/Homer,FOSL1_HUMAN.H11MO.0.A,NFIL3(bZIP)/HepG2-NFIL3-ChIP-Seq(Encode)/Homer,SUH_HUMAN.H11MO.0.A,Sp5(Zf)/mES-Sp5.Flag-ChIP-Seq(GSE72989)/Homer,ITF2_HUMAN.H11MO.0.C,ZNF711(Zf)/SHSY5Y-ZNF711-ChIP-Seq(GSE20673)/Homer,PRDM6_HUMAN.H11MO.0.C


# CTCF

In [6]:
# Build and display the motif table for the CTCF line (ko_lines[1]).
ctcf_df = create_ko_specific_df(store_dir=store_dir, ko=ko_lines[1], categories=categories)
ctcf_df

Unnamed: 0,peaks_vs_notpeaks_homer,peaks_vs_notpeaks_meme,responsive_vs_nonresponsive_homer,responsive_vs_nonresponsive_meme,induced_vs_repressed_homer,induced_vs_repressed_meme,repressed_vs_induced_homer,repressed_vs_induced_meme
0,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P53_HUMAN.H11MO.0.A,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,THAP1_HUMAN.H11MO.0.C,FAR1(FAR1)/col-FAR1-DAP-Seq(GSE60143)/Homer,SP2_HUMAN.H11MO.0.A,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,CEBPG_HUMAN.H11MO.0.B
1,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P63_HUMAN.H11MO.0.A,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,SP2_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,SP3_HUMAN.H11MO.0.B,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,SRY_HUMAN.H11MO.0.B
2,p53(p53)/Saos-p53-ChIP-Seq/Homer,P73_HUMAN.H11MO.0.A,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,SP3_HUMAN.H11MO.0.B,p53(p53)/Saos-p53-ChIP-Seq/Homer,ZIC1_HUMAN.H11MO.0.B,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,ATF4_HUMAN.H11MO.0.A
3,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,CEBPG_HUMAN.H11MO.0.B,NFIL3(bZIP)/HepG2-NFIL3-ChIP-Seq(Encode)/Homer,AP2B_HUMAN.H11MO.0.B,Klf9(Zf)/GBM-Klf9-ChIP-Seq(GSE62211)/Homer,AP2B_HUMAN.H11MO.0.B,TGA1(bZIP)/colamp-TGA1-DAP-Seq(GSE60143)/Homer,GATA3_HUMAN.H11MO.0.A
4,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,ATF4_HUMAN.H11MO.0.A,TGA5(bZIP)/col-TGA5-DAP-Seq(GSE60143)/Homer,KLF3_HUMAN.H11MO.0.B,Zic2(Zf)/ESC-Zic2-ChIP-Seq(SRP197560)/Homer,KLF3_HUMAN.H11MO.0.B,TGA5(bZIP)/col-TGA5-DAP-Seq(GSE60143)/Homer,DBP_HUMAN.H11MO.0.B
5,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,TYY1_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,E2F4_HUMAN.H11MO.0.A,ANAC094(NAC)/col-ANAC094-DAP-Seq(GSE60143)/Homer,KLF6_HUMAN.H11MO.0.A,c-Jun-CRE(bZIP)/K562-cJun-ChIP-Seq(GSE31477)/H...,PRDM6_HUMAN.H11MO.0.C
6,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,ZFP42_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq/Homer,KLF6_HUMAN.H11MO.0.A,Unknown-ESC-element(?)/mES-Nanog-ChIP-Seq(GSE1...,SALL4_HUMAN.H11MO.0.B,Atf2(bZIP)/3T3L1-Atf2-ChIP-Seq(GSE56872)/Homer,CDX1_HUMAN.H11MO.0.C
7,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,THAP1_HUMAN.H11MO.0.C,CREB5(bZIP)/LNCaP-CREB5.V5-ChIP-Seq(GSE137775)...,KLF12_HUMAN.H11MO.0.C,IBL1(bHLH)/Seedling-IBL1-ChIP-Seq(GSE51120)/Homer,KLF1_HUMAN.H11MO.0.A,JunD(bZIP)/K562-JunD-ChIP-Seq/Homer,FOXK1_HUMAN.H11MO.0.A
8,YY1(Zf)/Promoter/Homer,ZFX_HUMAN.H11MO.0.A,Atf1(bZIP)/K562-ATF1-ChIP-Seq(GSE31477)/Homer,SP1_HUMAN.H11MO.0.A,KLF14(Zf)/HEK293-KLF14.GFP-ChIP-Seq(GSE58341)/...,KLF12_HUMAN.H11MO.0.C,Atf1(bZIP)/K562-ATF1-ChIP-Seq(GSE31477)/Homer,ZN394_HUMAN.H11MO.0.C
9,CEBP:AP1(bZIP)/ThioMac-CEBPb-ChIP-Seq(GSE21512...,CEBPD_HUMAN.H11MO.0.C,JunD(bZIP)/K562-JunD-ChIP-Seq/Homer,MECP2_HUMAN.H11MO.0.C,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,KLF5_HUMAN.H11MO.0.A,Atf7(bZIP)/3T3L1-Atf7-ChIP-Seq(GSE56872)/Homer,NF2L1_HUMAN.H11MO.0.C


# FOXA1

In [7]:
# Build and display the motif table for the FOXA1 line (ko_lines[2]).
foxa1_df = create_ko_specific_df(store_dir=store_dir, ko=ko_lines[2], categories=categories)
foxa1_df

Unnamed: 0,peaks_vs_notpeaks_homer,peaks_vs_notpeaks_meme,responsive_vs_nonresponsive_homer,responsive_vs_nonresponsive_meme,induced_vs_repressed_homer,induced_vs_repressed_meme,repressed_vs_induced_homer,repressed_vs_induced_meme
0,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P53_HUMAN.H11MO.0.A,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,THAP1_HUMAN.H11MO.0.C,Atf7(bZIP)/3T3L1-Atf7-ChIP-Seq(GSE56872)/Homer,SP3_HUMAN.H11MO.0.B,Elf4(ETS)/BMDM-Elf4-ChIP-Seq(GSE88699)/Homer,SRY_HUMAN.H11MO.0.B
1,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P63_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,SP2_HUMAN.H11MO.0.A,c-Jun-CRE(bZIP)/K562-cJun-ChIP-Seq(GSE31477)/H...,SP2_HUMAN.H11MO.0.A,ELF1(ETS)/Jurkat-ELF1-ChIP-Seq(SRA014231)/Homer,CDX1_HUMAN.H11MO.0.C
2,p53(p53)/Saos-p53-ChIP-Seq/Homer,P73_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq/Homer,SP3_HUMAN.H11MO.0.B,Atf2(bZIP)/3T3L1-Atf2-ChIP-Seq(GSE56872)/Homer,KLF6_HUMAN.H11MO.0.A,ETV4(ETS)/HepG2-ETV4-ChIP-Seq(ENCODE)/Homer,PIT1_HUMAN.H11MO.0.C
3,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,CEBPG_HUMAN.H11MO.0.B,JunD(bZIP)/K562-JunD-ChIP-Seq/Homer,KLF3_HUMAN.H11MO.0.B,BORIS(Zf)/K562-CTCFL-ChIP-Seq(GSE32465)/Homer,AP2B_HUMAN.H11MO.0.B,ELF3(ETS)/PDAC-ELF3-ChIP-Seq(GSE64557)/Homer,FOXK1_HUMAN.H11MO.0.A
4,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,ATF4_HUMAN.H11MO.0.A,TGA5(bZIP)/col-TGA5-DAP-Seq(GSE60143)/Homer,E2F4_HUMAN.H11MO.0.A,CRF10(AP2EREBP)/col100-CRF10-DAP-Seq(GSE60143)...,KLF3_HUMAN.H11MO.0.B,ELF5(ETS)/T47D-ELF5-ChIP-Seq(GSE30407)/Homer,PRDM6_HUMAN.H11MO.0.C
5,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,ATF2_HUMAN.H11MO.0.B,Jun-AP1(bZIP)/K562-cJun-ChIP-Seq(GSE31477)/Homer,AP2B_HUMAN.H11MO.0.B,SeqBias: A/T bias,SALL4_HUMAN.H11MO.0.B,GABPA(ETS)/Jurkat-GABPa-ChIP-Seq(GSE17954)/Homer,PRRX2_HUMAN.H11MO.0.C
6,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,CREB1_HUMAN.H11MO.0.A,Fosl2(bZIP)/3T3L1-Fosl2-ChIP-Seq(GSE56872)/Homer,MECP2_HUMAN.H11MO.0.C,SeqBias: CG-repeat,ZIC1_HUMAN.H11MO.0.B,Elk1(ETS)/Hela-Elk1-ChIP-Seq(GSE31477)/Homer,GATA3_HUMAN.H11MO.0.A
7,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,ATF1_HUMAN.H11MO.0.B,c-Jun-CRE(bZIP)/K562-cJun-ChIP-Seq(GSE31477)/H...,SP1_HUMAN.H11MO.0.A,CREB5(bZIP)/LNCaP-CREB5.V5-ChIP-Seq(GSE137775)...,SRBP2_HUMAN.H11MO.0.B,Fli1(ETS)/CD8-FLI-ChIP-Seq(GSE20898)/Homer,TBP_HUMAN.H11MO.0.A
8,TGA5(bZIP)/col-TGA5-DAP-Seq(GSE60143)/Homer,ATF3_HUMAN.H11MO.0.A,TGA3(bZIP)/colamp-TGA3-DAP-Seq(GSE60143)/Homer,KLF6_HUMAN.H11MO.0.A,JunD(bZIP)/K562-JunD-ChIP-Seq/Homer,KLF5_HUMAN.H11MO.0.A,SPDEF(ETS)/VCaP-SPDEF-ChIP-Seq(SRA014231)/Homer,SOX5_HUMAN.H11MO.0.C
9,NFIL3(bZIP)/HepG2-NFIL3-ChIP-Seq(Encode)/Homer,TYY1_HUMAN.H11MO.0.A,Atf2(bZIP)/3T3L1-Atf2-ChIP-Seq(GSE56872)/Homer,KLF12_HUMAN.H11MO.0.C,STZ(C2H2)/colamp-STZ-DAP-Seq(GSE60143)/Homer,SP4_HUMAN.H11MO.0.A,PU.1(ETS)/ThioMac-PU.1-ChIP-Seq(GSE21512)/Homer,IRF7_HUMAN.H11MO.0.C


# LEF1

In [8]:
# Build and display the motif table for the LEF1 line (ko_lines[3]).
lef1_df = create_ko_specific_df(store_dir=store_dir, ko=ko_lines[3], categories=categories)
lef1_df

Unnamed: 0,peaks_vs_notpeaks_homer,peaks_vs_notpeaks_meme,responsive_vs_nonresponsive_homer,responsive_vs_nonresponsive_meme,induced_vs_repressed_homer,induced_vs_repressed_meme,repressed_vs_induced_homer,repressed_vs_induced_meme
0,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,ATF4_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P53_HUMAN.H11MO.0.A,Fosl2(bZIP)/3T3L1-Fosl2-ChIP-Seq(GSE56872)/Homer,FOSL2_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P53_HUMAN.H11MO.0.A
1,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,CEBPG_HUMAN.H11MO.0.B,p53(p53)/Saos-p53-ChIP-Seq/Homer,P73_HUMAN.H11MO.0.A,Jun-AP1(bZIP)/K562-cJun-ChIP-Seq(GSE31477)/Homer,FOS_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq/Homer,P73_HUMAN.H11MO.0.A
2,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,CREB1_HUMAN.H11MO.0.A,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P63_HUMAN.H11MO.0.A,JunB(bZIP)/DendriticCells-Junb-ChIP-Seq(GSE360...,JUNB_HUMAN.H11MO.0.A,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P63_HUMAN.H11MO.0.A
3,TGA5(bZIP)/col-TGA5-DAP-Seq(GSE60143)/Homer,ATF2_HUMAN.H11MO.0.B,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,CEBPG_HUMAN.H11MO.0.B,Fra2(bZIP)/Striatum-Fra2-ChIP-Seq(GSE43429)/Homer,FOSB_HUMAN.H11MO.0.A,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,LYL1_HUMAN.H11MO.0.A
4,JunD(bZIP)/K562-JunD-ChIP-Seq/Homer,ATF1_HUMAN.H11MO.0.B,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,ATF4_HUMAN.H11MO.0.A,BATF(bZIP)/Th17-BATF-ChIP-Seq(GSE39756)/Homer,JUN_HUMAN.H11MO.0.A,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,ATF4_HUMAN.H11MO.0.A
5,Atf1(bZIP)/K562-ATF1-ChIP-Seq(GSE31477)/Homer,TYY1_HUMAN.H11MO.0.A,Fosl2(bZIP)/3T3L1-Fosl2-ChIP-Seq(GSE56872)/Homer,FOSL1_HUMAN.H11MO.0.A,Fos(bZIP)/TSC-Fos-ChIP-Seq(GSE110950)/Homer,JUND_HUMAN.H11MO.0.A,Tcfcp2l1(CP2)/mES-Tcfcp2l1-ChIP-Seq(GSE11431)/...,CEBPG_HUMAN.H11MO.0.B
6,NFIL3(bZIP)/HepG2-NFIL3-ChIP-Seq(Encode)/Homer,THAP1_HUMAN.H11MO.0.C,Jun-AP1(bZIP)/K562-cJun-ChIP-Seq(GSE31477)/Homer,FOSL2_HUMAN.H11MO.0.A,Fra1(bZIP)/BT549-Fra1-ChIP-Seq(GSE46166)/Homer,FOSL1_HUMAN.H11MO.0.A,ZNF416(Zf)/HEK293-ZNF416.GFP-ChIP-Seq(GSE58341...,SMAD3_HUMAN.H11MO.0.B
7,TGA1(bZIP)/colamp-TGA1-DAP-Seq(GSE60143)/Homer,ATF3_HUMAN.H11MO.0.A,Fra2(bZIP)/Striatum-Fra2-ChIP-Seq(GSE43429)/Homer,JUND_HUMAN.H11MO.0.A,Atf3(bZIP)/GBM-ATF3-ChIP-Seq(GSE33912)/Homer,E2F4_HUMAN.H11MO.0.A,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,NKX21_HUMAN.H11MO.0.A
8,CREB5(bZIP)/LNCaP-CREB5.V5-ChIP-Seq(GSE137775)...,FOSL1_HUMAN.H11MO.0.A,AP-1(bZIP)/ThioMac-PU.1-ChIP-Seq(GSE21512)/Homer,JUN_HUMAN.H11MO.0.A,AP-1(bZIP)/ThioMac-PU.1-ChIP-Seq(GSE21512)/Homer,NF2L1_HUMAN.H11MO.0.C,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,OLIG2_HUMAN.H11MO.0.B
9,c-Jun-CRE(bZIP)/K562-cJun-ChIP-Seq(GSE31477)/H...,JUN_HUMAN.H11MO.0.A,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,JUNB_HUMAN.H11MO.0.A,Bach2(bZIP)/OCILy7-Bach2-ChIP-Seq(GSE44420)/Homer,ZBT14_HUMAN.H11MO.0.C,CEBP:AP1(bZIP)/ThioMac-CEBPb-ChIP-Seq(GSE21512...,TGIF1_HUMAN.H11MO.0.A


# SCRT1

In [9]:
# Build and display the motif table for the SCRT1 line (ko_lines[4]).
scrt1_df = create_ko_specific_df(store_dir=store_dir, ko=ko_lines[4], categories=categories)
scrt1_df

Unnamed: 0,peaks_vs_notpeaks_homer,peaks_vs_notpeaks_meme,responsive_vs_nonresponsive_homer,responsive_vs_nonresponsive_meme,induced_vs_repressed_homer,induced_vs_repressed_meme,repressed_vs_induced_homer,repressed_vs_induced_meme
0,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P53_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P53_HUMAN.H11MO.0.A,,P53_HUMAN.H11MO.0.A,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,ATF4_HUMAN.H11MO.0.A
1,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P63_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq/Homer,P63_HUMAN.H11MO.0.A,,P73_HUMAN.H11MO.0.A,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,CEBPG_HUMAN.H11MO.0.B
2,p53(p53)/Saos-p53-ChIP-Seq/Homer,P73_HUMAN.H11MO.0.A,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P73_HUMAN.H11MO.0.A,,P63_HUMAN.H11MO.0.A,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,CEBPB_HUMAN.H11MO.0.A
3,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,CEBPG_HUMAN.H11MO.0.B,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,ZN449_HUMAN.H11MO.0.C,,ZBT48_HUMAN.H11MO.0.C,CEBP:AP1(bZIP)/ThioMac-CEBPb-ChIP-Seq(GSE21512...,DBP_HUMAN.H11MO.0.B
4,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,ATF4_HUMAN.H11MO.0.A,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,SMAD3_HUMAN.H11MO.0.B,,ZFX_HUMAN.H11MO.0.A,HLF(bZIP)/HSC-HLF.Flag-ChIP-Seq(GSE69817)/Homer,CREB1_HUMAN.H11MO.0.A
5,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,TYY1_HUMAN.H11MO.0.A,Tcfcp2l1(CP2)/mES-Tcfcp2l1-ChIP-Seq(GSE11431)/...,SRBP1_HUMAN.H11MO.0.A,,ZSC31_HUMAN.H11MO.0.C,Gata4(Zf)/Heart-Gata4-ChIP-Seq(GSE35151)/Homer,HLF_HUMAN.H11MO.0.C
6,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,ZFX_HUMAN.H11MO.0.A,ZNF416(Zf)/HEK293-ZNF416.GFP-ChIP-Seq(GSE58341...,THAP1_HUMAN.H11MO.0.C,,ZN667_HUMAN.H11MO.0.C,Gata2(Zf)/K562-GATA2-ChIP-Seq(GSE18829)/Homer,ATF1_HUMAN.H11MO.0.B
7,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,CEBPD_HUMAN.H11MO.0.C,Zfp809(Zf)/ES-Zfp809-ChIP-Seq(GSE70799)/Homer,E2F3_HUMAN.H11MO.0.A,,COT1_HUMAN.H11MO.0.C,Gata6(Zf)/HUG1N-GATA6-ChIP-Seq(GSE51936)/Homer,NKX31_HUMAN.H11MO.0.C
8,NFIL3(bZIP)/HepG2-NFIL3-ChIP-Seq(Encode)/Homer,CEBPB_HUMAN.H11MO.0.A,RBFox2(?)/Heart-RBFox2-CLIP-Seq(GSE57926)/Homer,SP3_HUMAN.H11MO.0.B,,PAX6_HUMAN.H11MO.0.C,PBX1(Homeobox)/MCF7-PBX1-ChIP-Seq(GSE28007)/Homer,NKX61_HUMAN.H11MO.0.B
9,Tcfcp2l1(CP2)/mES-Tcfcp2l1-ChIP-Seq(GSE11431)/...,ATF2_HUMAN.H11MO.0.B,NRF(NRF)/Promoter/Homer,SALL4_HUMAN.H11MO.0.B,,E2F4_HUMAN.H11MO.0.A,NFIL3(bZIP)/HepG2-NFIL3-ChIP-Seq(Encode)/Homer,GATA2_HUMAN.H11MO.0.A


# TCF7L2

In [10]:
# Build and display the motif table for the TCF7L2 line (ko_lines[5]).
tcf7l2_df = create_ko_specific_df(store_dir=store_dir, ko=ko_lines[5], categories=categories)
tcf7l2_df

Unnamed: 0,peaks_vs_notpeaks_homer,peaks_vs_notpeaks_meme,responsive_vs_nonresponsive_homer,responsive_vs_nonresponsive_meme,induced_vs_repressed_homer,induced_vs_repressed_meme,repressed_vs_induced_homer,repressed_vs_induced_meme
0,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P53_HUMAN.H11MO.0.A,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,CEBPG_HUMAN.H11MO.0.B,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,CEBPG_HUMAN.H11MO.0.B,Slug(Zf)/Mesoderm-Snai2-ChIP-Seq(GSE61475)/Homer,SNAI2_HUMAN.H11MO.0.A
1,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P63_HUMAN.H11MO.0.A,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,ATF4_HUMAN.H11MO.0.A,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,ATF4_HUMAN.H11MO.0.A,"E2A(bHLH),near_PU.1/Bcell-PU.1-ChIP-Seq(GSE215...",SNAI1_HUMAN.H11MO.0.C
2,p53(p53)/Saos-p53-ChIP-Seq/Homer,P73_HUMAN.H11MO.0.A,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,P53_HUMAN.H11MO.0.A,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,JUN_HUMAN.H11MO.0.A,Snail1(Zf)/LS174T-SNAIL1.HA-ChIP-Seq(GSE127183...,ASCL1_HUMAN.H11MO.0.A
3,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,CEBPG_HUMAN.H11MO.0.B,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P63_HUMAN.H11MO.0.A,c-Myc(bHLH)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,NF2L1_HUMAN.H11MO.0.C,Ascl2(bHLH)/ESC-Ascl2-ChIP-Seq(GSE97712)/Homer,TFE2_HUMAN.H11MO.0.A
4,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,ATF4_HUMAN.H11MO.0.A,Jun-AP1(bZIP)/K562-cJun-ChIP-Seq(GSE31477)/Homer,JUN_HUMAN.H11MO.0.A,Fos(bZIP)/TSC-Fos-ChIP-Seq(GSE110950)/Homer,BATF_HUMAN.H11MO.0.A,Ascl1(bHLH)/NeuralTubes-Ascl1-ChIP-Seq(GSE5584...,MYOD1_HUMAN.H11MO.0.A
5,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,TYY1_HUMAN.H11MO.0.A,Fosl2(bZIP)/3T3L1-Fosl2-ChIP-Seq(GSE56872)/Homer,JUND_HUMAN.H11MO.0.A,Jun-AP1(bZIP)/K562-cJun-ChIP-Seq(GSE31477)/Homer,FOSL1_HUMAN.H11MO.0.A,NGA4(ABI3VP1)/col-NGA4-DAP-Seq(GSE60143)/Homer,ITF2_HUMAN.H11MO.0.C
6,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,ATF2_HUMAN.H11MO.0.B,Atf7(bZIP)/3T3L1-Atf7-ChIP-Seq(GSE56872)/Homer,P73_HUMAN.H11MO.0.A,JunB(bZIP)/DendriticCells-Junb-ChIP-Seq(GSE360...,JUND_HUMAN.H11MO.0.A,NeuroG2(bHLH)/Fibroblast-NeuroG2-ChIP-Seq(GSE7...,NDF2_HUMAN.H11MO.0.B
7,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,CREB1_HUMAN.H11MO.0.A,Fos(bZIP)/TSC-Fos-ChIP-Seq(GSE110950)/Homer,FOSL2_HUMAN.H11MO.0.A,Atf3(bZIP)/GBM-ATF3-ChIP-Seq(GSE33912)/Homer,FOSL2_HUMAN.H11MO.0.A,Ptf1a(bHLH)/Panc1-Ptf1a-ChIP-Seq(GSE47459)/Homer,HTF4_HUMAN.H11MO.0.A
8,NFIL3(bZIP)/HepG2-NFIL3-ChIP-Seq(Encode)/Homer,ATF1_HUMAN.H11MO.0.B,Atf1(bZIP)/K562-ATF1-ChIP-Seq(GSE31477)/Homer,FOSL1_HUMAN.H11MO.0.A,Fra2(bZIP)/Striatum-Fra2-ChIP-Seq(GSE43429)/Homer,SRY_HUMAN.H11MO.0.B,ARF16(ARF)/col-ARF16-DAP-Seq(GSE60143)/Homer,BHA15_HUMAN.H11MO.0.B
9,TGA5(bZIP)/col-TGA5-DAP-Seq(GSE60143)/Homer,ZFP42_HUMAN.H11MO.0.A,CREB5(bZIP)/LNCaP-CREB5.V5-ChIP-Seq(GSE137775)...,FOSB_HUMAN.H11MO.0.A,Fra1(bZIP)/BT549-Fra1-ChIP-Seq(GSE46166)/Homer,CDX1_HUMAN.H11MO.0.C,ZEB1(Zf)/PDAC-ZEB1-ChIP-Seq(GSE64557)/Homer,MYOG_HUMAN.H11MO.0.B


# 16p12.1

In [11]:
# Build and display the motif table for the 16P12_1 line (ko_lines[6]).
cnv_df = create_ko_specific_df(store_dir=store_dir, ko=ko_lines[6], categories=categories)
cnv_df

Unnamed: 0,peaks_vs_notpeaks_homer,peaks_vs_notpeaks_meme,responsive_vs_nonresponsive_homer,responsive_vs_nonresponsive_meme,induced_vs_repressed_homer,induced_vs_repressed_meme,repressed_vs_induced_homer,repressed_vs_induced_meme
0,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P53_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,ZFX_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P53_HUMAN.H11MO.0.A,ZFX(Zf)/mES-Zfx-ChIP-Seq(GSE11431)/Homer,ZFX_HUMAN.H11MO.0.A
1,p53(p53)/Saos-p53-ChIP-Seq(GSE15780)/Homer,P63_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq/Homer,P53_HUMAN.H11MO.0.A,p53(p53)/Saos-p53-ChIP-Seq/Homer,P73_HUMAN.H11MO.0.A,ERF8(AP2EREBP)/colamp-ERF8-DAP-Seq(GSE60143)/H...,AP2B_HUMAN.H11MO.0.B
2,p53(p53)/Saos-p53-ChIP-Seq/Homer,P73_HUMAN.H11MO.0.A,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P73_HUMAN.H11MO.0.A,p73(p53)/Trachea-p73-ChIP-Seq(PRJNA310161)/Homer,P63_HUMAN.H11MO.0.A,Zfp281(Zf)/ES-Zfp281-ChIP-Seq(GSE81042)/Homer,KLF6_HUMAN.H11MO.0.A
3,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,CEBPG_HUMAN.H11MO.0.B,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,P63_HUMAN.H11MO.0.A,p63(p53)/Keratinocyte-p63-ChIP-Seq(GSE17611)/H...,CDX1_HUMAN.H11MO.0.C,Zic3(Zf)/mES-Zic3-ChIP-Seq(GSE37889)/Homer,SP2_HUMAN.H11MO.0.A
4,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,ATF4_HUMAN.H11MO.0.A,ZFX(Zf)/mES-Zfx-ChIP-Seq(GSE11431)/Homer,AP2B_HUMAN.H11MO.0.B,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,SRY_HUMAN.H11MO.0.B,ERF9(AP2EREBP)/colamp-ERF9-DAP-Seq(GSE60143)/H...,SP3_HUMAN.H11MO.0.B
5,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,TYY1_HUMAN.H11MO.0.A,ZNF711(Zf)/SHSY5Y-ZNF711-ChIP-Seq(GSE20673)/Homer,SP2_HUMAN.H11MO.0.A,Nrf2(bZIP)/Lymphoblast-Nrf2-ChIP-Seq(GSE37589)...,HXA9_HUMAN.H11MO.0.B,ZNF711(Zf)/SHSY5Y-ZNF711-ChIP-Seq(GSE20673)/Homer,PATZ1_HUMAN.H11MO.0.C
6,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,ZFP42_HUMAN.H11MO.0.A,p53(p53)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,THAP1_HUMAN.H11MO.0.C,NF-E2(bZIP)/K562-NFE2-ChIP-Seq(GSE31477)/Homer,PRDM6_HUMAN.H11MO.0.C,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,SALL4_HUMAN.H11MO.0.B
7,Atf4(bZIP)/MEF-Atf4-ChIP-Seq(GSE35681)/Homer,CREB1_HUMAN.H11MO.0.A,Tcfcp2l1(CP2)/mES-Tcfcp2l1-ChIP-Seq(GSE11431)/...,SP3_HUMAN.H11MO.0.B,Bach2(bZIP)/OCILy7-Bach2-ChIP-Seq(GSE44420)/Homer,HXB13_HUMAN.H11MO.0.A,RKD2(RWPRK)/colamp-RKD2-DAP-Seq(GSE60143)/Homer,ZIC1_HUMAN.H11MO.0.B
8,NFIL3(bZIP)/HepG2-NFIL3-ChIP-Seq(Encode)/Homer,ATF2_HUMAN.H11MO.0.B,Chop(bZIP)/MEF-Chop-ChIP-Seq(GSE35681)/Homer,ZIC1_HUMAN.H11MO.0.B,Fos(bZIP)/TSC-Fos-ChIP-Seq(GSE110950)/Homer,PIT1_HUMAN.H11MO.0.C,Rap210(AP2EREBP)/col-Rap210-DAP-Seq(GSE60143)/...,ITF2_HUMAN.H11MO.0.C
9,YY1(Zf)/Promoter/Homer,CEBPD_HUMAN.H11MO.0.C,AARE(HLH)/mES-cMyc-ChIP-Seq/Homer,SRBP2_HUMAN.H11MO.0.B,c-Myc(bHLH)/mES-cMyc-ChIP-Seq(GSE11431)/Homer,ANDR_HUMAN.H11MO.0.A,AT1G12630(AP2EREBP)/colamp-AT1G12630-DAP-Seq(G...,SRBP2_HUMAN.H11MO.0.B
