In [1]:
import sys
sys.path.append("..")
from MPRA_predict.utils import *
from MPRA_predict.datasets import *
from MPRA_predict.metrics import *

from collections import Counter
import re

pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', 100)
pd.set_option('display.width', 1000)
pd.set_option('display.precision', 3)
np.set_printoptions(linewidth=1000)

In [2]:
sei_supp_table_1 = pd.read_excel('../data/Sei/41588_2022_1102_MOESM3_ESM.xlsx', sheet_name='Supp Table 1', skiprows=1)
sei_supp_table_1

Unnamed: 0,Chromatin Profile,AUROC,AUPRC
0,HeLa_Epithelium_Cervix | BTAF1 | ID:1,0.983,0.033
1,H9_Embryonic_Stem_Cell_Embryo | EOMES | ID:1006,0.963,0.380
2,H9_Embryonic_Stem_Cell_Embryo | EP300 | ID:1007,0.987,0.516
3,H9_Embryonic_Stem_Cell_Embryo | FOXH1 | ID:1010,0.954,0.207
4,H9_Embryonic_Stem_Cell_Embryo | FOXH1 | ID:1011,0.962,0.135
...,...,...,...
21902,WERI-Rb-1 | CTCF | ENCODE,0.997,0.665
21903,WERI-Rb-1 | DNase | ENCODE,0.968,0.386
21904,WI-38 | CTCF | ENCODE,0.997,0.686
21905,WI-38 (4OHTAM_20nM_72hr) | DNase | ENCODE,0.963,0.385


In [3]:
sei_supp_table_1[['cell_name', 'assay', 'source', 'part']] = (
    sei_supp_table_1['Chromatin Profile']
    .str.split(r"\s*\|\s*", n=3, expand=True)
)
sei_supp_table_1['index'] = sei_supp_table_1.index
sei_supp_table_1

Unnamed: 0,Chromatin Profile,AUROC,AUPRC,cell_name,assay,source,part,index
0,HeLa_Epithelium_Cervix | BTAF1 | ID:1,0.983,0.033,HeLa_Epithelium_Cervix,BTAF1,ID:1,,0
1,H9_Embryonic_Stem_Cell_Embryo | EOMES | ID:1006,0.963,0.380,H9_Embryonic_Stem_Cell_Embryo,EOMES,ID:1006,,1
2,H9_Embryonic_Stem_Cell_Embryo | EP300 | ID:1007,0.987,0.516,H9_Embryonic_Stem_Cell_Embryo,EP300,ID:1007,,2
3,H9_Embryonic_Stem_Cell_Embryo | FOXH1 | ID:1010,0.954,0.207,H9_Embryonic_Stem_Cell_Embryo,FOXH1,ID:1010,,3
4,H9_Embryonic_Stem_Cell_Embryo | FOXH1 | ID:1011,0.962,0.135,H9_Embryonic_Stem_Cell_Embryo,FOXH1,ID:1011,,4
...,...,...,...,...,...,...,...,...
21902,WERI-Rb-1 | CTCF | ENCODE,0.997,0.665,WERI-Rb-1,CTCF,ENCODE,,21902
21903,WERI-Rb-1 | DNase | ENCODE,0.968,0.386,WERI-Rb-1,DNase,ENCODE,,21903
21904,WI-38 | CTCF | ENCODE,0.997,0.686,WI-38,CTCF,ENCODE,,21904
21905,WI-38 (4OHTAM_20nM_72hr) | DNase | ENCODE,0.963,0.385,WI-38 (4OHTAM_20nM_72hr),DNase,ENCODE,,21905


In [4]:
sei_supp_table_2 = pd.read_excel('../data/Sei/41588_2022_1102_MOESM3_ESM.xlsx', sheet_name='Supp Table 2', skiprows=1)
sei_supp_table_2

Unnamed: 0,Original Cell Type Name,Standardized Celltype Name
0,1015c,1015c
1,10326,10326
2,1184_Stem_cell,1184_Stem_cell
3,133_Astrocyte,133_Astrocyte
4,143B_Osteosarcoma_cell,143B_Osteosarcoma_cell
...,...,...
1691,ZR-75-1_Breast,ZR-75-1
1692,ZR-75-1_Embryonic_Stem_Cell_Breast,ZR-75-1
1693,ZR-75-1_Epithelium_Mammary_Gland,ZR-75-1
1694,ZR-75-30,ZR-75-30_Epithelium_Mammary_Gland


In [5]:
cell_name_map_dict = sei_supp_table_2.set_index('Original Cell Type Name')['Standardized Celltype Name'].to_dict()
cell_name_map_dict

{'1015c': '1015c',
 '10326': '10326',
 '1184_Stem_cell': '1184_Stem_cell',
 '133_Astrocyte': '133_Astrocyte',
 '143B_Osteosarcoma_cell': '143B_Osteosarcoma_cell',
 '21NT_Epithelium_Breast': '21NT_Epithelium_Breast',
 '226LDM': '226LDM',
 '22RV1_Epithelium_Prostate': '22RV1',
 '293FT_Embryonic_Kidney': '293FT',
 '293T': '293T',
 '293T_Embryonic_Kidney': '293T',
 '293T-Rex': '293T-Rex',
 '3565_cells': '3565_cells',
 '451Lu_Melanoma_Cell': '451Lu_Melanoma_Cell',
 '4star': '4star',
 '501-Mel_melanoma': '501-Mel',
 '501-Mel_Melanoma_Cell': '501-Mel',
 '5637_Stem_cell': '5637_Stem_cell',
 '5637_Urinary_Bladder': '5637_Urinary_Bladder',
 '6540_cells_Epithelium': '6540_cells_Epithelium',
 '697_B-ALL': '697_B-ALL',
 '7250_Fibroblast': '7250_Fibroblast',
 '76NF2V_Breast': '76NF2V_Breast',
 '786-0_Kidney': '786-0_Kidney',
 '786-O_Epithelium_Kidney': '786-O_Epithelium_Kidney',
 '8988T': '8988T',
 '8988t_Epithelium_Pancreas': '8988T',
 '9.4_Neuron_Prefrontal': '9.4_Neuron_Prefrontal',
 '90-8TL_Schw

In [6]:
sei_supp_table_1['cell_type'] = sei_supp_table_1['cell_name'].map(cell_name_map_dict)
sei_supp_table_1

Unnamed: 0,Chromatin Profile,AUROC,AUPRC,cell_name,assay,source,part,index,cell_type
0,HeLa_Epithelium_Cervix | BTAF1 | ID:1,0.983,0.033,HeLa_Epithelium_Cervix,BTAF1,ID:1,,0,HeLa_Cervical_Carcinoma
1,H9_Embryonic_Stem_Cell_Embryo | EOMES | ID:1006,0.963,0.380,H9_Embryonic_Stem_Cell_Embryo,EOMES,ID:1006,,1,H9_Embryonic_Stem_Cell_Embryo
2,H9_Embryonic_Stem_Cell_Embryo | EP300 | ID:1007,0.987,0.516,H9_Embryonic_Stem_Cell_Embryo,EP300,ID:1007,,2,H9_Embryonic_Stem_Cell_Embryo
3,H9_Embryonic_Stem_Cell_Embryo | FOXH1 | ID:1010,0.954,0.207,H9_Embryonic_Stem_Cell_Embryo,FOXH1,ID:1010,,3,H9_Embryonic_Stem_Cell_Embryo
4,H9_Embryonic_Stem_Cell_Embryo | FOXH1 | ID:1011,0.962,0.135,H9_Embryonic_Stem_Cell_Embryo,FOXH1,ID:1011,,4,H9_Embryonic_Stem_Cell_Embryo
...,...,...,...,...,...,...,...,...,...
21902,WERI-Rb-1 | CTCF | ENCODE,0.997,0.665,WERI-Rb-1,CTCF,ENCODE,,21902,WERI-Rb-1_Eye
21903,WERI-Rb-1 | DNase | ENCODE,0.968,0.386,WERI-Rb-1,DNase,ENCODE,,21903,WERI-Rb-1_Eye
21904,WI-38 | CTCF | ENCODE,0.997,0.686,WI-38,CTCF,ENCODE,,21904,WI-38_Fibroblast_Lung
21905,WI-38 (4OHTAM_20nM_72hr) | DNase | ENCODE,0.963,0.385,WI-38 (4OHTAM_20nM_72hr),DNase,ENCODE,,21905,


In [7]:
df_pivot = sei_supp_table_1.pivot_table(
    values="index", 
    index="cell_type", 
    columns="assay", 
    aggfunc=list,
)

df_pivot

assay,ADNP,AEBP2,AFF1,AFF4,AGO1,AGO2,AHR,AHRR,AP-2alpha,AP-2gamma,APOBEC3B,AR,ARID1A,ARID2,ARID3A,ARID5B,ARNT,ARNT2,ARNTL,ARRB1,ASCL1,ASCL2,ASH1L,ASH2L,ASXL1,ATAC-seq,ATF1,ATF2,ATF3,ATF4,ATF5,ATF7IP,ATOH1,ATRX,AUTS2,BACH1,BACH2,BAF155,BAF170,BAHD1,BANF1,BANP,BARX1,BARX2,BATF,BATF3,BCAT1,BCL11A,BCL11B,BCL3,BCL6,BCLAF1,BCOR,BDP1,BHLHE40,BIRA,BMI1,BPTF,BRAF,BRCA1,BRD1,BRD2,BRD3,BRD4,BRD7,BRD9,BRDU,BRF1,BRF2,BRPF3,BTAF1,Bach1,Brg1,C11orf30,C17orf49,C17orf96,CAMTA2,CASP8AP2,CBFA2T2,CBFB,CBX1,CBX2,CBX3,CBX4,CBX5,CBX6,CBX7,CBX8,CCDC101,CCND2,CCNT2,CD59,CD74,CDC5L,CDCA2,CDK12,CDK2,CDK6,CDK7,CDK8,CDK9,CDX2,CEBPA,CEBPB,CEBPD,CEBPG,CEBPZ,CENPA,CENPC,CENPT,CHAMP1,CHAT,CHD1,CHD2,CHD4,CHD5,CHD7,CHD8,CHRM2,CIITA,CLOCK,CNOT3,COPS2,COREST,CPSF3L,CREB1,CREB3,CREB3L4,CREBBP,CREM,CRY1,CSDE1,CSNK2A1,CTBP1,CTBP2,CTCF,CTCFL,CTNNB1,CUX1,CtBP2,DACOR1,DAXX,DCP1A,DDX20,DDX21,DDX5,DEAF1,DEK,DIDO1,DLX1,DLX2,DMC1,DNMT1,DNMT3A,DNMT3B,DNase,DNase.all.peaks,DNase.fdr0.01.hot,DNase.fdr0.01.peaks,DNase.hot,DPF1,DPF2,DPPA2,DR1,DRAP1,DROSHA,DUX4,DYRK1A,E2F1,E2F2,E2F3,E2F4,E2F5,E2F6,E2F7,E2F8,EBF1,EBF3,EBNA1BP2,EBNA2,EBNA3,EBNA3C,EED,EGLN2,EGR1,EGR2,EGR3,EHF,EHMT2,ELF1,ELF2,ELF3,ELF5,ELK1,ELK3,ELK4,ELL2,EMSY,EMX1,EOMES,EP300,EP400,EPAS1,EPC1,EPO,ERCC2,ERCC3,ERCC6,ERF,ERG,ESCO2,ESR1,ESRRA,ETS1,ETS2,ETV1,ETV4,ETV5,ETV6,ETV7,EWSR1,EZH1,EZH2,Egr-1,FAIRE,FAM208A,FANCD2,FEV,FEZF1,FGFR1,FLI1,FOS,FOSL1,FOSL2,FOXA1,FOXA2,FOXD2,FOXG1,FOXH1,FOXJ2,FOXK1,FOXK2,FOXM1,FOXO1,FOXO3,FOXP1,FOXP2,FOXP3,FUS,FXR1,FXR2,GABP,GABPA,GAPDH,GATA-1,GATA-2,GATA1,GATA2,GATA3,GATA4,GATA6,GATAD1,GATAD2B,GFI1B,GLI2,GLI4,GLIS1,GLIS2,GLYR1,GMEB1,GMEB2,GPS2,GREB1,GRHL1,GRHL2,GRHL3,GRIP1,GRP20,GTF2A2,GTF2B,GTF2E2,GTF2F1,GTF2I,GTF3C2,GTF3C5,GUCY1B3,H1.0,H1.2,H1.4,H2A,H2A.Bbd,H2A.Z,H2A1,H2AFX,H2AFY,H2AFY2,H2AFZ,H2AK119,H2AK119ub,H2AK5ac,H2AK9ac,H2AX,H2AZ,"H2AZK4ac, H2AZK7ac, H2AZK11ac",H2AZac,H2B,H2BK120ac,H2BK120ub,H2BK12ac,H2BK15ac,H2BK20ac,H2BK5ac,H2Bub,H2Bub1,H3,H3.3,"H3.3,H2A.Z",H3/4ac,H3F3A,H3F3B,H3K122ac,H3K14ac,H3K18ac,H3K18cr,H3K23ac,H3K23me2,H3K27ac,H3K27me1,H3K27me2,H3K27me3,H3K27me3B,H3K36ac,H3K36me1,H3K36me2,H3K36me3,H3K36me3B,H3K4ac,H3K4me1,H3K4me2,H3K4me3,H3K4me3B,H3K56ac,H3K79me1,H3K79me2,H3K79me3,H3K9K14ac,H3K9ac,"H3K9ac, H3K14ac",H3K9me1,H3K9me2,H3K9me3,H3R26Cit,H3T,H3T11ph,H3ac,H4,H4K12ac,H4K16ac,H4K20me1,H4K20me3,H4K5ac,"H4K5ac, H4K8ac, H4K12ac, H4K16ac",H4K8ac,H4K91ac,H4ac,HA-E2F1,HAND1,HAND2,HBP1,HCFC1,HCFC1R1,HDAC1,HDAC2,HDAC3,HDAC4,HDAC6,HDAC8,HDGF,HECTD1,HES1,HES2,HEXIM1,HEY1,HEYL,HHEX,HIC1,HIF1A,HINFP,HIRA,HJURP,HLF,HLTF,HMBOX1,HMG20A,HMGN1,HMGN3,HNF1A,HNF1B,HNF4A,HNF4G,HNRNPLL,HOTAIR,HOXA1,HOXA11,HOXA13,HOXA2,HOXA4,HOXA6,HOXA9,HOXB13,HOXB7,HOXC9,HSF1,Histone Lysine Acetylation,Histone Lysine Crotonylation,ICE1,ICE2,ID3,IKZF1,IKZF2,ILK,ING2,ING5,INO80,INSM2,INTS11,INTS12,INTS3,IRAK1,IRAK4,IRF1,IRF2,IRF3,IRF4,IRF5,IRF9,Ini1,JARID1A,JARID2,JMJD1C,JMJD6,JUN,JUNB,JUND,JunD,KAP1,KAT2B,KAT5,KAT7,KAT8,KDM1A,KDM1B,KDM2B,KDM3A,KDM3B,KDM4A,KDM4B,KDM4C,KDM5A,KDM5B,KDM5C,KDM6A,KDM6B,KLF1,KLF10,KLF11,KLF12,KLF13,KLF15,KLF16,KLF17,KLF3,KLF4,KLF5,KLF6,KLF7,KLF8,KLF9,KMT2A,KMT2B,KMT2D,KRAB,L3MBTL2,L3MBTL4,LANA,LARP7,LDB1,LEF1,LEO1,LHX2,LIN9,LMNA,LMNB1,LMO1,LMO2,LMTK3,LRWD1,LYL1,MAF,MAFB,MAFF,MAFG,MAFK,MAML3,MAPK1,MAX,MAZ,MBD1_isoform1,MBD1_isoform2,MBD2,MBD3,MBD4,MBOAT4,MBTD1,MCM2,MCM3,MCM7,MCRS1,MDM2,MECOM,MECP2,MED1,MED12,MEF2A,MEF2B,MEF2C,MEF2D,MEIS1,MEN1,METTL14,MGEA5,MIER1,MITF,MKL1,MKL2,MLLT1,MLLT3,MNT,MORC2,MPHOSPH8,MRE11A,MTA2,MTA3,MTOR,MXD3,MXI1,MYB,MYBL2,MYC,MYCN,MYF5,MYH11,MYNN,MYOD1,MYOG,MZF1,MafF,MafK,Max,Mxi1,NANOG,NBN,NCAPG,NCAPG2,NCAPH2,NCOA1,NCOR1,NCOR2,NELFA,NELFE,NELFe,NEUROD1,NEUROG2,NF-E2,NF-YA,NF-YB,NFAT5,NFATC1,NFATC3,NFE2,NFE2L1,NFE2L2,NFIA,NFIC,NFIL3,NFKB1,NFKB2,NFRKB,NFYA,NFYB,NFYC,NIPBL,NKRF,NKX2-1,NKX2-2,NKX3-1,NME2,NONO,NOTCH1,NOTCH3,NPAT,NR0B1,NR1H2,NR1H3,NR2C2,NR2F1,NR2F2,NR2F6,NR3C1,NR4A1,NR5A2,NRF1,NRSF,NUP153,NUP98,NUP98-HOXA9,Nrf1,OGT,ORC1,ORC2,OSR2,OTX2,OVOL2,OVOL3,PAF1,PARP1,PATZ1,PAX3,PAX5,PAX5-C20,PAX5-N19,PAX6,PAX8,PBX1,PBX2,PBX3,PCGF1,PCGF2,PDX1,PGBD3,PGR,PHF2,PHF20,PHF6,PHF8,PHIP,PHOX2B,PIAS1,PIAS4,PITX3,PKNOX1,PLRG1,PLU1,PMEL,PML,POLR2A,POLR2AphosphoS5,POLR2B,POLR2H,POLR2M,POLR3A,POLR3D,POU2F1,POU2F2,POU3F2,POU5F1,PPARD,PPARG,PPARGC1A,PR,PRAME,PRDM1,PRDM10,PRDM11,PRDM12,PRDM14,PRDM2,PRDM6,PRKDC,PRMT1,PRMT5,PROX1,PRPF4,PSIP1,PSMD1,PTPA,PTPN11,PTRF,PTTG1,PU.1,PYGO2,Pbx3,Pol2,Pol2(b),Pol2(phosphoS2),Pol2-4H8,Pol3,RAC3,RAD21,RAD51,RAG2,RARA,RARG,RB1,RBBP5,RBCK1,RBL1,RBL2,RBP2,RBPJ,RCOR1,REL,RELA,RELB,REPIN1,REST,RFX1,RFX2,RFX5,RING1,RNF2,RPC155,RPE,RUNX1,RUNX1T1,RUNX2,RUNX3,RUVBL1,RUVBL2,RXRA,RXRG,RYBP,Rad21,SALL4,SAP30,SATB1,SCML2,SCRT1,SCRT2,SETD1A,SETDB1,SETX,SF1,SFMBT1,SFPQ,SIN3A,SIRT1,SIRT6,SIX1,SIX2,SIX4,SIX5,SKI,SMAD1,SMAD2,SMAD2/3,SMAD3,SMAD4,SMAD5,SMARCA2,SMARCA4,SMARCA5,SMARCB1,SMARCC1,SMARCC2,SMARCE1,SMC1A,SMC3,SMN1,SNAI2,SNAPC1,SNAPC2,SND1,SON,SOX10,SOX11,SOX13,SOX17,SOX2,SOX4,SOX9,SP1,SP140,SP2,SP3,SP4,SP7,SPDEF,SPI1,SPIB,SPIN1,SPT20,SRC,SRCAP,SREBF1,SREBF2,SRF,SRSF3,SS18,SSRP1,SSU72,STAG1,STAT1,STAT2,STAT3,STAT4,STAT5,STAT5A,STAT5B,SUMO1,SUMO2,SUPT5H,SUZ12,SVIL,Sin3Ak-20,T,TAF1,TAF3,TAF7,TAFII,TAL1,TARDBP,TAT,TAZ,TBL1X,TBL1XR1,TBLR1,TBP,TBX21,TBX5,TCF12,TCF21,TCF3,TCF4,TCF7,TCF7L1,TCF7L2,TCOF1,TDRD3,TEAD1,"TEAD1, TEAD4",TEAD2,TEAD4,TERC,TERF1,TERF2,TET1,TET2,TET3,TFAP2A,TFAP2C,TFAP4,TFDP1,TFIIIC-110,TGIF2,THAP1,THAP11,TLE3,TLX1,TOP1,TOP2B,TP53,TP63,TP73,TR4,TRAF7,TRIM22,TRIM24,TRIM25,TRIM28,TRRAP,TSC22D4,TSHZ1,TTF1,TTF2,U2AF1,UBE2I,UBF,UBTF,UHRF2,USF-1,USF1,USF2,USP49,USP7,VDR,VEZF1,WDHD1,WDR5,WHIP,WHSC1,WRNIP1,WT1,WWTR1,XBP1,XCL1,XRN2,YAP1,YBX1,YBX3,YY1,ZBED1,ZBTB1,ZBTB10,ZBTB11,ZBTB14,ZBTB16,ZBTB17,ZBTB18,ZBTB2,ZBTB26,ZBTB33,ZBTB40,ZBTB42,ZBTB48,ZBTB49,ZBTB6,ZBTB7A,ZBTB7B,ZBTB8A,ZC3H8,ZEB1,ZEB2,ZFAT,ZFP2,ZFP28,ZFP3,ZFP37,ZFP41,ZFP42,ZFP57,ZFP64,ZFP69,ZFP69B,ZFP90,ZFX,ZIC2,ZIM3,ZKSCAN1,ZKSCAN2,ZKSCAN5,ZKSCAN8,ZMIZ1,ZMYM3,ZMYND11,ZMYND8,ZNF10,ZNF100,ZNF101,ZNF12,ZNF121,ZNF124,ZNF131,ZNF133,ZNF134,ZNF135,ZNF136,ZNF138,ZNF140,ZNF141,ZNF143,ZNF146,ZNF157,ZNF16,ZNF169,ZNF17,ZNF175,ZNF18,ZNF180,ZNF182,ZNF189,ZNF197,ZNF2,ZNF202,ZNF207,ZNF217,ZNF22,ZNF222,ZNF239,ZNF24,ZNF248,ZNF254,ZNF257,ZNF26,ZNF260,ZNF263,ZNF264,ZNF266,ZNF267,ZNF273,ZNF274,ZNF28,ZNF280A,ZNF280D,ZNF281,ZNF282,ZNF284,ZNF287,ZNF292,ZNF30,ZNF304,ZNF317,ZNF318,ZNF320,ZNF322,ZNF324,ZNF329,ZNF331,ZNF333,ZNF334,ZNF335,ZNF337,ZNF33A,ZNF341,ZNF343,ZNF346,ZNF35,ZNF350,ZNF354A,ZNF354C,ZNF362,ZNF366,ZNF382,ZNF383,ZNF384,ZNF391,ZNF394,ZNF407,ZNF41,ZNF410,ZNF414,ZNF423,ZNF425,ZNF429,ZNF430,ZNF433,ZNF436,ZNF438,ZNF44,ZNF440,ZNF441,ZNF445,ZNF449,ZNF460,ZNF467,ZNF468,ZNF479,ZNF48,ZNF480,ZNF483,ZNF485,ZNF486,ZNF488,ZNF490,ZNF501,ZNF506,ZNF512,ZNF518A,ZNF519,ZNF528,ZNF530,ZNF534,ZNF543,ZNF547,ZNF549,ZNF554,ZNF555,ZNF557,ZNF558,ZNF561,ZNF563,ZNF565,ZNF567,ZNF573,ZNF574,ZNF580,ZNF584,ZNF585A,ZNF585B,ZNF586,ZNF589,ZNF592,ZNF597,ZNF600,ZNF605,ZNF610,ZNF611,ZNF616,ZNF618,ZNF623,ZNF627,ZNF639,ZNF641,ZNF644,ZNF649,ZNF654,ZNF664,ZNF671,ZNF674,ZNF675,ZNF680,ZNF682,ZNF687,ZNF692,ZNF695,ZNF697,ZNF701,ZNF707,ZNF708,ZNF71,ZNF711,ZNF714,ZNF716,ZNF730,ZNF736,ZNF740,ZNF750,ZNF75A,ZNF75D,ZNF76,ZNF765,ZNF766,ZNF768,ZNF770,ZNF777,ZNF778,ZNF780A,ZNF781,ZNF783,ZNF786,ZNF788,ZNF792,ZNF793,ZNF8,ZNF800,ZNF808,ZNF81,ZNF816,ZNF823,ZNF83,ZNF837,ZNF84,ZNF846,ZNF85,ZNF879,ZNF92,ZNF93,ZSCAN16,ZSCAN2,ZSCAN20,ZSCAN22,ZSCAN23,ZSCAN29,ZSCAN31,ZSCAN5A,ZTA,ZXDB,ZXDC,ZZZ3,Znf143,c-Fos,c-Jun,c-Myc,eGFP-FOS,eGFP-GATA2,eGFP-HDAC8,eGFP-JunB,eGFP-JunD,p300
cell_type,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1,Unnamed: 177_level_1,Unnamed: 178_level_1,Unnamed: 179_level_1,Unnamed: 180_level_1,Unnamed: 181_level_1,Unnamed: 182_level_1,Unnamed: 183_level_1,Unnamed: 184_level_1,Unnamed: 185_level_1,Unnamed: 186_level_1,Unnamed: 187_level_1,Unnamed: 188_level_1,Unnamed: 189_level_1,Unnamed: 190_level_1,Unnamed: 191_level_1,Unnamed: 192_level_1,Unnamed: 193_level_1,Unnamed: 194_level_1,Unnamed: 195_level_1,Unnamed: 196_level_1,Unnamed: 197_level_1,Unnamed: 198_level_1,Unnamed: 199_level_1,Unnamed: 200_level_1,Unnamed: 201_level_1,Unnamed: 202_level_1,Unnamed: 203_level_1,Unnamed: 204_level_1,Unnamed: 205_level_1,Unnamed: 206_level_1,Unnamed: 207_level_1,Unnamed: 208_level_1,Unnamed: 209_level_1,Unnamed: 210_level_1,Unnamed: 211_level_1,Unnamed: 212_level_1,Unnamed: 213_level_1,Unnamed: 214_level_1,Unnamed: 215_level_1,Unnamed: 216_level_1,Unnamed: 217_level_1,Unnamed: 218_level_1,Unnamed: 219_level_1,Unnamed: 220_level_1,Unnamed: 221_level_1,Unnamed: 222_level_1,Unnamed: 223_level_1,Unnamed: 224_level_1,Unnamed: 225_level_1,Unnamed: 226_level_1,Unnamed: 227_level_1,Unnamed: 228_level_1,Unnamed: 229_level_1,Unnamed: 230_level_1,Unnamed: 231_level_1,Unnamed: 232_level_1,Unnamed: 233_level_1,Unnamed: 234_level_1,Unnamed: 235_level_1,Unnamed: 236_level_1,Unnamed: 237_level_1,Unnamed: 238_level_1,Unnamed: 239_level_1,Unnamed: 240_level_1,Unnamed: 241_level_1,Unnamed: 242_level_1,Unnamed: 243_level_1,Unnamed: 244_level_1,Unnamed: 245_level_1,Unnamed: 246_level_1,Unnamed: 247_level_1,Unnamed: 248_level_1,Unnamed: 249_level_1,Unnamed: 250_level_1,Unnamed: 251_level_1,Unnamed: 252_level_1,Unnamed: 253_level_1,Unnamed: 254_level_1,Unnamed: 255_level_1,Unnamed: 256_level_1,Unnamed: 257_level_1,Unnamed: 258_level_1,Unnamed: 259_level_1,Unnamed: 260_level_1,Unnamed: 261_level_1,Unnamed: 262_level_1,Unnamed: 263_level_1,Unnamed: 264_level_1,Unnamed: 265_level_1,Unnamed: 266_level_1,Unnamed: 267_level_1,Unnamed: 268_level_1,Unnamed: 269_level_1,Unnamed: 270_level_1,Unnamed: 271_level_1,Unnamed: 272_level_1,Unnamed: 273_level_1,Unnamed: 274_level_1,Unnamed: 275_level_1,Unnamed: 276_level_1,Unnamed: 277_level_1,Unnamed: 278_level_1,Unnamed: 279_level_1,Unnamed: 280_level_1,Unnamed: 281_level_1,Unnamed: 282_level_1,Unnamed: 283_level_1,Unnamed: 284_level_1,Unnamed: 285_level_1,Unnamed: 286_level_1,Unnamed: 287_level_1,Unnamed: 288_level_1,Unnamed: 289_level_1,Unnamed: 290_level_1,Unnamed: 291_level_1,Unnamed: 292_level_1,Unnamed: 293_level_1,Unnamed: 294_level_1,Unnamed: 295_level_1,Unnamed: 296_level_1,Unnamed: 297_level_1,Unnamed: 298_level_1,Unnamed: 299_level_1,Unnamed: 300_level_1,Unnamed: 301_level_1,Unnamed: 302_level_1,Unnamed: 303_level_1,Unnamed: 304_level_1,Unnamed: 305_level_1,Unnamed: 306_level_1,Unnamed: 307_level_1,Unnamed: 308_level_1,Unnamed: 309_level_1,Unnamed: 310_level_1,Unnamed: 311_level_1,Unnamed: 312_level_1,Unnamed: 313_level_1,Unnamed: 314_level_1,Unnamed: 315_level_1,Unnamed: 316_level_1,Unnamed: 317_level_1,Unnamed: 318_level_1,Unnamed: 319_level_1,Unnamed: 320_level_1,Unnamed: 321_level_1,Unnamed: 322_level_1,Unnamed: 323_level_1,Unnamed: 324_level_1,Unnamed: 325_level_1,Unnamed: 326_level_1,Unnamed: 327_level_1,Unnamed: 328_level_1,Unnamed: 329_level_1,Unnamed: 330_level_1,Unnamed: 331_level_1,Unnamed: 332_level_1,Unnamed: 333_level_1,Unnamed: 334_level_1,Unnamed: 335_level_1,Unnamed: 336_level_1,Unnamed: 337_level_1,Unnamed: 338_level_1,Unnamed: 339_level_1,Unnamed: 340_level_1,Unnamed: 341_level_1,Unnamed: 342_level_1,Unnamed: 343_level_1,Unnamed: 344_level_1,Unnamed: 345_level_1,Unnamed: 346_level_1,Unnamed: 347_level_1,Unnamed: 348_level_1,Unnamed: 349_level_1,Unnamed: 350_level_1,Unnamed: 351_level_1,Unnamed: 352_level_1,Unnamed: 353_level_1,Unnamed: 354_level_1,Unnamed: 355_level_1,Unnamed: 356_level_1,Unnamed: 357_level_1,Unnamed: 358_level_1,Unnamed: 359_level_1,Unnamed: 360_level_1,Unnamed: 361_level_1,Unnamed: 362_level_1,Unnamed: 363_level_1,Unnamed: 364_level_1,Unnamed: 365_level_1,Unnamed: 366_level_1,Unnamed: 367_level_1,Unnamed: 368_level_1,Unnamed: 369_level_1,Unnamed: 370_level_1,Unnamed: 371_level_1,Unnamed: 372_level_1,Unnamed: 373_level_1,Unnamed: 374_level_1,Unnamed: 375_level_1,Unnamed: 376_level_1,Unnamed: 377_level_1,Unnamed: 378_level_1,Unnamed: 379_level_1,Unnamed: 380_level_1,Unnamed: 381_level_1,Unnamed: 382_level_1,Unnamed: 383_level_1,Unnamed: 384_level_1,Unnamed: 385_level_1,Unnamed: 386_level_1,Unnamed: 387_level_1,Unnamed: 388_level_1,Unnamed: 389_level_1,Unnamed: 390_level_1,Unnamed: 391_level_1,Unnamed: 392_level_1,Unnamed: 393_level_1,Unnamed: 394_level_1,Unnamed: 395_level_1,Unnamed: 396_level_1,Unnamed: 397_level_1,Unnamed: 398_level_1,Unnamed: 399_level_1,Unnamed: 400_level_1,Unnamed: 401_level_1,Unnamed: 402_level_1,Unnamed: 403_level_1,Unnamed: 404_level_1,Unnamed: 405_level_1,Unnamed: 406_level_1,Unnamed: 407_level_1,Unnamed: 408_level_1,Unnamed: 409_level_1,Unnamed: 410_level_1,Unnamed: 411_level_1,Unnamed: 412_level_1,Unnamed: 413_level_1,Unnamed: 414_level_1,Unnamed: 415_level_1,Unnamed: 416_level_1,Unnamed: 417_level_1,Unnamed: 418_level_1,Unnamed: 419_level_1,Unnamed: 420_level_1,Unnamed: 421_level_1,Unnamed: 422_level_1,Unnamed: 423_level_1,Unnamed: 424_level_1,Unnamed: 425_level_1,Unnamed: 426_level_1,Unnamed: 427_level_1,Unnamed: 428_level_1,Unnamed: 429_level_1,Unnamed: 430_level_1,Unnamed: 431_level_1,Unnamed: 432_level_1,Unnamed: 433_level_1,Unnamed: 434_level_1,Unnamed: 435_level_1,Unnamed: 436_level_1,Unnamed: 437_level_1,Unnamed: 438_level_1,Unnamed: 439_level_1,Unnamed: 440_level_1,Unnamed: 441_level_1,Unnamed: 442_level_1,Unnamed: 443_level_1,Unnamed: 444_level_1,Unnamed: 445_level_1,Unnamed: 446_level_1,Unnamed: 447_level_1,Unnamed: 448_level_1,Unnamed: 449_level_1,Unnamed: 450_level_1,Unnamed: 451_level_1,Unnamed: 452_level_1,Unnamed: 453_level_1,Unnamed: 454_level_1,Unnamed: 455_level_1,Unnamed: 456_level_1,Unnamed: 457_level_1,Unnamed: 458_level_1,Unnamed: 459_level_1,Unnamed: 460_level_1,Unnamed: 461_level_1,Unnamed: 462_level_1,Unnamed: 463_level_1,Unnamed: 464_level_1,Unnamed: 465_level_1,Unnamed: 466_level_1,Unnamed: 467_level_1,Unnamed: 468_level_1,Unnamed: 469_level_1,Unnamed: 470_level_1,Unnamed: 471_level_1,Unnamed: 472_level_1,Unnamed: 473_level_1,Unnamed: 474_level_1,Unnamed: 475_level_1,Unnamed: 476_level_1,Unnamed: 477_level_1,Unnamed: 478_level_1,Unnamed: 479_level_1,Unnamed: 480_level_1,Unnamed: 481_level_1,Unnamed: 482_level_1,Unnamed: 483_level_1,Unnamed: 484_level_1,Unnamed: 485_level_1,Unnamed: 486_level_1,Unnamed: 487_level_1,Unnamed: 488_level_1,Unnamed: 489_level_1,Unnamed: 490_level_1,Unnamed: 491_level_1,Unnamed: 492_level_1,Unnamed: 493_level_1,Unnamed: 494_level_1,Unnamed: 495_level_1,Unnamed: 496_level_1,Unnamed: 497_level_1,Unnamed: 498_level_1,Unnamed: 499_level_1,Unnamed: 500_level_1,Unnamed: 501_level_1,Unnamed: 502_level_1,Unnamed: 503_level_1,Unnamed: 504_level_1,Unnamed: 505_level_1,Unnamed: 506_level_1,Unnamed: 507_level_1,Unnamed: 508_level_1,Unnamed: 509_level_1,Unnamed: 510_level_1,Unnamed: 511_level_1,Unnamed: 512_level_1,Unnamed: 513_level_1,Unnamed: 514_level_1,Unnamed: 515_level_1,Unnamed: 516_level_1,Unnamed: 517_level_1,Unnamed: 518_level_1,Unnamed: 519_level_1,Unnamed: 520_level_1,Unnamed: 521_level_1,Unnamed: 522_level_1,Unnamed: 523_level_1,Unnamed: 524_level_1,Unnamed: 525_level_1,Unnamed: 526_level_1,Unnamed: 527_level_1,Unnamed: 528_level_1,Unnamed: 529_level_1,Unnamed: 530_level_1,Unnamed: 531_level_1,Unnamed: 532_level_1,Unnamed: 533_level_1,Unnamed: 534_level_1,Unnamed: 535_level_1,Unnamed: 536_level_1,Unnamed: 537_level_1,Unnamed: 538_level_1,Unnamed: 539_level_1,Unnamed: 540_level_1,Unnamed: 541_level_1,Unnamed: 542_level_1,Unnamed: 543_level_1,Unnamed: 544_level_1,Unnamed: 545_level_1,Unnamed: 546_level_1,Unnamed: 547_level_1,Unnamed: 548_level_1,Unnamed: 549_level_1,Unnamed: 550_level_1,Unnamed: 551_level_1,Unnamed: 552_level_1,Unnamed: 553_level_1,Unnamed: 554_level_1,Unnamed: 555_level_1,Unnamed: 556_level_1,Unnamed: 557_level_1,Unnamed: 558_level_1,Unnamed: 559_level_1,Unnamed: 560_level_1,Unnamed: 561_level_1,Unnamed: 562_level_1,Unnamed: 563_level_1,Unnamed: 564_level_1,Unnamed: 565_level_1,Unnamed: 566_level_1,Unnamed: 567_level_1,Unnamed: 568_level_1,Unnamed: 569_level_1,Unnamed: 570_level_1,Unnamed: 571_level_1,Unnamed: 572_level_1,Unnamed: 573_level_1,Unnamed: 574_level_1,Unnamed: 575_level_1,Unnamed: 576_level_1,Unnamed: 577_level_1,Unnamed: 578_level_1,Unnamed: 579_level_1,Unnamed: 580_level_1,Unnamed: 581_level_1,Unnamed: 582_level_1,Unnamed: 583_level_1,Unnamed: 584_level_1,Unnamed: 585_level_1,Unnamed: 586_level_1,Unnamed: 587_level_1,Unnamed: 588_level_1,Unnamed: 589_level_1,Unnamed: 590_level_1,Unnamed: 591_level_1,Unnamed: 592_level_1,Unnamed: 593_level_1,Unnamed: 594_level_1,Unnamed: 595_level_1,Unnamed: 596_level_1,Unnamed: 597_level_1,Unnamed: 598_level_1,Unnamed: 599_level_1,Unnamed: 600_level_1,Unnamed: 601_level_1,Unnamed: 602_level_1,Unnamed: 603_level_1,Unnamed: 604_level_1,Unnamed: 605_level_1,Unnamed: 606_level_1,Unnamed: 607_level_1,Unnamed: 608_level_1,Unnamed: 609_level_1,Unnamed: 610_level_1,Unnamed: 611_level_1,Unnamed: 612_level_1,Unnamed: 613_level_1,Unnamed: 614_level_1,Unnamed: 615_level_1,Unnamed: 616_level_1,Unnamed: 617_level_1,Unnamed: 618_level_1,Unnamed: 619_level_1,Unnamed: 620_level_1,Unnamed: 621_level_1,Unnamed: 622_level_1,Unnamed: 623_level_1,Unnamed: 624_level_1,Unnamed: 625_level_1,Unnamed: 626_level_1,Unnamed: 627_level_1,Unnamed: 628_level_1,Unnamed: 629_level_1,Unnamed: 630_level_1,Unnamed: 631_level_1,Unnamed: 632_level_1,Unnamed: 633_level_1,Unnamed: 634_level_1,Unnamed: 635_level_1,Unnamed: 636_level_1,Unnamed: 637_level_1,Unnamed: 638_level_1,Unnamed: 639_level_1,Unnamed: 640_level_1,Unnamed: 641_level_1,Unnamed: 642_level_1,Unnamed: 643_level_1,Unnamed: 644_level_1,Unnamed: 645_level_1,Unnamed: 646_level_1,Unnamed: 647_level_1,Unnamed: 648_level_1,Unnamed: 649_level_1,Unnamed: 650_level_1,Unnamed: 651_level_1,Unnamed: 652_level_1,Unnamed: 653_level_1,Unnamed: 654_level_1,Unnamed: 655_level_1,Unnamed: 656_level_1,Unnamed: 657_level_1,Unnamed: 658_level_1,Unnamed: 659_level_1,Unnamed: 660_level_1,Unnamed: 661_level_1,Unnamed: 662_level_1,Unnamed: 663_level_1,Unnamed: 664_level_1,Unnamed: 665_level_1,Unnamed: 666_level_1,Unnamed: 667_level_1,Unnamed: 668_level_1,Unnamed: 669_level_1,Unnamed: 670_level_1,Unnamed: 671_level_1,Unnamed: 672_level_1,Unnamed: 673_level_1,Unnamed: 674_level_1,Unnamed: 675_level_1,Unnamed: 676_level_1,Unnamed: 677_level_1,Unnamed: 678_level_1,Unnamed: 679_level_1,Unnamed: 680_level_1,Unnamed: 681_level_1,Unnamed: 682_level_1,Unnamed: 683_level_1,Unnamed: 684_level_1,Unnamed: 685_level_1,Unnamed: 686_level_1,Unnamed: 687_level_1,Unnamed: 688_level_1,Unnamed: 689_level_1,Unnamed: 690_level_1,Unnamed: 691_level_1,Unnamed: 692_level_1,Unnamed: 693_level_1,Unnamed: 694_level_1,Unnamed: 695_level_1,Unnamed: 696_level_1,Unnamed: 697_level_1,Unnamed: 698_level_1,Unnamed: 699_level_1,Unnamed: 700_level_1,Unnamed: 701_level_1,Unnamed: 702_level_1,Unnamed: 703_level_1,Unnamed: 704_level_1,Unnamed: 705_level_1,Unnamed: 706_level_1,Unnamed: 707_level_1,Unnamed: 708_level_1,Unnamed: 709_level_1,Unnamed: 710_level_1,Unnamed: 711_level_1,Unnamed: 712_level_1,Unnamed: 713_level_1,Unnamed: 714_level_1,Unnamed: 715_level_1,Unnamed: 716_level_1,Unnamed: 717_level_1,Unnamed: 718_level_1,Unnamed: 719_level_1,Unnamed: 720_level_1,Unnamed: 721_level_1,Unnamed: 722_level_1,Unnamed: 723_level_1,Unnamed: 724_level_1,Unnamed: 725_level_1,Unnamed: 726_level_1,Unnamed: 727_level_1,Unnamed: 728_level_1,Unnamed: 729_level_1,Unnamed: 730_level_1,Unnamed: 731_level_1,Unnamed: 732_level_1,Unnamed: 733_level_1,Unnamed: 734_level_1,Unnamed: 735_level_1,Unnamed: 736_level_1,Unnamed: 737_level_1,Unnamed: 738_level_1,Unnamed: 739_level_1,Unnamed: 740_level_1,Unnamed: 741_level_1,Unnamed: 742_level_1,Unnamed: 743_level_1,Unnamed: 744_level_1,Unnamed: 745_level_1,Unnamed: 746_level_1,Unnamed: 747_level_1,Unnamed: 748_level_1,Unnamed: 749_level_1,Unnamed: 750_level_1,Unnamed: 751_level_1,Unnamed: 752_level_1,Unnamed: 753_level_1,Unnamed: 754_level_1,Unnamed: 755_level_1,Unnamed: 756_level_1,Unnamed: 757_level_1,Unnamed: 758_level_1,Unnamed: 759_level_1,Unnamed: 760_level_1,Unnamed: 761_level_1,Unnamed: 762_level_1,Unnamed: 763_level_1,Unnamed: 764_level_1,Unnamed: 765_level_1,Unnamed: 766_level_1,Unnamed: 767_level_1,Unnamed: 768_level_1,Unnamed: 769_level_1,Unnamed: 770_level_1,Unnamed: 771_level_1,Unnamed: 772_level_1,Unnamed: 773_level_1,Unnamed: 774_level_1,Unnamed: 775_level_1,Unnamed: 776_level_1,Unnamed: 777_level_1,Unnamed: 778_level_1,Unnamed: 779_level_1,Unnamed: 780_level_1,Unnamed: 781_level_1,Unnamed: 782_level_1,Unnamed: 783_level_1,Unnamed: 784_level_1,Unnamed: 785_level_1,Unnamed: 786_level_1,Unnamed: 787_level_1,Unnamed: 788_level_1,Unnamed: 789_level_1,Unnamed: 790_level_1,Unnamed: 791_level_1,Unnamed: 792_level_1,Unnamed: 793_level_1,Unnamed: 794_level_1,Unnamed: 795_level_1,Unnamed: 796_level_1,Unnamed: 797_level_1,Unnamed: 798_level_1,Unnamed: 799_level_1,Unnamed: 800_level_1,Unnamed: 801_level_1,Unnamed: 802_level_1,Unnamed: 803_level_1,Unnamed: 804_level_1,Unnamed: 805_level_1,Unnamed: 806_level_1,Unnamed: 807_level_1,Unnamed: 808_level_1,Unnamed: 809_level_1,Unnamed: 810_level_1,Unnamed: 811_level_1,Unnamed: 812_level_1,Unnamed: 813_level_1,Unnamed: 814_level_1,Unnamed: 815_level_1,Unnamed: 816_level_1,Unnamed: 817_level_1,Unnamed: 818_level_1,Unnamed: 819_level_1,Unnamed: 820_level_1,Unnamed: 821_level_1,Unnamed: 822_level_1,Unnamed: 823_level_1,Unnamed: 824_level_1,Unnamed: 825_level_1,Unnamed: 826_level_1,Unnamed: 827_level_1,Unnamed: 828_level_1,Unnamed: 829_level_1,Unnamed: 830_level_1,Unnamed: 831_level_1,Unnamed: 832_level_1,Unnamed: 833_level_1,Unnamed: 834_level_1,Unnamed: 835_level_1,Unnamed: 836_level_1,Unnamed: 837_level_1,Unnamed: 838_level_1,Unnamed: 839_level_1,Unnamed: 840_level_1,Unnamed: 841_level_1,Unnamed: 842_level_1,Unnamed: 843_level_1,Unnamed: 844_level_1,Unnamed: 845_level_1,Unnamed: 846_level_1,Unnamed: 847_level_1,Unnamed: 848_level_1,Unnamed: 849_level_1,Unnamed: 850_level_1,Unnamed: 851_level_1,Unnamed: 852_level_1,Unnamed: 853_level_1,Unnamed: 854_level_1,Unnamed: 855_level_1,Unnamed: 856_level_1,Unnamed: 857_level_1,Unnamed: 858_level_1,Unnamed: 859_level_1,Unnamed: 860_level_1,Unnamed: 861_level_1,Unnamed: 862_level_1,Unnamed: 863_level_1,Unnamed: 864_level_1,Unnamed: 865_level_1,Unnamed: 866_level_1,Unnamed: 867_level_1,Unnamed: 868_level_1,Unnamed: 869_level_1,Unnamed: 870_level_1,Unnamed: 871_level_1,Unnamed: 872_level_1,Unnamed: 873_level_1,Unnamed: 874_level_1,Unnamed: 875_level_1,Unnamed: 876_level_1,Unnamed: 877_level_1,Unnamed: 878_level_1,Unnamed: 879_level_1,Unnamed: 880_level_1,Unnamed: 881_level_1,Unnamed: 882_level_1,Unnamed: 883_level_1,Unnamed: 884_level_1,Unnamed: 885_level_1,Unnamed: 886_level_1,Unnamed: 887_level_1,Unnamed: 888_level_1,Unnamed: 889_level_1,Unnamed: 890_level_1,Unnamed: 891_level_1,Unnamed: 892_level_1,Unnamed: 893_level_1,Unnamed: 894_level_1,Unnamed: 895_level_1,Unnamed: 896_level_1,Unnamed: 897_level_1,Unnamed: 898_level_1,Unnamed: 899_level_1,Unnamed: 900_level_1,Unnamed: 901_level_1,Unnamed: 902_level_1,Unnamed: 903_level_1,Unnamed: 904_level_1,Unnamed: 905_level_1,Unnamed: 906_level_1,Unnamed: 907_level_1,Unnamed: 908_level_1,Unnamed: 909_level_1,Unnamed: 910_level_1,Unnamed: 911_level_1,Unnamed: 912_level_1,Unnamed: 913_level_1,Unnamed: 914_level_1,Unnamed: 915_level_1,Unnamed: 916_level_1,Unnamed: 917_level_1,Unnamed: 918_level_1,Unnamed: 919_level_1,Unnamed: 920_level_1,Unnamed: 921_level_1,Unnamed: 922_level_1,Unnamed: 923_level_1,Unnamed: 924_level_1,Unnamed: 925_level_1,Unnamed: 926_level_1,Unnamed: 927_level_1,Unnamed: 928_level_1,Unnamed: 929_level_1,Unnamed: 930_level_1,Unnamed: 931_level_1,Unnamed: 932_level_1,Unnamed: 933_level_1,Unnamed: 934_level_1,Unnamed: 935_level_1,Unnamed: 936_level_1,Unnamed: 937_level_1,Unnamed: 938_level_1,Unnamed: 939_level_1,Unnamed: 940_level_1,Unnamed: 941_level_1,Unnamed: 942_level_1,Unnamed: 943_level_1,Unnamed: 944_level_1,Unnamed: 945_level_1,Unnamed: 946_level_1,Unnamed: 947_level_1,Unnamed: 948_level_1,Unnamed: 949_level_1,Unnamed: 950_level_1,Unnamed: 951_level_1,Unnamed: 952_level_1,Unnamed: 953_level_1,Unnamed: 954_level_1,Unnamed: 955_level_1,Unnamed: 956_level_1,Unnamed: 957_level_1,Unnamed: 958_level_1,Unnamed: 959_level_1,Unnamed: 960_level_1,Unnamed: 961_level_1,Unnamed: 962_level_1,Unnamed: 963_level_1,Unnamed: 964_level_1,Unnamed: 965_level_1,Unnamed: 966_level_1,Unnamed: 967_level_1,Unnamed: 968_level_1,Unnamed: 969_level_1,Unnamed: 970_level_1,Unnamed: 971_level_1,Unnamed: 972_level_1,Unnamed: 973_level_1,Unnamed: 974_level_1,Unnamed: 975_level_1,Unnamed: 976_level_1,Unnamed: 977_level_1,Unnamed: 978_level_1,Unnamed: 979_level_1,Unnamed: 980_level_1,Unnamed: 981_level_1,Unnamed: 982_level_1,Unnamed: 983_level_1,Unnamed: 984_level_1,Unnamed: 985_level_1,Unnamed: 986_level_1,Unnamed: 987_level_1,Unnamed: 988_level_1,Unnamed: 989_level_1,Unnamed: 990_level_1,Unnamed: 991_level_1,Unnamed: 992_level_1,Unnamed: 993_level_1,Unnamed: 994_level_1,Unnamed: 995_level_1,Unnamed: 996_level_1,Unnamed: 997_level_1,Unnamed: 998_level_1,Unnamed: 999_level_1,Unnamed: 1000_level_1,Unnamed: 1001_level_1,Unnamed: 1002_level_1,Unnamed: 1003_level_1,Unnamed: 1004_level_1,Unnamed: 1005_level_1,Unnamed: 1006_level_1,Unnamed: 1007_level_1,Unnamed: 1008_level_1,Unnamed: 1009_level_1,Unnamed: 1010_level_1,Unnamed: 1011_level_1,Unnamed: 1012_level_1,Unnamed: 1013_level_1,Unnamed: 1014_level_1,Unnamed: 1015_level_1,Unnamed: 1016_level_1,Unnamed: 1017_level_1,Unnamed: 1018_level_1,Unnamed: 1019_level_1,Unnamed: 1020_level_1,Unnamed: 1021_level_1,Unnamed: 1022_level_1,Unnamed: 1023_level_1,Unnamed: 1024_level_1,Unnamed: 1025_level_1,Unnamed: 1026_level_1,Unnamed: 1027_level_1,Unnamed: 1028_level_1,Unnamed: 1029_level_1,Unnamed: 1030_level_1,Unnamed: 1031_level_1,Unnamed: 1032_level_1,Unnamed: 1033_level_1,Unnamed: 1034_level_1,Unnamed: 1035_level_1,Unnamed: 1036_level_1,Unnamed: 1037_level_1,Unnamed: 1038_level_1,Unnamed: 1039_level_1,Unnamed: 1040_level_1,Unnamed: 1041_level_1,Unnamed: 1042_level_1,Unnamed: 1043_level_1,Unnamed: 1044_level_1,Unnamed: 1045_level_1,Unnamed: 1046_level_1,Unnamed: 1047_level_1,Unnamed: 1048_level_1,Unnamed: 1049_level_1,Unnamed: 1050_level_1,Unnamed: 1051_level_1,Unnamed: 1052_level_1,Unnamed: 1053_level_1,Unnamed: 1054_level_1,Unnamed: 1055_level_1,Unnamed: 1056_level_1,Unnamed: 1057_level_1,Unnamed: 1058_level_1,Unnamed: 1059_level_1,Unnamed: 1060_level_1,Unnamed: 1061_level_1,Unnamed: 1062_level_1,Unnamed: 1063_level_1,Unnamed: 1064_level_1,Unnamed: 1065_level_1,Unnamed: 1066_level_1,Unnamed: 1067_level_1,Unnamed: 1068_level_1,Unnamed: 1069_level_1,Unnamed: 1070_level_1,Unnamed: 1071_level_1,Unnamed: 1072_level_1,Unnamed: 1073_level_1,Unnamed: 1074_level_1,Unnamed: 1075_level_1,Unnamed: 1076_level_1,Unnamed: 1077_level_1,Unnamed: 1078_level_1,Unnamed: 1079_level_1,Unnamed: 1080_level_1,Unnamed: 1081_level_1,Unnamed: 1082_level_1,Unnamed: 1083_level_1,Unnamed: 1084_level_1,Unnamed: 1085_level_1,Unnamed: 1086_level_1,Unnamed: 1087_level_1,Unnamed: 1088_level_1,Unnamed: 1089_level_1,Unnamed: 1090_level_1,Unnamed: 1091_level_1,Unnamed: 1092_level_1,Unnamed: 1093_level_1,Unnamed: 1094_level_1,Unnamed: 1095_level_1,Unnamed: 1096_level_1,Unnamed: 1097_level_1,Unnamed: 1098_level_1,Unnamed: 1099_level_1,Unnamed: 1100_level_1,Unnamed: 1101_level_1,Unnamed: 1102_level_1,Unnamed: 1103_level_1,Unnamed: 1104_level_1,Unnamed: 1105_level_1,Unnamed: 1106_level_1,Unnamed: 1107_level_1,Unnamed: 1108_level_1,Unnamed: 1109_level_1,Unnamed: 1110_level_1,Unnamed: 1111_level_1,Unnamed: 1112_level_1,Unnamed: 1113_level_1,Unnamed: 1114_level_1,Unnamed: 1115_level_1,Unnamed: 1116_level_1,Unnamed: 1117_level_1,Unnamed: 1118_level_1,Unnamed: 1119_level_1,Unnamed: 1120_level_1,Unnamed: 1121_level_1,Unnamed: 1122_level_1,Unnamed: 1123_level_1,Unnamed: 1124_level_1,Unnamed: 1125_level_1,Unnamed: 1126_level_1,Unnamed: 1127_level_1,Unnamed: 1128_level_1,Unnamed: 1129_level_1,Unnamed: 1130_level_1,Unnamed: 1131_level_1,Unnamed: 1132_level_1,Unnamed: 1133_level_1,Unnamed: 1134_level_1,Unnamed: 1135_level_1,Unnamed: 1136_level_1,Unnamed: 1137_level_1,Unnamed: 1138_level_1,Unnamed: 1139_level_1,Unnamed: 1140_level_1,Unnamed: 1141_level_1,Unnamed: 1142_level_1,Unnamed: 1143_level_1,Unnamed: 1144_level_1,Unnamed: 1145_level_1,Unnamed: 1146_level_1,Unnamed: 1147_level_1,Unnamed: 1148_level_1,Unnamed: 1149_level_1,Unnamed: 1150_level_1,Unnamed: 1151_level_1,Unnamed: 1152_level_1,Unnamed: 1153_level_1,Unnamed: 1154_level_1,Unnamed: 1155_level_1,Unnamed: 1156_level_1,Unnamed: 1157_level_1,Unnamed: 1158_level_1,Unnamed: 1159_level_1,Unnamed: 1160_level_1,Unnamed: 1161_level_1,Unnamed: 1162_level_1,Unnamed: 1163_level_1,Unnamed: 1164_level_1,Unnamed: 1165_level_1,Unnamed: 1166_level_1,Unnamed: 1167_level_1,Unnamed: 1168_level_1,Unnamed: 1169_level_1
1015c,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[8996],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[8998],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
10326,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[8997],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1184_Stem_cell,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,"[17304, 17847, 18648, 19156, 19793]",,,,,,,,,,"[17193, 17303, 17848, 18650, 19155, 19792]",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
133_Astrocyte,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,"[17620, 19226]",,,,,,,,,,"[17931, 19231]",,,,,,,,,,,[19121],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
143B_Osteosarcoma_cell,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[16932],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[17341],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[17391],,,,,,,,,,,[18629],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
inferior_parietal_cortex,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[12402],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
pHTE,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[21751],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
superior_temporal_gyrus,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[11317],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
t(3;21)_paitent,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[16968],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


In [8]:
df_avail = df_pivot[['DNase', 'H3K4me3', 'H3K27ac', 'CTCF']]
df_avail = df_avail[(df_avail.isna().sum(axis=1) == 0)]
df_avail

assay,DNase,H3K4me3,H3K27ac,CTCF
cell_type,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
A549,"[3147, 4493, 4494, 19920]","[1664, 1668, 2466, 2470, 2613, 2621, 2623, 471...","[2478, 2487, 4707, 4715, 10889, 10890, 10891, ...","[4704, 4706, 5075, 5076, 5081, 5083, 5563, 557..."
AG04450_Fibroblast_Fetal_Lung,"[4497, 19983]",[4724],[4725],"[5088, 5089, 19982]"
Astrocyte_Brain,"[3235, 4651, 4652]",[4991],[4993],[4986]
BE2-C,"[4506, 4507, 20000]","[4730, 9964, 18290]","[9233, 9238, 10592, 10593, 10632]","[5098, 5099, 19999]"
BJ_Fibroblast_Foreskin,"[4508, 4509, 7138, 10659, 10660, 10684, 10685,...","[4733, 14000, 14003, 14005, 14279]","[7961, 10582, 17690]","[5100, 5101, 20001]"
B_Lymphocyte_Blood,"[635, 3146, 4516, 4517]","[919, 4740, 4742, 7037]","[2052, 4281, 4282, 4741, 7637, 7638]",[4737]
Brain,"[10678, 10679, 10680, 16416]","[2324, 2325, 2327, 2443, 9384, 9388, 9391, 939...","[2205, 9371, 9372, 9373, 9374, 9375, 9376, 937...","[5104, 5519]"
Caco-2_Epithelium_Colon,"[4514, 4515, 16625, 20080]",[4735],[17327],"[5102, 5103, 20079]"
Embryonic_Stem_Cell_Embryo,[3016],"[1705, 2210, 4098, 4102, 4106, 6849, 6850, 6983]","[2204, 2212, 4099, 4103, 4107, 9947, 9948, 995...","[9949, 9950, 9957, 9958]"
Endothelial_Cell_Umbilical_Vein,"[1491, 3005, 3116, 3117, 3118, 3119, 3120, 312...","[1366, 1397, 2400, 2422, 4817, 4902, 4913, 637...","[940, 942, 1363, 1369, 1943, 2069, 2070, 2077,...","[1344, 1355, 4899, 5228, 5229, 5365, 5366, 537..."


In [9]:
print(len(df_avail))

61


In [17]:
assays = ['DNase', 'H3K4me3', 'H3K27ac', 'CTCF']
cell_types = ['K562', 'HepG2', 'SK-N-SH', 'A549', 'HCT116']
cell_types_standard_names = ['HepG2_Hepatocellular_Carcinoma', 'K562_Leukemia_Cell', 'SK-N-SH_Neuroblastoma_cell_Brain', 'A549', 'HCT-116_Colorectal_cancer_cell_line', 'SK-N-SH_RA_Neuron_Brain']

In [18]:
df_Sei_Siraj = df_pivot.loc[cell_types_standard_names][assays]
df_Sei_Siraj.map(lambda x: len(x) if isinstance(x, list) else 0)

assay,DNase,H3K4me3,H3K27ac,CTCF
cell_type,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
HepG2_Hepatocellular_Carcinoma,9,8,9,17
K562_Leukemia_Cell,58,91,51,29
SK-N-SH_Neuroblastoma_cell_Brain,0,3,3,2
A549,4,45,53,10
HCT-116_Colorectal_cancer_cell_line,6,45,49,14
SK-N-SH_RA_Neuron_Brain,4,1,0,5


In [19]:
pred_array = np.load('../pretrained_models/Sei/Sei_Siraj_pred_562654.npy')
print(pred_array.shape)

(562654, 21907)


In [20]:
MPRA_df = pd.read_csv('../data/SirajMPRA/SirajMPRA_562654.csv')
print(MPRA_df.shape)

(562654, 15)


In [24]:
# average every channel

pred_feature_matrix = np.full(shape=(len(pred_array), len(cell_types), len(assays)), fill_value=np.nan)

pearson_df = pd.DataFrame(index=cell_types, columns=assays, dtype=float)

np.full(shape=(len(cell_types), len(assays)), fill_value=np.nan)

for i, cell_type in enumerate(cell_types):
    for j, assay in enumerate(assays):
        cell_name = cell_types_standard_names[i]
        if cell_type == 'SK-N-SH' and assay == 'DNase':
            # mannual select SK-N-SH_RA
            cell_name = 'SK-N-SH_RA_Neuron_Brain'

        indice = df_Sei_Siraj.loc[cell_name, assay]
        if indice is not None:
            predicted_feature = logit(pred_array[:, indice]).mean(1)
            pred_feature_matrix[:, i, j] = predicted_feature
            true_label = MPRA_df[cell_type]
            r, _ = pearson(predicted_feature, true_label)
            pearson_df.loc[cell_type, assay] = r
            
pearson_df

         DNase  H3K4me3  H3K27ac  CTCF
HepG2      NaN      NaN      NaN   NaN
K562       NaN      NaN      NaN   NaN
SK-N-SH    NaN      NaN      NaN   NaN
A549       NaN      NaN      NaN   NaN
HCT116     NaN      NaN      NaN   NaN


In [26]:
pearson_df

Unnamed: 0,DNase,H3K4me3,H3K27ac,CTCF
HepG2,0.443,0.469,0.427,0.35
K562,0.499,0.451,0.444,0.364
SK-N-SH,0.368,0.486,0.47,0.298
A549,0.348,0.362,0.363,0.247
HCT116,0.424,0.443,0.452,0.329


In [27]:
np.save('Sei_Siraj_pred_feature_matrix.npy', pred_feature_matrix)

In [37]:
###### if model is enformer

model_info_df = pd.read_excel('../data/Enformer/41592_2021_1252_MOESM3_ESM.xlsx', sheet_name='Supplementary Table 2')
model_info_df

Unnamed: 0,index,genome,identifier,file,clip,scale,sum_stat,description,assay_type,target,assay_subtype,DNASE: cell-type agnostic,CAGE: cell-type agnostic,CAGE: IRF6,CAGE: TERT-GBM,CAGE: ZFAND3,"CAGE: HNF4A,MSMB,TERT-HEK293T,MYCrs6983267","CAGE: GP1BB,HBB,HBG1,PKLR","CAGE: F9,LDLR,SORT1",DNASE: IRF4,DNASE: IRF6,DNASE: ZFAND3,"DNASE: HNF4A,MSMB,TERT-HEK293T,MYCrs6983267","DNASE: GP1BB,HBB,HBG1,PKLR","DNASE: F9,LDLR,SORT1"
0,0,0,ENCFF833POA,/home/drk/tillage/datasets/human/dnase/encode/...,32,2,mean,DNASE:cerebellum male adult (27 years) and mal...,DNASE,DNase/cerebellum male adult (27 years) and mal...,DNase,True,False,False,False,False,False,False,False,False,False,False,False,False,False
1,1,0,ENCFF110QGM,/home/drk/tillage/datasets/human/dnase/encode/...,32,2,mean,DNASE:frontal cortex male adult (27 years) and...,DNASE,DNase/frontal cortex male adult (27 years) and...,DNase,True,False,False,False,False,False,False,False,False,False,False,False,False,False
2,2,0,ENCFF880MKD,/home/drk/tillage/datasets/human/dnase/encode/...,32,2,mean,DNASE:chorion,DNASE,DNase/chorion,DNase,True,False,False,False,False,False,False,False,False,False,False,False,False,False
3,3,0,ENCFF463ZLQ,/home/drk/tillage/datasets/human/dnase/encode/...,32,2,mean,DNASE:Ishikawa treated with 0.02% dimethyl sul...,DNASE,DNase/Ishikawa treated with 0.02% dimethyl sul...,DNase,True,False,False,False,False,False,False,False,False,False,False,False,False,False
4,4,0,ENCFF890OGQ,/home/drk/tillage/datasets/human/dnase/encode/...,32,2,mean,DNASE:GM03348,DNASE,DNase/GM03348,DNase,True,False,False,False,False,False,False,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5308,5308,0,CNhs14239,/home/drk/tillage/datasets/human/cage/fantom/C...,384,1,sum,CAGE:epithelioid sarcoma cell line:HS-ES-2R,CAGE,CAGE/epithelioid sarcoma cell line:HS-ES-2R,CAGE,False,True,False,False,False,False,False,False,False,False,False,False,False,False
5309,5309,0,CNhs14240,/home/drk/tillage/datasets/human/cage/fantom/C...,384,1,sum,CAGE:squamous cell lung carcinoma cell line:RE...,CAGE,CAGE/squamous cell lung carcinoma cell line:RE...,CAGE,False,True,False,False,False,False,False,False,False,False,False,False,False,False
5310,5310,0,CNhs14241,/home/drk/tillage/datasets/human/cage/fantom/C...,384,1,sum,CAGE:gastric cancer cell line:GSS,CAGE,CAGE/gastric cancer cell line:GSS,CAGE,False,True,False,False,False,False,False,False,False,False,False,False,False,False
5311,5311,0,CNhs14244,/home/drk/tillage/datasets/human/cage/fantom/C...,384,1,sum,CAGE:carcinoid cell line:NCI-H727,CAGE,CAGE/carcinoid cell line:NCI-H727,CAGE,False,True,False,False,False,False,False,False,False,False,False,False,False,False


In [51]:
model_info_df = model_info_df[['index', 'target']].copy()
model_info_df[['assay', 'cell_type']] = model_info_df['target'].str.split('/', n=1, expand=True)
model_info_df['assay'] = model_info_df['assay'].str.replace('ChIP-Histone:', '').str.replace('ChIP-TF:', '')
model_info_df

Unnamed: 0,index,target,assay,cell_type
0,0,DNase/cerebellum male adult (27 years) and mal...,DNase,cerebellum male adult (27 years) and male adul...
1,1,DNase/frontal cortex male adult (27 years) and...,DNase,frontal cortex male adult (27 years) and male ...
2,2,DNase/chorion,DNase,chorion
3,3,DNase/Ishikawa treated with 0.02% dimethyl sul...,DNase,Ishikawa treated with 0.02% dimethyl sulfoxide...
4,4,DNase/GM03348,DNase,GM03348
...,...,...,...,...
5308,5308,CAGE/epithelioid sarcoma cell line:HS-ES-2R,CAGE,epithelioid sarcoma cell line:HS-ES-2R
5309,5309,CAGE/squamous cell lung carcinoma cell line:RE...,CAGE,squamous cell lung carcinoma cell line:RERF-LC-AI
5310,5310,CAGE/gastric cancer cell line:GSS,CAGE,gastric cancer cell line:GSS
5311,5311,CAGE/carcinoid cell line:NCI-H727,CAGE,carcinoid cell line:NCI-H727


In [52]:
df_pivot = model_info_df.pivot_table(
    values="index", 
    index="cell_type", 
    columns="assay", 
    aggfunc=list,
)
df_pivot

assay,.,3xFLAG-AHR,3xFLAG-ARID4B,3xFLAG-ATF1,3xFLAG-ATF4,3xFLAG-BCL6,3xFLAG-CEBPA,3xFLAG-CEBPG,3xFLAG-CREB1,3xFLAG-DMAP1,3xFLAG-DNMT3B,3xFLAG-DRAP1,3xFLAG-ELF3,3xFLAG-ERF,3xFLAG-ETV5,3xFLAG-FOXA3,3xFLAG-FOXP1,3xFLAG-GABPA,3xFLAG-GABPB1,3xFLAG-GATAD1,3xFLAG-GATAD2A,3xFLAG-GMEB2,3xFLAG-HBP1,3xFLAG-HHEX,3xFLAG-HLF,3xFLAG-HMG20A,3xFLAG-HMG20B,3xFLAG-HOMEZ,3xFLAG-IKZF5,3xFLAG-IRF2,3xFLAG-KAT7,3xFLAG-KAT8,3xFLAG-KDM1A,3xFLAG-KDM3A,3xFLAG-KDM6A,3xFLAG-KLF11,3xFLAG-KLF16,3xFLAG-KLF6,3xFLAG-KLF9,3xFLAG-KMT2B,3xFLAG-MBD1,3xFLAG-MIER2,3xFLAG-MIER3,3xFLAG-MIXL1,3xFLAG-MLX,3xFLAG-MXD3,3xFLAG-MXD4,3xFLAG-MYRF,3xFLAG-NFIA,3xFLAG-NFIL3,3xFLAG-NFKBIZ,3xFLAG-NFYC,3xFLAG-NR2F1,3xFLAG-NR2F6,3xFLAG-PAF1,3xFLAG-PBX2,3xFLAG-PHF5A,3xFLAG-PPARG,3xFLAG-RAD21,3xFLAG-RARA,3xFLAG-RBPJ,3xFLAG-RCOR2,3xFLAG-RERE,3xFLAG-RFX3,3xFLAG-RFXANK,3xFLAG-RXRB,3xFLAG-SAP130,3xFLAG-SLC30A9,3xFLAG-SMAD4,3xFLAG-SOX13,3xFLAG-SOX5,3xFLAG-SP5,3xFLAG-SSRP1,3xFLAG-TEAD1,3xFLAG-TEAD3,3xFLAG-TFE3,3xFLAG-TGIF2,3xFLAG-THAP11,3xFLAG-THRB,3xFLAG-ZBED5,3xFLAG-ZBTB25,3xFLAG-ZBTB26,3xFLAG-ZFP1,3xFLAG-ZFP64,3xFLAG-ZGPAT,3xFLAG-ZKSCAN8,3xFLAG-ZNF146,3xFLAG-ZNF205,3xFLAG-ZNF3,3xFLAG-ZNF48,3xFLAG-ZNF511,3xFLAG-ZNF580,3xFLAG-ZNF614,3xFLAG-ZNF639,3xFLAG-ZNF644,3xFLAG-ZNF652,3xFLAG-ZNF7,3xFLAG-ZNF792,3xFLAG-ZSCAN9,AFF1,AGO1,AGO2,ARHGAP35,ARID1B,ARID2,ARID3A,ARNT,ASH1L,ASH2L,ATAC,ATF2,ATF3,ATF4,ATF7,ATM,BACH1,BATF,BCL11A,BCL3,BCLAF1,BCOR,BHLHE40,BMAL1,BMI1,BRCA1,BRD4,BRD9,C11orf30,CAGE,CBFA2T2,CBFA2T3,CBFB,CBX1,CBX2,CBX3,CBX5,CBX8,CC2D1A,CCAR2,CDC5L,CEBPB,CEBPZ,CEBPb,CHAMP1,CHD1,CHD2,CHD4,CHD7,CLOCK,COPS2,CREB1,CREB3L1,CREBBP,CREM,CSDE1,CTBP1,CTBP2,CTCF,CUX1,DACH1,DDX20,DEAF1,DEK,DNMT1,DNase,DPF2,E2F1,E2F4,E2F6,E2F7,E2F8,E4F1,EBF1,EED,EGR1,EHMT2,ELF1,ELF4,ELK1,EP300,EP400,ESR1,ESRRA,ETS1,ETV4,ETV6,EWSR1,EZH2,EZH2phosphoT487,FIP1L1,FOS,FOSL1,FOSL2,FOXA1,FOXA2,FOXK2,FOXM1,FOXP1,FOXP2,FUS,GABPA,GABPB1,GATA1,GATA2,GATA3,GATA4,GATAD2A,GATAD2B,GMEB1,GR,GTF2F1,H2AFZ,H2AK5ac,H2AK9ac,H2BK120ac,H2BK12ac,H2BK15ac,H2BK20ac,H2BK5ac,H3F3A,H3K14ac,H3K18ac,H3K23ac,H3K23me2,H3K27Ac,H3K27ac,H3K27me3,H3K36me3,H3K4ac,H3K4me1,H3K4me2,H3K4me3,H3K56ac,H3K79me1,H3K79me2,H3K9ac,H3K9me1,H3K9me2,H3K9me3,H3T11ph,H4K12ac,H4K20me1,H4K5ac,H4K8ac,H4K91ac,HCFC1,HDAC1,HDAC2,HDAC3,HDAC6,HDGF,HES1,HLTF,HMBOX1,HNF1A,HNF4A,HNF4G,HNRNPH1,HNRNPK,HNRNPL,HNRNPLL,HNRNPUL1,HSF1,IKZF1,IKZF2,ILF3,IRF1,IRF2,IRF3,IRF4,IRF5,JUN,JUNB,JUND,KAT2A,KAT2B,KAT8,KDM1A,KDM4A,KDM4B,KDM5A,KDM5B,KHSRP,KLF16,KLF5,L3MBTL2,LARP7,LCORL,LEF1,MAFF,MAFK,MAX,MAZ,MBD2,MCM2,MCM3,MCM5,MCM7,MEF2A,MEF2B,MEF2C,MEIS2,MGA,MIER1,MITF,MLLT1,MNT,MTA1,MTA2,MTA3,MXI1,MYB,MYBL2,MYC,MYNN,NANOG,NBN,NCOA1,NCOA2,NCOA3,NCOA4,NCOA6,NCOR1,NEUROD1,NFATC1,NFATC3,NFE2,NFE2L2,NFIB,NFIC,NFRKB,NFXL1,NFYA,NFYB,NKRF,NONO,NR0B1,NR2C1,NR2C2,NR2F1,NR2F2,NR2F6,NR3C1,NRF1,NUFIP1,PAX5,PAX8,PBX3,PCBP1,PCBP2,PHB2,PHF20,PHF21A,PHF8,PKNOX1,PLRG1,PML,POLR2A,POLR2AphosphoS2,POLR2AphosphoS5,POLR2B,POLR2G,POU2F2,POU5F1,PPP1R10,PRDM10,PRPF4,PTBP1,PYGO2,RAD21,RAD51,RB1,RBBP5,RBFOX2,RBM14,RBM15,RBM17,RBM22,RBM25,RBM34,RBM39,RCOR1,RELB,REST,RFX1,RFX5,RLF,RNAPII,RNF2,RUNX1,RUNX3,RXRA,SAFB,SAFB2,SAP30,SETDB1,SFPQ,SIN3A,SIN3B,SIRT6,SIX4,SIX5,SKI,SKIL,SMAD1,SMAD2,SMAD5,SMARCA4,SMARCA5,SMARCB1,SMARCC2,SMARCE1,SMC3,SNIP1,SNRNP70,SOX13,SOX6,SP1,SPI1,SREBF1,SREBF2,SRF,SRSF1,SRSF3,SRSF4,SRSF7,SRSF9,STAT1,STAT2,STAT3,STAT5A,SUPT20H,SUPT5H,SUZ12,SYNCRIP,TAF1,TAF15,TAF7,TAF9B,TAL1,TARDBP,TBL1XR1,TBP,TBX21,TBX3,TCF12,TCF7,TCF7L2,TEAD4,TFAP4,THAP1,THRA,THRAP3,TOE1,TRIM22,TRIM24,TRIM25,TRIM28,TRIP13,U2AF1,U2AF2,UBTF,USF1,USF2,WHSC1,WRNIP1,XRCC3,XRCC5,YBX1,YBX3,YY1,ZBED1,ZBTB1,ZBTB11,ZBTB2,ZBTB33,ZBTB40,ZBTB5,ZBTB7A,ZBTB7B,ZBTB8A,ZC3H11A,ZC3H8,ZEB1,ZEB2,ZFP36,ZFP91,ZFX,ZHX1,ZHX2,ZKSCAN1,ZMIZ1,ZMYM3,ZNF143,ZNF184,ZNF207,ZNF217,ZNF24,ZNF263,ZNF274,ZNF280A,ZNF282,ZNF316,ZNF318,ZNF384,ZNF407,ZNF444,ZNF507,ZNF512B,ZNF574,ZNF579,ZNF592,ZNF622,ZNF639,ZNF687,ZNF8,ZNF830,ZSCAN29,ZZZ3,abcam,active,eGFP-ADNP,eGFP-AEBP2,eGFP-ATF1,eGFP-ATF2,eGFP-ATF3,eGFP-BACH1,eGFP-BCL11A,eGFP-BCL11B,eGFP-BCL6B,eGFP-CEBPB,eGFP-CEBPG,eGFP-CREB3,eGFP-CTCF,eGFP-CUX1,eGFP-DDX20,eGFP-DIDO1,eGFP-E2F4,eGFP-E2F5,eGFP-EGR2,eGFP-ELF1,eGFP-ETS2,eGFP-ETV1,eGFP-FEZF1,eGFP-FOSL1,eGFP-FOSL2,eGFP-FOXJ2,eGFP-GABPA,eGFP-GATA2,eGFP-GFI1B,eGFP-GLI2,eGFP-GLI4,eGFP-GLIS1,eGFP-GLIS2,eGFP-GTF2A2,eGFP-GTF2E2,eGFP-HDAC8,eGFP-HIC1,eGFP-HINFP,eGFP-ID3,eGFP-IKZF3,eGFP-ILK,eGFP-INSM2,eGFP-IRF1,eGFP-IRF9,eGFP-KLF1,eGFP-KLF10,eGFP-KLF13,eGFP-KLF14,eGFP-KLF16,eGFP-KLF17,eGFP-KLF4,eGFP-KLF7,eGFP-KLF8,eGFP-KLF9,eGFP-MAFG,eGFP-MAZ,eGFP-MEF2D,eGFP-MYNN,eGFP-MZF1,eGFP-NFE2,eGFP-NFE2L1,eGFP-NR2C1,eGFP-NR2C2,eGFP-NR4A1,eGFP-OSR2,eGFP-OVOL3,eGFP-PATZ1,eGFP-PBX2,eGFP-POLR2H,eGFP-PRDM1,eGFP-PRDM10,eGFP-PRDM12,eGFP-PRDM2,eGFP-PRDM4,eGFP-PRDM6,eGFP-PTRF,eGFP-PTTG1,eGFP-PYGO2,eGFP-RBAK,eGFP-RELA,eGFP-REPIN1,eGFP-REST,eGFP-SALL1,eGFP-SALL2,eGFP-SCRT1,eGFP-SCRT2,eGFP-SP2,eGFP-SP3,eGFP-SP7,eGFP-TAF7,eGFP-TEAD2,eGFP-TFDP1,eGFP-TSC22D4,eGFP-TSHZ1,eGFP-USF2,eGFP-VEZF1,eGFP-WT1,eGFP-YY1,eGFP-YY2,eGFP-ZBTB1,eGFP-ZBTB10,eGFP-ZBTB11,eGFP-ZBTB12,eGFP-ZBTB17,eGFP-ZBTB20,eGFP-ZBTB21,eGFP-ZBTB26,eGFP-ZBTB40,eGFP-ZBTB44,eGFP-ZBTB48,eGFP-ZBTB49,eGFP-ZBTB6,eGFP-ZBTB7A,eGFP-ZBTB8A,eGFP-ZEB1,eGFP-ZEB2,eGFP-ZFHX2,eGFP-ZFP3,eGFP-ZFP37,eGFP-ZFP41,eGFP-ZFP64,eGFP-ZFP69B,eGFP-ZFX,eGFP-ZIC2,eGFP-ZIK1,eGFP-ZKSCAN8,eGFP-ZNF10,eGFP-ZNF101,eGFP-ZNF112,eGFP-ZNF114,eGFP-ZNF121,eGFP-ZNF132,eGFP-ZNF133,eGFP-ZNF138,eGFP-ZNF140,eGFP-ZNF146,eGFP-ZNF148,eGFP-ZNF155,eGFP-ZNF157,eGFP-ZNF16,eGFP-ZNF169,eGFP-ZNF174,eGFP-ZNF175,eGFP-ZNF18,eGFP-ZNF184,eGFP-ZNF189,eGFP-ZNF19,eGFP-ZNF195,eGFP-ZNF197,eGFP-ZNF2,eGFP-ZNF202,eGFP-ZNF211,eGFP-ZNF213,eGFP-ZNF214,eGFP-ZNF221,eGFP-ZNF223,eGFP-ZNF23,eGFP-ZNF239,eGFP-ZNF24,eGFP-ZNF248,eGFP-ZNF26,eGFP-ZNF266,eGFP-ZNF274,eGFP-ZNF280C,eGFP-ZNF280D,eGFP-ZNF292,eGFP-ZNF300,eGFP-ZNF302,eGFP-ZNF311,eGFP-ZNF324,eGFP-ZNF331,eGFP-ZNF335,eGFP-ZNF34,eGFP-ZNF341,eGFP-ZNF350,eGFP-ZNF354B,eGFP-ZNF354C,eGFP-ZNF362,eGFP-ZNF366,eGFP-ZNF37A,eGFP-ZNF391,eGFP-ZNF394,eGFP-ZNF395,eGFP-ZNF398,eGFP-ZNF404,eGFP-ZNF416,eGFP-ZNF423,eGFP-ZNF426,eGFP-ZNF433,eGFP-ZNF449,eGFP-ZNF473,eGFP-ZNF48,eGFP-ZNF488,eGFP-ZNF491,eGFP-ZNF493,eGFP-ZNF501,eGFP-ZNF507,eGFP-ZNF510,eGFP-ZNF512,eGFP-ZNF513,eGFP-ZNF514,eGFP-ZNF518A,eGFP-ZNF521,eGFP-ZNF524,eGFP-ZNF529,eGFP-ZNF530,eGFP-ZNF544,eGFP-ZNF547,eGFP-ZNF548,eGFP-ZNF549,eGFP-ZNF555,eGFP-ZNF558,eGFP-ZNF560,eGFP-ZNF561,eGFP-ZNF571,eGFP-ZNF577,eGFP-ZNF580,eGFP-ZNF584,eGFP-ZNF585B,eGFP-ZNF589,eGFP-ZNF596,eGFP-ZNF600,eGFP-ZNF610,eGFP-ZNF621,eGFP-ZNF623,eGFP-ZNF624,eGFP-ZNF629,eGFP-ZNF639,eGFP-ZNF644,eGFP-ZNF645,eGFP-ZNF654,eGFP-ZNF658,eGFP-ZNF660,eGFP-ZNF662,eGFP-ZNF664,eGFP-ZNF670,eGFP-ZNF677,eGFP-ZNF680,eGFP-ZNF692,eGFP-ZNF697,eGFP-ZNF701,eGFP-ZNF704,eGFP-ZNF707,eGFP-ZNF740,eGFP-ZNF747,eGFP-ZNF76,eGFP-ZNF766,eGFP-ZNF768,eGFP-ZNF770,eGFP-ZNF776,eGFP-ZNF777,eGFP-ZNF781,eGFP-ZNF785,eGFP-ZNF791,eGFP-ZNF792,eGFP-ZNF83,eGFP-ZNF837,eGFP-ZNF843,eGFP-ZSCAN16,eGFP-ZSCAN18,eGFP-ZSCAN21,eGFP-ZSCAN23,eGFP-ZSCAN26,eGFP-ZSCAN30,eGFP-ZSCAN4,eGFP-ZSCAN5A,eGFP-ZSCAN5C,eGFP-ZXDB,hBMAL1,hHIF1A
cell_type,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1,Unnamed: 177_level_1,Unnamed: 178_level_1,Unnamed: 179_level_1,Unnamed: 180_level_1,Unnamed: 181_level_1,Unnamed: 182_level_1,Unnamed: 183_level_1,Unnamed: 184_level_1,Unnamed: 185_level_1,Unnamed: 186_level_1,Unnamed: 187_level_1,Unnamed: 188_level_1,Unnamed: 189_level_1,Unnamed: 190_level_1,Unnamed: 191_level_1,Unnamed: 192_level_1,Unnamed: 193_level_1,Unnamed: 194_level_1,Unnamed: 195_level_1,Unnamed: 196_level_1,Unnamed: 197_level_1,Unnamed: 198_level_1,Unnamed: 199_level_1,Unnamed: 200_level_1,Unnamed: 201_level_1,Unnamed: 202_level_1,Unnamed: 203_level_1,Unnamed: 204_level_1,Unnamed: 205_level_1,Unnamed: 206_level_1,Unnamed: 207_level_1,Unnamed: 208_level_1,Unnamed: 209_level_1,Unnamed: 210_level_1,Unnamed: 211_level_1,Unnamed: 212_level_1,Unnamed: 213_level_1,Unnamed: 214_level_1,Unnamed: 215_level_1,Unnamed: 216_level_1,Unnamed: 217_level_1,Unnamed: 218_level_1,Unnamed: 219_level_1,Unnamed: 220_level_1,Unnamed: 221_level_1,Unnamed: 222_level_1,Unnamed: 223_level_1,Unnamed: 224_level_1,Unnamed: 225_level_1,Unnamed: 226_level_1,Unnamed: 227_level_1,Unnamed: 228_level_1,Unnamed: 229_level_1,Unnamed: 230_level_1,Unnamed: 231_level_1,Unnamed: 232_level_1,Unnamed: 233_level_1,Unnamed: 234_level_1,Unnamed: 235_level_1,Unnamed: 236_level_1,Unnamed: 237_level_1,Unnamed: 238_level_1,Unnamed: 239_level_1,Unnamed: 240_level_1,Unnamed: 241_level_1,Unnamed: 242_level_1,Unnamed: 243_level_1,Unnamed: 244_level_1,Unnamed: 245_level_1,Unnamed: 246_level_1,Unnamed: 247_level_1,Unnamed: 248_level_1,Unnamed: 249_level_1,Unnamed: 250_level_1,Unnamed: 251_level_1,Unnamed: 252_level_1,Unnamed: 253_level_1,Unnamed: 254_level_1,Unnamed: 255_level_1,Unnamed: 256_level_1,Unnamed: 257_level_1,Unnamed: 258_level_1,Unnamed: 259_level_1,Unnamed: 260_level_1,Unnamed: 261_level_1,Unnamed: 262_level_1,Unnamed: 263_level_1,Unnamed: 264_level_1,Unnamed: 265_level_1,Unnamed: 266_level_1,Unnamed: 267_level_1,Unnamed: 268_level_1,Unnamed: 269_level_1,Unnamed: 270_level_1,Unnamed: 271_level_1,Unnamed: 272_level_1,Unnamed: 273_level_1,Unnamed: 274_level_1,Unnamed: 275_level_1,Unnamed: 276_level_1,Unnamed: 277_level_1,Unnamed: 278_level_1,Unnamed: 279_level_1,Unnamed: 280_level_1,Unnamed: 281_level_1,Unnamed: 282_level_1,Unnamed: 283_level_1,Unnamed: 284_level_1,Unnamed: 285_level_1,Unnamed: 286_level_1,Unnamed: 287_level_1,Unnamed: 288_level_1,Unnamed: 289_level_1,Unnamed: 290_level_1,Unnamed: 291_level_1,Unnamed: 292_level_1,Unnamed: 293_level_1,Unnamed: 294_level_1,Unnamed: 295_level_1,Unnamed: 296_level_1,Unnamed: 297_level_1,Unnamed: 298_level_1,Unnamed: 299_level_1,Unnamed: 300_level_1,Unnamed: 301_level_1,Unnamed: 302_level_1,Unnamed: 303_level_1,Unnamed: 304_level_1,Unnamed: 305_level_1,Unnamed: 306_level_1,Unnamed: 307_level_1,Unnamed: 308_level_1,Unnamed: 309_level_1,Unnamed: 310_level_1,Unnamed: 311_level_1,Unnamed: 312_level_1,Unnamed: 313_level_1,Unnamed: 314_level_1,Unnamed: 315_level_1,Unnamed: 316_level_1,Unnamed: 317_level_1,Unnamed: 318_level_1,Unnamed: 319_level_1,Unnamed: 320_level_1,Unnamed: 321_level_1,Unnamed: 322_level_1,Unnamed: 323_level_1,Unnamed: 324_level_1,Unnamed: 325_level_1,Unnamed: 326_level_1,Unnamed: 327_level_1,Unnamed: 328_level_1,Unnamed: 329_level_1,Unnamed: 330_level_1,Unnamed: 331_level_1,Unnamed: 332_level_1,Unnamed: 333_level_1,Unnamed: 334_level_1,Unnamed: 335_level_1,Unnamed: 336_level_1,Unnamed: 337_level_1,Unnamed: 338_level_1,Unnamed: 339_level_1,Unnamed: 340_level_1,Unnamed: 341_level_1,Unnamed: 342_level_1,Unnamed: 343_level_1,Unnamed: 344_level_1,Unnamed: 345_level_1,Unnamed: 346_level_1,Unnamed: 347_level_1,Unnamed: 348_level_1,Unnamed: 349_level_1,Unnamed: 350_level_1,Unnamed: 351_level_1,Unnamed: 352_level_1,Unnamed: 353_level_1,Unnamed: 354_level_1,Unnamed: 355_level_1,Unnamed: 356_level_1,Unnamed: 357_level_1,Unnamed: 358_level_1,Unnamed: 359_level_1,Unnamed: 360_level_1,Unnamed: 361_level_1,Unnamed: 362_level_1,Unnamed: 363_level_1,Unnamed: 364_level_1,Unnamed: 365_level_1,Unnamed: 366_level_1,Unnamed: 367_level_1,Unnamed: 368_level_1,Unnamed: 369_level_1,Unnamed: 370_level_1,Unnamed: 371_level_1,Unnamed: 372_level_1,Unnamed: 373_level_1,Unnamed: 374_level_1,Unnamed: 375_level_1,Unnamed: 376_level_1,Unnamed: 377_level_1,Unnamed: 378_level_1,Unnamed: 379_level_1,Unnamed: 380_level_1,Unnamed: 381_level_1,Unnamed: 382_level_1,Unnamed: 383_level_1,Unnamed: 384_level_1,Unnamed: 385_level_1,Unnamed: 386_level_1,Unnamed: 387_level_1,Unnamed: 388_level_1,Unnamed: 389_level_1,Unnamed: 390_level_1,Unnamed: 391_level_1,Unnamed: 392_level_1,Unnamed: 393_level_1,Unnamed: 394_level_1,Unnamed: 395_level_1,Unnamed: 396_level_1,Unnamed: 397_level_1,Unnamed: 398_level_1,Unnamed: 399_level_1,Unnamed: 400_level_1,Unnamed: 401_level_1,Unnamed: 402_level_1,Unnamed: 403_level_1,Unnamed: 404_level_1,Unnamed: 405_level_1,Unnamed: 406_level_1,Unnamed: 407_level_1,Unnamed: 408_level_1,Unnamed: 409_level_1,Unnamed: 410_level_1,Unnamed: 411_level_1,Unnamed: 412_level_1,Unnamed: 413_level_1,Unnamed: 414_level_1,Unnamed: 415_level_1,Unnamed: 416_level_1,Unnamed: 417_level_1,Unnamed: 418_level_1,Unnamed: 419_level_1,Unnamed: 420_level_1,Unnamed: 421_level_1,Unnamed: 422_level_1,Unnamed: 423_level_1,Unnamed: 424_level_1,Unnamed: 425_level_1,Unnamed: 426_level_1,Unnamed: 427_level_1,Unnamed: 428_level_1,Unnamed: 429_level_1,Unnamed: 430_level_1,Unnamed: 431_level_1,Unnamed: 432_level_1,Unnamed: 433_level_1,Unnamed: 434_level_1,Unnamed: 435_level_1,Unnamed: 436_level_1,Unnamed: 437_level_1,Unnamed: 438_level_1,Unnamed: 439_level_1,Unnamed: 440_level_1,Unnamed: 441_level_1,Unnamed: 442_level_1,Unnamed: 443_level_1,Unnamed: 444_level_1,Unnamed: 445_level_1,Unnamed: 446_level_1,Unnamed: 447_level_1,Unnamed: 448_level_1,Unnamed: 449_level_1,Unnamed: 450_level_1,Unnamed: 451_level_1,Unnamed: 452_level_1,Unnamed: 453_level_1,Unnamed: 454_level_1,Unnamed: 455_level_1,Unnamed: 456_level_1,Unnamed: 457_level_1,Unnamed: 458_level_1,Unnamed: 459_level_1,Unnamed: 460_level_1,Unnamed: 461_level_1,Unnamed: 462_level_1,Unnamed: 463_level_1,Unnamed: 464_level_1,Unnamed: 465_level_1,Unnamed: 466_level_1,Unnamed: 467_level_1,Unnamed: 468_level_1,Unnamed: 469_level_1,Unnamed: 470_level_1,Unnamed: 471_level_1,Unnamed: 472_level_1,Unnamed: 473_level_1,Unnamed: 474_level_1,Unnamed: 475_level_1,Unnamed: 476_level_1,Unnamed: 477_level_1,Unnamed: 478_level_1,Unnamed: 479_level_1,Unnamed: 480_level_1,Unnamed: 481_level_1,Unnamed: 482_level_1,Unnamed: 483_level_1,Unnamed: 484_level_1,Unnamed: 485_level_1,Unnamed: 486_level_1,Unnamed: 487_level_1,Unnamed: 488_level_1,Unnamed: 489_level_1,Unnamed: 490_level_1,Unnamed: 491_level_1,Unnamed: 492_level_1,Unnamed: 493_level_1,Unnamed: 494_level_1,Unnamed: 495_level_1,Unnamed: 496_level_1,Unnamed: 497_level_1,Unnamed: 498_level_1,Unnamed: 499_level_1,Unnamed: 500_level_1,Unnamed: 501_level_1,Unnamed: 502_level_1,Unnamed: 503_level_1,Unnamed: 504_level_1,Unnamed: 505_level_1,Unnamed: 506_level_1,Unnamed: 507_level_1,Unnamed: 508_level_1,Unnamed: 509_level_1,Unnamed: 510_level_1,Unnamed: 511_level_1,Unnamed: 512_level_1,Unnamed: 513_level_1,Unnamed: 514_level_1,Unnamed: 515_level_1,Unnamed: 516_level_1,Unnamed: 517_level_1,Unnamed: 518_level_1,Unnamed: 519_level_1,Unnamed: 520_level_1,Unnamed: 521_level_1,Unnamed: 522_level_1,Unnamed: 523_level_1,Unnamed: 524_level_1,Unnamed: 525_level_1,Unnamed: 526_level_1,Unnamed: 527_level_1,Unnamed: 528_level_1,Unnamed: 529_level_1,Unnamed: 530_level_1,Unnamed: 531_level_1,Unnamed: 532_level_1,Unnamed: 533_level_1,Unnamed: 534_level_1,Unnamed: 535_level_1,Unnamed: 536_level_1,Unnamed: 537_level_1,Unnamed: 538_level_1,Unnamed: 539_level_1,Unnamed: 540_level_1,Unnamed: 541_level_1,Unnamed: 542_level_1,Unnamed: 543_level_1,Unnamed: 544_level_1,Unnamed: 545_level_1,Unnamed: 546_level_1,Unnamed: 547_level_1,Unnamed: 548_level_1,Unnamed: 549_level_1,Unnamed: 550_level_1,Unnamed: 551_level_1,Unnamed: 552_level_1,Unnamed: 553_level_1,Unnamed: 554_level_1,Unnamed: 555_level_1,Unnamed: 556_level_1,Unnamed: 557_level_1,Unnamed: 558_level_1,Unnamed: 559_level_1,Unnamed: 560_level_1,Unnamed: 561_level_1,Unnamed: 562_level_1,Unnamed: 563_level_1,Unnamed: 564_level_1,Unnamed: 565_level_1,Unnamed: 566_level_1,Unnamed: 567_level_1,Unnamed: 568_level_1,Unnamed: 569_level_1,Unnamed: 570_level_1,Unnamed: 571_level_1,Unnamed: 572_level_1,Unnamed: 573_level_1,Unnamed: 574_level_1,Unnamed: 575_level_1,Unnamed: 576_level_1,Unnamed: 577_level_1,Unnamed: 578_level_1,Unnamed: 579_level_1,Unnamed: 580_level_1,Unnamed: 581_level_1,Unnamed: 582_level_1,Unnamed: 583_level_1,Unnamed: 584_level_1,Unnamed: 585_level_1,Unnamed: 586_level_1,Unnamed: 587_level_1,Unnamed: 588_level_1,Unnamed: 589_level_1,Unnamed: 590_level_1,Unnamed: 591_level_1,Unnamed: 592_level_1,Unnamed: 593_level_1,Unnamed: 594_level_1,Unnamed: 595_level_1,Unnamed: 596_level_1,Unnamed: 597_level_1,Unnamed: 598_level_1,Unnamed: 599_level_1,Unnamed: 600_level_1,Unnamed: 601_level_1,Unnamed: 602_level_1,Unnamed: 603_level_1,Unnamed: 604_level_1,Unnamed: 605_level_1,Unnamed: 606_level_1,Unnamed: 607_level_1,Unnamed: 608_level_1,Unnamed: 609_level_1,Unnamed: 610_level_1,Unnamed: 611_level_1,Unnamed: 612_level_1,Unnamed: 613_level_1,Unnamed: 614_level_1,Unnamed: 615_level_1,Unnamed: 616_level_1,Unnamed: 617_level_1,Unnamed: 618_level_1,Unnamed: 619_level_1,Unnamed: 620_level_1,Unnamed: 621_level_1,Unnamed: 622_level_1,Unnamed: 623_level_1,Unnamed: 624_level_1,Unnamed: 625_level_1,Unnamed: 626_level_1,Unnamed: 627_level_1,Unnamed: 628_level_1,Unnamed: 629_level_1,Unnamed: 630_level_1,Unnamed: 631_level_1,Unnamed: 632_level_1,Unnamed: 633_level_1,Unnamed: 634_level_1,Unnamed: 635_level_1,Unnamed: 636_level_1,Unnamed: 637_level_1,Unnamed: 638_level_1,Unnamed: 639_level_1,Unnamed: 640_level_1,Unnamed: 641_level_1,Unnamed: 642_level_1,Unnamed: 643_level_1,Unnamed: 644_level_1,Unnamed: 645_level_1,Unnamed: 646_level_1,Unnamed: 647_level_1,Unnamed: 648_level_1,Unnamed: 649_level_1,Unnamed: 650_level_1,Unnamed: 651_level_1,Unnamed: 652_level_1,Unnamed: 653_level_1,Unnamed: 654_level_1,Unnamed: 655_level_1,Unnamed: 656_level_1,Unnamed: 657_level_1,Unnamed: 658_level_1,Unnamed: 659_level_1,Unnamed: 660_level_1,Unnamed: 661_level_1,Unnamed: 662_level_1,Unnamed: 663_level_1,Unnamed: 664_level_1,Unnamed: 665_level_1,Unnamed: 666_level_1,Unnamed: 667_level_1,Unnamed: 668_level_1,Unnamed: 669_level_1,Unnamed: 670_level_1,Unnamed: 671_level_1,Unnamed: 672_level_1,Unnamed: 673_level_1,Unnamed: 674_level_1,Unnamed: 675_level_1,Unnamed: 676_level_1,Unnamed: 677_level_1,Unnamed: 678_level_1,Unnamed: 679_level_1,Unnamed: 680_level_1,Unnamed: 681_level_1,Unnamed: 682_level_1,Unnamed: 683_level_1,Unnamed: 684_level_1,Unnamed: 685_level_1,Unnamed: 686_level_1,Unnamed: 687_level_1,Unnamed: 688_level_1,Unnamed: 689_level_1,Unnamed: 690_level_1,Unnamed: 691_level_1,Unnamed: 692_level_1,Unnamed: 693_level_1,Unnamed: 694_level_1,Unnamed: 695_level_1,Unnamed: 696_level_1,Unnamed: 697_level_1,Unnamed: 698_level_1,Unnamed: 699_level_1,Unnamed: 700_level_1,Unnamed: 701_level_1,Unnamed: 702_level_1,Unnamed: 703_level_1,Unnamed: 704_level_1,Unnamed: 705_level_1,Unnamed: 706_level_1,Unnamed: 707_level_1,Unnamed: 708_level_1,Unnamed: 709_level_1,Unnamed: 710_level_1,Unnamed: 711_level_1,Unnamed: 712_level_1,Unnamed: 713_level_1,Unnamed: 714_level_1,Unnamed: 715_level_1,Unnamed: 716_level_1,Unnamed: 717_level_1,Unnamed: 718_level_1,Unnamed: 719_level_1,Unnamed: 720_level_1,Unnamed: 721_level_1,Unnamed: 722_level_1,Unnamed: 723_level_1,Unnamed: 724_level_1,Unnamed: 725_level_1,Unnamed: 726_level_1,Unnamed: 727_level_1,Unnamed: 728_level_1,Unnamed: 729_level_1,Unnamed: 730_level_1,Unnamed: 731_level_1,Unnamed: 732_level_1,Unnamed: 733_level_1,Unnamed: 734_level_1,Unnamed: 735_level_1,Unnamed: 736_level_1,Unnamed: 737_level_1,Unnamed: 738_level_1,Unnamed: 739_level_1,Unnamed: 740_level_1,Unnamed: 741_level_1,Unnamed: 742_level_1,Unnamed: 743_level_1,Unnamed: 744_level_1,Unnamed: 745_level_1,Unnamed: 746_level_1,Unnamed: 747_level_1,Unnamed: 748_level_1,Unnamed: 749_level_1,Unnamed: 750_level_1,Unnamed: 751_level_1,Unnamed: 752_level_1,Unnamed: 753_level_1,Unnamed: 754_level_1,Unnamed: 755_level_1,Unnamed: 756_level_1,Unnamed: 757_level_1,Unnamed: 758_level_1,Unnamed: 759_level_1,Unnamed: 760_level_1,Unnamed: 761_level_1,Unnamed: 762_level_1,Unnamed: 763_level_1,Unnamed: 764_level_1,Unnamed: 765_level_1,Unnamed: 766_level_1,Unnamed: 767_level_1,Unnamed: 768_level_1,Unnamed: 769_level_1,Unnamed: 770_level_1,Unnamed: 771_level_1,Unnamed: 772_level_1,Unnamed: 773_level_1,Unnamed: 774_level_1,Unnamed: 775_level_1,Unnamed: 776_level_1,Unnamed: 777_level_1,Unnamed: 778_level_1,Unnamed: 779_level_1,Unnamed: 780_level_1,Unnamed: 781_level_1,Unnamed: 782_level_1,Unnamed: 783_level_1,Unnamed: 784_level_1,Unnamed: 785_level_1,Unnamed: 786_level_1,Unnamed: 787_level_1,Unnamed: 788_level_1,Unnamed: 789_level_1,Unnamed: 790_level_1,Unnamed: 791_level_1
22Rv1,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[4095],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[2644],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[2222],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
22Rv1 treated with 10 nM 17B-hydroxy-5a-androstan-3-one for 4 hours,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[4061],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[3854],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
A172,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[631],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
A549,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[2893],,,[3346],,,,[1245],,,,,[1652],[3137],,,,,,,,,,,"[1084, 1242]",,,,,,,[47],,,,,,,,,,,[2424],,,[3373],,,,[2900],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[1102],,,,,,,,,,,,,,,,[3473],,,,,,,,,,,,,,,,,,,,,,,,[4501],,,,,,[3423],,,[4327],,,,,,,,,,[3112],,[3415],,,,,,,,,,,,,,,,,,,,,[1241],,,,,,,,,,,,,,[3259],,,,,,,,,,,,,,,,,,,,,,,,,,[3111],,,,,[1244],,,,,,,,,,,[1243],,,,,,,,,,,,[3354],,[4195],,[1637],,,[3921],,,,,,,,,[3044],,,,,,,,,,,,,,,[2929],,,,,,,[4218],[3422],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[3189],,,,,,,,,,,,,,,,,,[2313],,,,[2359],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
A549 treated with 0.02% ethanol for 1 hour,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[1015],,,,,,,[1027],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,"[1039, 1040]",,,,,,,,,,,,,,,,,,,,,,,,,,[1016],,,,,,,[1017],,,,,,,,,[1032],[1041],,,,,,,[1019],,,,,,,,,,,[847],,,,,,,,,,,,,,[848],[849],,,[850],[865],[816],,,[837],[826],,,[851],,,[852],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[1042],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,"[911, 937]",,,,,,,,,,,,,,,[889],,,,,,,,,,,,,,,,,,,,,,,,,,[1033],,,,,,,,,,,,,,[1048],,,,[1047],,,,,,,,,,,,,,,,[1009],,,,,,,,,,,,,,,,,,[1010],,,,,,,,,,[1034],,,,,,,,,,,,,,,,,,,,,,,,,[1014],,,,,[1020],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
vagina female adult (51 year),,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[3456],,,,,,,[534],,,,,,,,,,,,,,,[4441],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[3595],,[3441],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
vagina female adult (53 years),,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[3323],,,,,,,[382],,,,,,,,,,,,,,,[4157],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[3671],,[4408],,,,[2253],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[2668],,[4286],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
"vagina, adult",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[5175],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
"vein, adult",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,[5165],,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


In [53]:
df_pivot.columns

Index(['.', '3xFLAG-AHR', '3xFLAG-ARID4B', '3xFLAG-ATF1', '3xFLAG-ATF4', '3xFLAG-BCL6', '3xFLAG-CEBPA', '3xFLAG-CEBPG', '3xFLAG-CREB1', '3xFLAG-DMAP1',
       ...
       'eGFP-ZSCAN21', 'eGFP-ZSCAN23', 'eGFP-ZSCAN26', 'eGFP-ZSCAN30', 'eGFP-ZSCAN4', 'eGFP-ZSCAN5A', 'eGFP-ZSCAN5C', 'eGFP-ZXDB', 'hBMAL1', 'hHIF1A'], dtype='object', name='assay', length=791)

In [54]:
df_avail = df_pivot[['DNase', 'H3K4me3', 'H3K27ac', 'CTCF']]
df_avail = df_avail[(df_avail.isna().sum(axis=1) == 0)]
df_avail

assay,DNase,H3K4me3,H3K27ac,CTCF
cell_type,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
A673,[340],[2783],[3657],[3336]
AG04450,[49],[1109],[1107],[1108]
CD14-positive monocyte female,"[41, 131]","[821, 1215]",[817],[836]
GM12878,"[12, 69]","[686, 1143, 1620]",[688],"[687, 1265]"
GM23338 male adult (53 years) originated from GM23248,[166],[3463],[3702],"[4324, 4474]"
H1-hESC,"[19, 70, 565]","[1509, 3972]","[732, 4164]","[712, 989, 1074]"
HCT116,[88],"[1173, 2467]","[1379, 3485]","[1055, 1172, 2203]"
HeLa-S3,"[25, 654]","[745, 2493]",[743],[742]
IMR-90,[405],[1719],[1452],[1322]
MCF-7,"[128, 130]","[1214, 4469]","[1397, 3773]","[684, 1081, 1213, 3177]"


In [55]:
len(df_avail)

41

In [56]:
assays = ['DNase', 'H3K4me3', 'H3K27ac', 'CTCF']
cell_types = ['K562', 'HepG2', 'SK-N-SH', 'A549', 'HCT116']

In [57]:
df_Sei_Siraj = df_pivot.loc[cell_types][assays]
df_Sei_Siraj.map(lambda x: len(x) if isinstance(x, list) else 0)

assay,DNase,H3K4me3,H3K27ac,CTCF
cell_type,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
HepG2,3,3,0,1
K562,4,4,0,4
SK-N-SH,0,2,2,2
A549,1,1,0,2
HCT116,1,2,2,3


In [10]:
model_info_df = pd.read_csv('../pretrained_models/Sei/Sei_info.csv')
MPRA_df = pd.read_csv('../data/SirajMPRA/SirajMPRA_562654.csv')

In [11]:
assays = ['DNase', 'H3K4me1', 'H3K4me3', 'H3K9me3', 'H3K27me3', 'H3K27ac', 'H3K36me3', 'CTCF']
cell_types = ['K562', 'HepG2', 'SK-N-SH', 'A549', 'HCT116']

# # 定义细胞所有可能的名字
cell_names_dict = {
    'HepG2': [
        r"HepG2",
        r"Hep-G2",
        ],
    'K562': [
        r"K562",
        r"K-562",
    ],
    'SK-N-SH': [
        r"SK-N-SH",
        r"SKNSH",
        r"SKN-SH",
        r"SK-NSH",
        r"neuroblastoma",
    ],
    'A549': [
        r"A549",
        r"A-549",
    ],
    'HCT116': [
        r"HCT116",
        r"HCT-116",
    ],
}


for cell_type in cell_names_dict:
    cell_names = cell_names_dict[cell_type]
    pattern = re.compile("|".join(cell_names), re.IGNORECASE) # 不区分大小写
    matched_indice = [i for i in range(len(model_info_df))
                      if (pattern.search(model_info_df['cell_type'][i])) and (model_info_df['assay'][i] in assays)]

    counter = Counter(model_info_df.iloc[matched_indice]['cell_type'])
    for a in counter.most_common():
        print(a)
    print()

('HepG2_Epithelium_Liver', 42)
('HepG2_Hepatocellular_Carcinoma', 7)
('HepG2', 5)

('K562_Erythroblast_Bone_Marrow', 284)
('K562', 13)
('K562_Leukemia', 8)
('K562_Leukemia_Bone', 2)
('K562_human_erythroleukemic_cell_line', 1)

('Neuroblastoma_cell', 16)
('SHEP-21N_Neuroblastoma_cell_Bone_Marrow', 12)
('SK-N-SH_RA_Neuron_Brain', 9)
('SK-N-SH_Neuroblastoma_cell_Brain', 8)
('IMR-5_75_Neuroblastoma_cell', 4)
('SH-SY5Y_Neuroblastoma_cell', 4)
('Neuroblastoma_patient_cells', 3)
('SK-N-SH_RA', 3)
('BE2-C_Neuroblastoma_cell', 2)
('LAN-1_Neuroblastoma_cell', 2)
('CLB-Ga_Neuroblastoma_cell', 2)
('NB-1643_Neuroblastoma_cell', 1)
('SK-N-BE(2)c_Neuroblastoma_cell', 1)
('SJNB-8_Neuroblastoma_cell', 1)
('SK-N-DZ_Neuroblastoma_cell', 1)
('IMR-32_Neuroblastoma_cell', 1)
('SK-N-AS_Neuroblastoma_cell', 1)
('SJNB-6_Neuroblastoma_cell', 1)
('EBC-1_Neuroblastoma_cell', 1)
('KELLY_Neuroblastoma_cell', 1)
('CHP-212_Neuroblastoma_cell', 1)
('GI-CA-N_Neuroblastoma_cell', 1)
('SH-EP_Neuroblastoma_cell', 1)
('SJN

In [12]:
# # 定义细胞所有可能的名字
cell_names_dict = {
    'HepG2'  : ["HepG2_Epithelium_Liver", "HepG2_Hepatocellular_Carcinoma", "HepG2"],
    'K562'   : ["K562_Erythroblast_Bone_Marrow", "K562"],
    'SK-N-SH': ["SK-N-SH_RA_Neuron_Brain", "SK-N-SH_Neuroblastoma_cell_Brain", "SK-N-SH_RA"],
    #'A549'   : ["A549_Epithelium_Lung", "A549"],
    'A549'   : ["A549_Epithelium_Lung"],
    'HCT116' : ["HCT-116_Colon", "HCT-116_HCT116", "HCT-116"],
}


cell_types = ['K562', 'HepG2', 'SK-N-SH', 'A549', 'HCT116']
assays = ['DNase', 'H3K4me1', 'H3K4me3', 'H3K9me3', 'H3K27me3', 'H3K27ac', 'H3K36me3', 'CTCF']
index_df = pd.DataFrame(index=cell_types, columns=assays)

for cell_type in cell_types:
    for assay in assays:
        indice = []
        for cell_name in cell_names_dict[cell_type]:
            mask = (model_info_df['cell_type'].str.upper() == cell_name.upper()) & (model_info_df['assay'] == assay) # 不区分大小写
            index = model_info_df[mask].index.tolist()
            indice.extend(index)
        index_df.loc[cell_type, assay] = indice

index_df_len = index_df.map(len)
index_df_len

Unnamed: 0,DNase,H3K4me1,H3K4me3,H3K9me3,H3K27me3,H3K27ac,H3K36me3,CTCF
HepG2,9,4,8,2,2,9,3,17
K562,58,10,91,21,34,51,5,27
SK-N-SH,4,0,4,0,1,3,1,7
A549,3,37,45,27,3,53,1,8
HCT116,7,18,39,1,1,49,4,14


In [13]:
predicted_array = np.load('../pretrained_models/Sei/Sei_Siraj_pred_562654.npy')

In [14]:
cell_types = ['K562', 'HepG2', 'SK-N-SH', 'A549', 'HCT116']
assays = ['DNase', 'H3K4me3', 'H3K27ac', 'CTCF']

feature_matrix = np.full(shape=(len(predicted_array), len(cell_types), len(assays)), fill_value=np.nan)
print(feature_matrix.shape)

(562654, 5, 4)


In [17]:
# average every channel

pearson_array = np.zeros((len(cell_types), len(assays)))
for i, cell_type in enumerate(cell_types):
    for j, assay in enumerate(assays):
        indice = index_df.iloc[i, j]
        if indice:
            predicted_feature = logit(predicted_array[:, indice]).mean(1)
            true_label = MPRA_df[cell_type]
            r, _ = pearson(predicted_feature, true_label)
            feature_matrix[:, i, j] = predicted_feature
            pearson_array[i, j] = r

print(pearson_array)
# print(feature_matrix.mean(-1))

[[ 0.443  0.351  0.469 -0.011]
 [ 0.499  0.388  0.451  0.285]
 [ 0.368  0.     0.462  0.   ]
 [ 0.345  0.304  0.362  0.237]
 [ 0.426  0.435  0.446 -0.057]]


In [11]:
# # if use less cell name
# cell_names_dict = {
#     'HepG2'  : ["HepG2_Epithelium_Liver"],
#     'K562'   : ["K562_Erythroblast_Bone_Marrow"],
#     'SK-N-SH': ["SK-N-SH_RA_Neuron_Brain", "SK-N-SH_Neuroblastoma_cell_Brain", "SK-N-SH_RA"],
#     'A549'   : ["A549_Epithelium_Lung"],
#     'HCT116' : ["HCT-116_Colon", "HCT-116_HCT116"],
# }


# cell_types = ['K562', 'HepG2', 'SK-N-SH', 'A549', 'HCT116']
# assays = ['DNase', 'H3K4me1', 'H3K4me3', 'H3K9me3', 'H3K27me3', 'H3K27ac', 'H3K36me3', 'CTCF']
# index_list = []
# index_df = pd.DataFrame(index=cell_types, columns=assays)

# for cell_type in cell_types:
#     for assay in assays:
#         indice = []
#         for cell_name in cell_names_dict[cell_type]:
#             mask = (model_info_df['cell_type'].str.upper() == cell_name.upper()) & (model_info_df['assay'] == assay) # 不区分大小写
#             index = model_info_df[mask].index.tolist()
#             indice.extend(index)

#         index_df.loc[cell_type, assay] = indice
#         index_list.extend(indice)

# index_df_len = index_df.map(len)
# print(index_df_len)


# pearson_array = np.zeros((len(cell_types), len(assays)))
# for i, cell_type in enumerate(cell_types):
#     for j, assay in enumerate(assays):
#         indice = index_df.iloc[i, j]
#         if indice:
#             predicted_feature = logit(predicted_array[:, indice]).mean(1)
#             true_label = MPRA_df[cell_type]
#             r = pearson(predicted_feature, true_label)
#             feature_matrix[:, i, j] = predicted_feature
#             pearson_array[i, j] = r

# print(pearson_array)