# Kinase profiling data

This notebook shows how to load different kinase profiling datasets.

In [1]:
from pathlib import Path

import json
import pandas as pd

In [2]:
# Base directory for the data files loaded below.
# `_dh` is injected by IPython (its directory history), so the name is undefined
# for static linters -- hence the F821 suppression. Its last entry is used here;
# presumably that is the folder containing this notebook -- TODO confirm that the
# kernel is started from (or has cd'ed into) the notebook's directory.
HERE = Path(_dh[-1])  # noqa: F821

## Karaman dataset

In [3]:
# Location of the Karaman profiling JavaScript file, relative to HERE.
karaman_path = HERE.joinpath("Karaman/Karaman_profiling.js")

In [4]:
# Read the raw JavaScript source. The encoding is given explicitly so decoding
# does not depend on the platform's default locale encoding.
with open(karaman_path, "r", encoding="utf-8") as f:
    json_string = f.read()

# Rewrite the JavaScript text into something `json.loads` accepts:
#   "=" becomes ": ", ";" becomes ", ", newlines are removed,
#   and the two bare identifiers are wrapped in double quotes.
json_string_cleaned = json_string.replace("=", ": ").replace(";", ", ").replace("\n", "")
json_string_cleaned = json_string_cleaned.replace("karaman_compounds", "\"karaman_compounds\"")
json_string_cleaned = json_string_cleaned.replace("karaman_profiling", "\"karaman_profiling\"")
# Drop the last three characters and close the JSON object.
# NOTE(review): this slice is tied to the exact tail of the current file
# (presumably the residue of the final ";" replacement) -- re-check it if the
# source file is ever regenerated.
json_string_cleaned = json_string_cleaned[:-3] + "}"
karaman_dict = json.loads(json_string_cleaned)

# Build one {xName: Kd(nM)} mapping per ligand. The intermediate dict gets its
# own name so that `karaman_df` only ever refers to a DataFrame.
karaman_kd_by_ligand = {
    ligand: {measure["xName"]: measure["Kd(nM)"] for measure in measures}
    for ligand, measures in karaman_dict["karaman_profiling"].items()
}
# Outer keys (ligands) become columns, inner keys (xName values) become the index.
karaman_df = pd.DataFrame(karaman_kd_by_ligand)
print(karaman_df.shape)
karaman_df.head()

(268, 30)


Unnamed: 0,Staurosporine,JNJ-7706621,MLN-8054,PKC-412,SU-14813,SB-202190,CP-724714,VX-680/MK-0457,Dasatinib,Roscovitine/CYC-202,...,ZD-6474,Sunitinib,Flavopiridol,Erlotinib,MLN-518,LY-333531,CI-1033,EKB-569,PI-103,PTK-787
AAK1,1.2,200.0,,48.0,66.0,,,290.0,,,...,,11.0,5300.0,1200.0,,900.0,,3500.0,,
ABL1,290.0,1200.0,820.0,,1500.0,,,13.0,0.53,,...,270.0,830.0,,310.0,,,1400.0,560.0,,
ABL2,110.0,,3300.0,,,,,4.0,0.17,,...,69.0,1000.0,,200.0,,,870.0,370.0,,
ALK2,470.0,5900.0,,,,,,1900.0,620.0,,...,150.0,,1900.0,,2500.0,,1700.0,,,
ALK4,680.0,,,,,950.0,,,330.0,,...,,,,,,,,,,


## PKIS2 dataset

In [5]:
# Location of the PKIS2 Excel workbook, relative to HERE.
pkis2_path = HERE.joinpath("PKIS2/pone.0181585.s004.xlsx")

In [6]:
# Load the workbook, index rows by the "Compound" column, then discard the last
# row and the first six remaining columns.
# NOTE(review): presumably the dropped row is a footer and the dropped columns
# are compound metadata rather than kinase measurements -- confirm against the
# spreadsheet before relying on these offsets.
pkis2_df = (
    pd.read_excel(pkis2_path)
    .set_index("Compound")
    .iloc[:-1, 6:]
)
print(pkis2_df.shape)
pkis2_df.head()

(645, 406)


  warn(msg)


Unnamed: 0_level_0,AAK1,ABL1-nonphosphorylated,ABL1-phosphorylated,ABL2,ACVR1,ACVR1B,ACVR2A,ACVR2B,ACVRL1,ADCK3,...,YANK3,YES,YSK1,YSK4,ZAK,ZAP70,p38-alpha,p38-beta,p38-delta,p38-gamma
Compound,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
UNC10225469A,14.0,28.0,20.0,5.0,0.0,0.0,0.0,0.0,9.0,11.0,...,0.0,9.0,0.0,0.0,12.0,10.0,0.0,8.0,4.0,23.0
UNC10225012A,0.0,99.7,89.0,81.0,7.0,9.0,0.0,0.0,0.0,7.0,...,0.0,55.0,6.0,43.0,59.0,0.0,8.0,1.0,0.0,14.0
UNC10225159A,0.0,8.0,15.0,5.0,18.0,0.0,0.0,0.0,0.0,24.0,...,3.0,36.0,0.0,16.0,15.0,22.0,2.0,6.0,0.0,43.0
UNC10225310A,0.0,28.0,18.0,100.0,17.0,15.0,7.0,27.0,7.0,0.0,...,0.0,36.0,1.0,0.0,66.0,0.0,21.0,90.0,11.0,24.0
UNC10225187A,26.0,49.0,23.0,3.0,10.0,85.0,2.0,0.0,0.0,5.0,...,0.0,10.0,0.0,0.0,39.0,0.0,10.0,57.0,0.0,46.0
