**Target: Proteasome**

Organism: Homo sapiens

Protein: Proteasome subunit beta type-5

Gene Names: PSMB5, LMPX, MB1, X

PSMB5 is one of the 17 essential subunits that contribute to the complete assembly of the 20S proteasome complex.

In [None]:
# Installing ChEMBL resources
! pip install chembl_webresource_client

In [None]:
# Import Dependencies
import pandas as pd
from chembl_webresource_client.new_client import new_client

In [None]:
# Search ChEMBL for every target record matching the term "proteasome".
# Background: proteasomes are part of a major mechanism by which cells regulate
# the concentration of particular proteins and degrade misfolded proteins.
target = new_client.target
target_query = target.search('proteasome')

# Materialise the search hits as a table, one row per target.
targets = pd.DataFrame.from_dict(data=target_query)
targets

Unnamed: 0,cross_references,organism,pref_name,score,species_group_flag,target_chembl_id,target_components,target_type,tax_id
0,[],Homo sapiens,Proteasome subunit beta type-3,16.0,False,CHEMBL3308923,"[{'accession': 'P49720', 'component_descriptio...",SINGLE PROTEIN,9606.0
1,"[{'xref_id': 'P28074', 'xref_name': None, 'xre...",Homo sapiens,Proteasome Macropain subunit MB1,15.0,False,CHEMBL4662,"[{'accession': 'P28074', 'component_descriptio...",SINGLE PROTEIN,9606.0
2,[],Mus musculus,Proteasome subunit beta type-5,15.0,False,CHEMBL1944494,"[{'accession': 'O55234', 'component_descriptio...",SINGLE PROTEIN,10090.0
3,[],Rattus norvegicus,26S proteasome non-ATPase regulatory subunit 1,15.0,False,CHEMBL2176782,"[{'accession': 'O88761', 'component_descriptio...",SINGLE PROTEIN,10116.0
4,[],Homo sapiens,26S proteasome,15.0,False,CHEMBL2364701,"[{'accession': 'Q99460', 'component_descriptio...",PROTEIN COMPLEX,9606.0
5,[],Homo sapiens,20S proteasome,15.0,False,CHEMBL3831201,"[{'accession': 'P49721', 'component_descriptio...",PROTEIN COMPLEX,9606.0
6,[],Homo sapiens,Proteasome subunit beta type-1/beta type-5,15.0,False,CHEMBL3885625,"[{'accession': 'P20618', 'component_descriptio...",PROTEIN FAMILY,9606.0
7,[],Rattus norvegicus,Proteasome subunit beta type-5,15.0,False,CHEMBL4523208,"[{'accession': 'P28075', 'component_descriptio...",SINGLE PROTEIN,10116.0
8,"[{'xref_id': 'P20618', 'xref_name': None, 'xre...",Homo sapiens,Proteasome component C5,14.0,False,CHEMBL4208,"[{'accession': 'P20618', 'component_descriptio...",SINGLE PROTEIN,9606.0
9,[],Homo sapiens,Proteasome subunit beta type-6,14.0,False,CHEMBL1944496,"[{'accession': 'P28072', 'component_descriptio...",SINGLE PROTEIN,9606.0


In [None]:
# Select human PSMB5 (listed by ChEMBL as "Proteasome Macropain subunit MB1").
# The row is looked up by its ChEMBL ID rather than by position: several search
# hits share the same score, so relying on "row 1" could silently pick a
# different target if the ordering of the results ever changes.
psmb5_rows = targets[targets.target_chembl_id == 'CHEMBL4662']
if len(psmb5_rows) != 1:
    raise LookupError(
        f"expected exactly one search hit for CHEMBL4662, found {len(psmb5_rows)}"
    )
selected_target = psmb5_rows.target_chembl_id.iloc[0]
selected_target

'CHEMBL4662'

In [None]:
# Bioactivity records for the selected target, restricted to IC50 measurements.
activity = new_client.activity
res = (
    activity
    .filter(target_chembl_id=selected_target)
    .filter(standard_type="IC50")
)

In [None]:
# Load the IC50 activity query results into a DataFrame.
df = pd.DataFrame.from_dict(data=res)

In [None]:
# Show the raw IC50 activity table (pandas abbreviates the rendering of large frames).
df

Unnamed: 0,activity_comment,activity_id,activity_properties,assay_chembl_id,assay_description,assay_type,assay_variant_accession,assay_variant_mutation,bao_endpoint,bao_format,bao_label,canonical_smiles,data_validity_comment,data_validity_description,document_chembl_id,document_journal,document_year,ligand_efficiency,molecule_chembl_id,molecule_pref_name,parent_molecule_chembl_id,pchembl_value,potential_duplicate,qudt_units,record_id,relation,src_id,standard_flag,standard_relation,standard_text_value,standard_type,standard_units,standard_upper_value,standard_value,target_chembl_id,target_organism,target_pref_name,target_tax_id,text_value,toid,type,units,uo_units,upper_value,value
0,,1709326,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC[C@H](C)[C@H](NC(=O)OCc1ccccc1)C(=O)N[C@@H](...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '12.18', 'le': '0.24', 'lle': '5.13', ...",CHEMBL381735,,CHEMBL381735,8.62,False,http://www.openphacts.org/units/Nanomolar,471603,=,1,True,=,,IC50,nM,,2.4,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.0024
1,,1709327,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC[C@H](C)[C@H](NC(=O)OCc1ccccc1)C(=O)N1CCC[C@...,Outside typical range,Values for this activity type are unusually la...,CHEMBL1147675,J. Med. Chem.,2006,,CHEMBL207670,,CHEMBL207670,,False,http://www.openphacts.org/units/Nanomolar,471604,=,1,True,=,,IC50,nM,,150000.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,150.0
2,,1709328,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(=O)N[C@@H](CCC(=O)OC(C)(C)C)C(=O)N[C@@H](C)...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '13.45', 'le': '0.27', 'lle': '5.38', ...",CHEMBL383529,,CHEMBL383529,6.58,False,http://www.openphacts.org/units/Nanomolar,471605,=,1,True,=,,IC50,nM,,260.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.26
3,,1709330,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(C)C[C@@H](/C=C/S(C)(=O)=O)NC(=O)[C@H](C)NC(...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '14.08', 'le': '0.28', 'lle': '5.27', ...",CHEMBL207336,,CHEMBL207336,7.77,False,http://www.openphacts.org/units/Nanomolar,471606,=,1,True,=,,IC50,nM,,17.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.017
4,,1709331,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(C)C[C@@H](/C=C/S(C)(=O)=O)NC(=O)[C@H](C)NC(...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '14.12', 'le': '0.28', 'lle': '5.21', ...",CHEMBL208015,,CHEMBL208015,8.21,False,http://www.openphacts.org/units/Nanomolar,471607,=,1,True,=,,IC50,nM,,6.1,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.0061
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1159,,20606995,[],CHEMBL4605214,Inhibition of Beta5 in human 20S immunoproteas...,B,,,BAO_0000190,BAO_0000357,single protein format,C[C@]1(C(=O)[C@H](Cc2ccccc2)NC(=O)[C@H](CO)NC(...,,,CHEMBL4602696,J Med Chem,2020,,CHEMBL4100295,,CHEMBL4100295,,False,http://www.openphacts.org/units/Nanomolar,3466569,>,1,True,>,,IC50,nM,,10000.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,nM,UO_0000065,,10000.0
1160,,20606996,[],CHEMBL4605214,Inhibition of Beta5 in human 20S immunoproteas...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(=O)NCC(=O)N1CCC[C@H]1C(=O)N[C@@H](Cc1ccccc1...,,,CHEMBL4602696,J Med Chem,2020,,CHEMBL4646371,,CHEMBL4646371,,False,http://www.openphacts.org/units/Nanomolar,3466570,>,1,True,>,,IC50,nM,,10000.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,nM,UO_0000065,,10000.0
1161,,20606997,[],CHEMBL4605214,Inhibition of Beta5 in human 20S immunoproteas...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(C)C[C@H](NC(=O)[C@H](Cc1ccccc1)NC(=O)[C@@H]...,,,CHEMBL4602696,J Med Chem,2020,,CHEMBL4649310,,CHEMBL4649310,,False,http://www.openphacts.org/units/Nanomolar,3466597,>,1,True,>,,IC50,nM,,10000.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,nM,UO_0000065,,10000.0
1162,,20606998,[],CHEMBL4605214,Inhibition of Beta5 in human 20S immunoproteas...,B,,,BAO_0000190,BAO_0000357,single protein format,COc1ccc(C[C@H](NC(=O)[C@H](C)NC(=O)CN2CCOCC2)C...,,,CHEMBL4602696,J Med Chem,2020,"{'bei': '10.89', 'le': '0.21', 'lle': '5.69', ...",CHEMBL3237875,,CHEMBL3237875,6.33,False,http://www.openphacts.org/units/Nanomolar,3466608,=,1,True,=,,IC50,nM,,472.7,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,nM,UO_0000065,,472.7


In [None]:
# Keep only the records that have both a potency value and a structure.
# Both columns are checked in a single dropna() call on `df`, so no boolean mask
# built from one frame is ever applied to another frame with a different index
# (pandas warns "Boolean Series key will be reindexed" in that situation).
dft = df.dropna(subset=['standard_value', 'canonical_smiles'])
dft

  This is separate from the ipykernel package so we can avoid doing imports until


Unnamed: 0,activity_comment,activity_id,activity_properties,assay_chembl_id,assay_description,assay_type,assay_variant_accession,assay_variant_mutation,bao_endpoint,bao_format,bao_label,canonical_smiles,data_validity_comment,data_validity_description,document_chembl_id,document_journal,document_year,ligand_efficiency,molecule_chembl_id,molecule_pref_name,parent_molecule_chembl_id,pchembl_value,potential_duplicate,qudt_units,record_id,relation,src_id,standard_flag,standard_relation,standard_text_value,standard_type,standard_units,standard_upper_value,standard_value,target_chembl_id,target_organism,target_pref_name,target_tax_id,text_value,toid,type,units,uo_units,upper_value,value
0,,1709326,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC[C@H](C)[C@H](NC(=O)OCc1ccccc1)C(=O)N[C@@H](...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '12.18', 'le': '0.24', 'lle': '5.13', ...",CHEMBL381735,,CHEMBL381735,8.62,False,http://www.openphacts.org/units/Nanomolar,471603,=,1,True,=,,IC50,nM,,2.4,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.0024
1,,1709327,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC[C@H](C)[C@H](NC(=O)OCc1ccccc1)C(=O)N1CCC[C@...,Outside typical range,Values for this activity type are unusually la...,CHEMBL1147675,J. Med. Chem.,2006,,CHEMBL207670,,CHEMBL207670,,False,http://www.openphacts.org/units/Nanomolar,471604,=,1,True,=,,IC50,nM,,150000.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,150.0
2,,1709328,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(=O)N[C@@H](CCC(=O)OC(C)(C)C)C(=O)N[C@@H](C)...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '13.45', 'le': '0.27', 'lle': '5.38', ...",CHEMBL383529,,CHEMBL383529,6.58,False,http://www.openphacts.org/units/Nanomolar,471605,=,1,True,=,,IC50,nM,,260.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.26
3,,1709330,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(C)C[C@@H](/C=C/S(C)(=O)=O)NC(=O)[C@H](C)NC(...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '14.08', 'le': '0.28', 'lle': '5.27', ...",CHEMBL207336,,CHEMBL207336,7.77,False,http://www.openphacts.org/units/Nanomolar,471606,=,1,True,=,,IC50,nM,,17.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.017
4,,1709331,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(C)C[C@@H](/C=C/S(C)(=O)=O)NC(=O)[C@H](C)NC(...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '14.12', 'le': '0.28', 'lle': '5.21', ...",CHEMBL208015,,CHEMBL208015,8.21,False,http://www.openphacts.org/units/Nanomolar,471607,=,1,True,=,,IC50,nM,,6.1,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.0061
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1159,,20606995,[],CHEMBL4605214,Inhibition of Beta5 in human 20S immunoproteas...,B,,,BAO_0000190,BAO_0000357,single protein format,C[C@]1(C(=O)[C@H](Cc2ccccc2)NC(=O)[C@H](CO)NC(...,,,CHEMBL4602696,J Med Chem,2020,,CHEMBL4100295,,CHEMBL4100295,,False,http://www.openphacts.org/units/Nanomolar,3466569,>,1,True,>,,IC50,nM,,10000.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,nM,UO_0000065,,10000.0
1160,,20606996,[],CHEMBL4605214,Inhibition of Beta5 in human 20S immunoproteas...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(=O)NCC(=O)N1CCC[C@H]1C(=O)N[C@@H](Cc1ccccc1...,,,CHEMBL4602696,J Med Chem,2020,,CHEMBL4646371,,CHEMBL4646371,,False,http://www.openphacts.org/units/Nanomolar,3466570,>,1,True,>,,IC50,nM,,10000.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,nM,UO_0000065,,10000.0
1161,,20606997,[],CHEMBL4605214,Inhibition of Beta5 in human 20S immunoproteas...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(C)C[C@H](NC(=O)[C@H](Cc1ccccc1)NC(=O)[C@@H]...,,,CHEMBL4602696,J Med Chem,2020,,CHEMBL4649310,,CHEMBL4649310,,False,http://www.openphacts.org/units/Nanomolar,3466597,>,1,True,>,,IC50,nM,,10000.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,nM,UO_0000065,,10000.0
1162,,20606998,[],CHEMBL4605214,Inhibition of Beta5 in human 20S immunoproteas...,B,,,BAO_0000190,BAO_0000357,single protein format,COc1ccc(C[C@H](NC(=O)[C@H](C)NC(=O)CN2CCOCC2)C...,,,CHEMBL4602696,J Med Chem,2020,"{'bei': '10.89', 'le': '0.21', 'lle': '5.69', ...",CHEMBL3237875,,CHEMBL3237875,6.33,False,http://www.openphacts.org/units/Nanomolar,3466608,=,1,True,=,,IC50,nM,,472.7,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,nM,UO_0000065,,472.7


In [None]:
# Number of distinct structures among the filtered records.
dft['canonical_smiles'].nunique(dropna=False)

818

In [None]:
# Dropping duplicate structures: for each canonical SMILES only the first
# record encountered is kept.
dfdd = dft.drop_duplicates(subset='canonical_smiles', keep='first')
dfdd

Unnamed: 0,activity_comment,activity_id,activity_properties,assay_chembl_id,assay_description,assay_type,assay_variant_accession,assay_variant_mutation,bao_endpoint,bao_format,bao_label,canonical_smiles,data_validity_comment,data_validity_description,document_chembl_id,document_journal,document_year,ligand_efficiency,molecule_chembl_id,molecule_pref_name,parent_molecule_chembl_id,pchembl_value,potential_duplicate,qudt_units,record_id,relation,src_id,standard_flag,standard_relation,standard_text_value,standard_type,standard_units,standard_upper_value,standard_value,target_chembl_id,target_organism,target_pref_name,target_tax_id,text_value,toid,type,units,uo_units,upper_value,value
0,,1709326,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC[C@H](C)[C@H](NC(=O)OCc1ccccc1)C(=O)N[C@@H](...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '12.18', 'le': '0.24', 'lle': '5.13', ...",CHEMBL381735,,CHEMBL381735,8.62,False,http://www.openphacts.org/units/Nanomolar,471603,=,1,True,=,,IC50,nM,,2.4,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.0024
1,,1709327,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC[C@H](C)[C@H](NC(=O)OCc1ccccc1)C(=O)N1CCC[C@...,Outside typical range,Values for this activity type are unusually la...,CHEMBL1147675,J. Med. Chem.,2006,,CHEMBL207670,,CHEMBL207670,,False,http://www.openphacts.org/units/Nanomolar,471604,=,1,True,=,,IC50,nM,,150000.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,150.0
2,,1709328,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(=O)N[C@@H](CCC(=O)OC(C)(C)C)C(=O)N[C@@H](C)...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '13.45', 'le': '0.27', 'lle': '5.38', ...",CHEMBL383529,,CHEMBL383529,6.58,False,http://www.openphacts.org/units/Nanomolar,471605,=,1,True,=,,IC50,nM,,260.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.26
3,,1709330,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(C)C[C@@H](/C=C/S(C)(=O)=O)NC(=O)[C@H](C)NC(...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '14.08', 'le': '0.28', 'lle': '5.27', ...",CHEMBL207336,,CHEMBL207336,7.77,False,http://www.openphacts.org/units/Nanomolar,471606,=,1,True,=,,IC50,nM,,17.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.017
4,,1709331,[],CHEMBL861973,Inhibition of chymotrypsin-like proteasome act...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(C)C[C@@H](/C=C/S(C)(=O)=O)NC(=O)[C@H](C)NC(...,,,CHEMBL1147675,J. Med. Chem.,2006,"{'bei': '14.12', 'le': '0.28', 'lle': '5.21', ...",CHEMBL208015,,CHEMBL208015,8.21,False,http://www.openphacts.org/units/Nanomolar,471607,=,1,True,=,,IC50,nM,,6.1,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,uM,UO_0000065,,0.0061
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1118,,19474854,[],CHEMBL4479408,Inhibition of catalytic activity of constituti...,B,,,BAO_0000190,BAO_0000219,cell-based format,CC(C)C[C@H](NC(=O)[C@H](Cc1ccccc1)NC(=O)[C@H](...,,,CHEMBL4477237,J Med Chem,2016,"{'bei': '13.06', 'le': '0.24', 'lle': '3.88', ...",CHEMBL4519899,,CHEMBL4519899,8.52,False,http://www.openphacts.org/units/Nanomolar,3256554,=,1,True,=,,IC50,nM,,3.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50(app),uM,UO_0000065,,0.003
1120,,19474856,[],CHEMBL4479408,Inhibition of catalytic activity of constituti...,B,,,BAO_0000190,BAO_0000219,cell-based format,CC(C)C[C@H](NC(=O)[C@H](Cc1ccccc1)NC(=O)[C@@H]...,,,CHEMBL4477237,J Med Chem,2016,,CHEMBL4555159,,CHEMBL4555159,,False,http://www.openphacts.org/units/Nanomolar,3256552,<,1,True,<,,IC50,nM,,10.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50(app),nM,UO_0000065,,10.0
1160,,20606996,[],CHEMBL4605214,Inhibition of Beta5 in human 20S immunoproteas...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(=O)NCC(=O)N1CCC[C@H]1C(=O)N[C@@H](Cc1ccccc1...,,,CHEMBL4602696,J Med Chem,2020,,CHEMBL4646371,,CHEMBL4646371,,False,http://www.openphacts.org/units/Nanomolar,3466570,>,1,True,>,,IC50,nM,,10000.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,nM,UO_0000065,,10000.0
1161,,20606997,[],CHEMBL4605214,Inhibition of Beta5 in human 20S immunoproteas...,B,,,BAO_0000190,BAO_0000357,single protein format,CC(C)C[C@H](NC(=O)[C@H](Cc1ccccc1)NC(=O)[C@@H]...,,,CHEMBL4602696,J Med Chem,2020,,CHEMBL4649310,,CHEMBL4649310,,False,http://www.openphacts.org/units/Nanomolar,3466597,>,1,True,>,,IC50,nM,,10000.0,CHEMBL4662,Homo sapiens,Proteasome Macropain subunit MB1,9606,,,IC50,nM,UO_0000065,,10000.0


In [None]:
# Columns carried forward: molecule identifier, structure and potency value.
selection = ['molecule_chembl_id', 'canonical_smiles', 'standard_value']
dftc = dfdd.loc[:, selection]
dftc

Unnamed: 0,molecule_chembl_id,canonical_smiles,standard_value
0,CHEMBL381735,CC[C@H](C)[C@H](NC(=O)OCc1ccccc1)C(=O)N[C@@H](...,2.4
1,CHEMBL207670,CC[C@H](C)[C@H](NC(=O)OCc1ccccc1)C(=O)N1CCC[C@...,150000.0
2,CHEMBL383529,CC(=O)N[C@@H](CCC(=O)OC(C)(C)C)C(=O)N[C@@H](C)...,260.0
3,CHEMBL207336,CC(C)C[C@@H](/C=C/S(C)(=O)=O)NC(=O)[C@H](C)NC(...,17.0
4,CHEMBL208015,CC(C)C[C@@H](/C=C/S(C)(=O)=O)NC(=O)[C@H](C)NC(...,6.1
...,...,...,...
1118,CHEMBL4519899,CC(C)C[C@H](NC(=O)[C@H](Cc1ccccc1)NC(=O)[C@H](...,3.0
1120,CHEMBL4555159,CC(C)C[C@H](NC(=O)[C@H](Cc1ccccc1)NC(=O)[C@@H]...,10.0
1160,CHEMBL4646371,CC(=O)NCC(=O)N1CCC[C@H]1C(=O)N[C@@H](Cc1ccccc1...,10000.0
1161,CHEMBL4649310,CC(C)C[C@H](NC(=O)[C@H](Cc1ccccc1)NC(=O)[C@@H]...,10000.0


In [None]:
# Persist the prepared table to CSV; the DataFrame index is not written.
dftc.to_csv(path_or_buf='psmb5_first_data.csv', index=False)