In [1]:
import pandas as pd

from mol_utils.structure_from_names import get_inchi_and_smiles_from_list_of_names
from mol_utils.utils import add_chembl_structural_alerts_column_to_df, add_scaffold_column_to_df, add_rdkit_fingerprint_column_to_df

In [2]:
# Look up structure identifiers for each compound name and tabulate them.
# The recorded progress bar reads "Gathering inchi from sources" at roughly
# 6 s per name, so expect this cell to be the slow step of the notebook.
names = ["acetaminophen", "cocaine"]
inchi, smiles, failed = get_inchi_and_smiles_from_list_of_names(names)
# NOTE(review): `failed` is never inspected. Presumably it reports names that
# could not be resolved -- confirm against the helper, and confirm that `inchi`
# and `smiles` stay aligned with `names` when a lookup fails.
df = pd.DataFrame(dict(name=names, inchi=inchi, smiles=smiles))
df

Gathering inchi from sources: 100%|██████████| 2/2 [00:12<00:00,  6.47s/it]


Unnamed: 0,name,inchi,smiles
0,acetaminophen,InChI=1S/C8H9NO2/c1-6(10)9-7-2-4-8(11)5-3-7/h2...,CC(O)=Nc1ccc(O)cc1
1,cocaine,InChI=1S/C17H21NO4/c1-18-12-8-9-13(18)15(17(20...,COC(=O)[C@H]1[C@@H](OC(=O)c2ccccc2)C[C@@H]2CC[...


In [3]:
# Annotate each compound with its ChEMBL structural alerts; the recorded output
# shows a new `chembl_structural_alerts` column holding a list per row.
# NOTE(review): whether the helper returns a copy or mutates `df` in place is
# not visible from this notebook -- confirm before relying on `df` afterwards.
with_alerts = add_chembl_structural_alerts_column_to_df(df)
with_alerts

adding column chembl_structural_alerts: 100%|██████████| 2/2 [00:00<00:00, 364.37it/s]


Unnamed: 0,name,inchi,smiles,chembl_structural_alerts
0,acetaminophen,InChI=1S/C8H9NO2/c1-6(10)9-7-2-4-8(11)5-3-7/h2...,CC(O)=Nc1ccc(O)cc1,[imine]
1,cocaine,InChI=1S/C17H21NO4/c1-18-12-8-9-13(18)15(17(20...,COC(=O)[C@H]1[C@@H](OC(=O)c2ccccc2)C[C@@H]2CC[...,[Ester]


In [4]:
# Add a `scaffold` column on top of the alert-annotated frame; in the recorded
# output the scaffold values are InChI strings.
# NOTE(review): presumably a Murcko-style scaffold -- confirm against the helper.
with_alerts_and_scaffold = add_scaffold_column_to_df(with_alerts)
with_alerts_and_scaffold

adding column scaffold: 100%|██████████| 2/2 [00:00<00:00, 1018.78it/s]


Unnamed: 0,name,inchi,smiles,chembl_structural_alerts,scaffold
0,acetaminophen,InChI=1S/C8H9NO2/c1-6(10)9-7-2-4-8(11)5-3-7/h2...,CC(O)=Nc1ccc(O)cc1,[imine],InChI=1S/C6H6/c1-2-4-6-5-3-1/h1-6H
1,cocaine,InChI=1S/C17H21NO4/c1-18-12-8-9-13(18)15(17(20...,COC(=O)[C@H]1[C@@H](OC(=O)c2ccccc2)C[C@@H]2CC[...,[Ester],InChI=1S/C14H17NO2/c16-14(10-4-2-1-3-5-10)17-1...


In [5]:
# Add an `rdkit_fingerprint` column; in the recorded output each value is a
# list of 0/1 bits.
# NOTE(review): fingerprint type and bit length are not visible here -- check
# the helper before comparing fingerprints across datasets.
with_alerts_and_scaffold_and_fingerprint = add_rdkit_fingerprint_column_to_df(with_alerts_and_scaffold)
with_alerts_and_scaffold_and_fingerprint

adding column rdkit_fingerprint: 100%|██████████| 2/2 [00:00<00:00, 664.92it/s]


Unnamed: 0,name,inchi,smiles,chembl_structural_alerts,scaffold,rdkit_fingerprint
0,acetaminophen,InChI=1S/C8H9NO2/c1-6(10)9-7-2-4-8(11)5-3-7/h2...,CC(O)=Nc1ccc(O)cc1,[imine],InChI=1S/C6H6/c1-2-4-6-5-3-1/h1-6H,"[0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, ..."
1,cocaine,InChI=1S/C17H21NO4/c1-18-12-8-9-13(18)15(17(20...,COC(=O)[C@H]1[C@@H](OC(=O)c2ccccc2)C[C@@H]2CC[...,[Ester],InChI=1S/C14H17NO2/c16-14(10-4-2-1-3-5-10)17-1...,"[1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, ..."
