In [1]:
# HCASE Experiments Drugs and CANVASS into HCASE NatProd
#
# Author: Gergely Zahoranszky-Kohalmi, PhD
#
# Email: gergely.zahoranszky-kohalmi@nih.gov
#
# Organization: National Center for Advancing Translational Sciences (NCATS/NIH)
#

In [2]:
import hcase
import pandas as pd

import rdkit
from rdkit import Chem

import matplotlib
#matplotlib.use('agg')
import matplotlib.pyplot as plt
import seaborn as sns

In [3]:
# Config section



fname_reference_scaffolds = '../data/STD_ML_ChEMBL23_NatProd_10132017.txt'
fname_structures_drugs = '../data/STD_drugbank_approved_structures_v5.txt'
fname_structures_canvass = '../data/STD_FINAL_20170525_ML_CANVASS_deduplicated.txt'



fname_out_space = '../data/natprod_hc_space.tab'
fname_out_embedding_canvass = '../data/canvass_emb_hcase_natprod_bms_dim_2.tab'
fname_out_embedding_drugs = '../data/drugs_emb_hcase_natprod_bms_dim_2.tab'



n_dim = 2



use_precomputed_reference_space = False





In [4]:
# Import datasets

df_ref_scaffolds = pd.read_csv (fname_reference_scaffolds, sep = '\t')
df_structures_canvass = pd.read_csv (fname_structures_canvass, sep = '\t')
df_structures_drugs = pd.read_csv (fname_structures_drugs, sep = '\t')


In [5]:
# Functions

def smiles2inchikey (smiles):
    if smiles == 'NA':
        inchi = 'NA'
    else:
        try:
            mol = Chem.MolFromSmiles(smiles)
            inchi = Chem.MolToInchi (mol)
        except:
            inchi = 'NA'

    if inchi == 'NA':
        inchikey = 'NA'
    else:
        try:
            inchikey = Chem.InchiToInchiKey (inchi)
        except:
            inchikey = 'NA'
    
    return (inchikey)    


In [6]:
# Clean-up datasets

# This is just to make the data structure compliant which HCASE which at this point expects a set of scaffolds,
# but here a set if compounds are provided. It's not an issue in the workflow, as the train method of hcase 
# actually generates the unique BM-scaffold set from the compounds. 
df_ref_scaffolds = df_structures_canvass.rename (columns = {'Structure': 'structure', 'ID': 'pattern_id'})
df_ref_scaffolds['hash'] = df_ref_scaffolds.apply (lambda x: smiles2inchikey(x['structure']), axis = 1)
df_ref_scaffolds['ptype'] = 'scaffold'



df_structures_canvass = df_structures_canvass.rename (columns = {'Structure': 'structure', 'ID': 'id'})
df_structures_drugs = df_structures_drugs.rename (columns = {'Structure': 'structure', 'ID': 'id'})




[01:22:39] Explicit valence for atom # 2 N, 4, is greater than permitted
[01:22:39] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:39] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:39] Explicit valence for atom # 11 N, 4, is greater than permitted


In [7]:
# Create NatProd Scaffold space

if not use_precomputed_reference_space:

    
    df_hcase_space = hcase.train (df_ref_scaffolds)
    df_hcase_space.to_csv (fname_out_space, sep = '\t', index = False)

else:
    
    df_hcase_space = pd.read_csv (fname_out_space, sep = '\t')


[01:22:39] SMILES Parse Error: syntax error for input: 'NA'
[01:22:39] SMILES Parse Error: syntax error for input: 'NA'
[01:22:39] Can't kekulize mol.  Unkekulized atoms: 1 2 3 13 14 15 28 29 31

[01:22:39] SMILES Parse Error: syntax error for input: 'NA'
[01:22:39] Can't kekulize mol.  Unkekulized atoms: 1 2 3 12 13 14 16 28 30

[01:22:39] SMILES Parse Error: syntax error for input: 'NA'
[01:22:39] Can't kekulize mol.  Unkekulized atoms: 1 2 3 12 13 25 27 28 30

[01:22:39] SMILES Parse Error: syntax error for input: 'NA'
[01:22:39] Can't kekulize mol.  Unkekulized atoms: 1 2 3 24 25 26 39 40 42

[01:22:39] SMILES Parse Error: syntax error for input: 'NA'
[01:22:39] Can't kekulize mol.  Unkekulized atoms: 10 11 21 22 23 25 26 28 29

[01:22:39] SMILES Parse Error: syntax error for input: 'NA'




[01:22:39] Can't kekulize mol.  Unkekulized atoms: 5 6 15 16 17 19 20 22 23

[01:22:39] SMILES Parse Error: syntax error for input: 'NA'
[01:22:39] SMILES Parse Error: syntax error for input: 'NA'
[01:22:39] SMILES Parse Error: syntax error for input: 'NA'
[01:22:39] Can't kekulize mol.  Unkekulized atoms: 4 5 7 8 10 11 13 14 23

[01:22:39] SMILES Parse Error: syntax error for input: 'NA'
[01:22:39] Explicit valence for atom # 2 N, 4, is greater than permitted
[01:22:39] Explicit valence for atom # 2 N, 4, is greater than permitted
[01:22:39] SMILES Parse Error: syntax error for input: 'NA'
[01:22:39] Explicit valence for atom # 2 N, 4, is greater than permitted
[01:22:40] 



[01:22:40] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:40] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:40] SMILES Parse Error: syntax error for input: 'NA'
[01:22:40] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:40] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 15 17 19

[01:22:40] SMILES Parse Error: syntax error for input: 'NA'




[01:22:40] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:40] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:40] SMILES Parse Error: syntax error for input: 'NA'
[01:22:40] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:40] Can't kekulize mol.  Unkekulized atoms: 12 13 14 15 16 18 34 37 38

[01:22:40] SMILES Parse Error: syntax error for input: 'NA'




[01:22:40] Can't kekulize mol.  Unkekulized atoms: 4 5 6 7 8 9 10 12 13

[01:22:40] SMILES Parse Error: syntax error for input: 'NA'
[01:22:40] Can't kekulize mol.  Unkekulized atoms: 3 4 6 7 9 10 13 14 15 24 25 27 28 30 31

[01:22:40] SMILES Parse Error: syntax error for input: 'NA'
[01:22:40] Can't kekulize mol.  Unkekulized atoms: 20 21 23 24 26 27 29 30 40

[01:22:40] SMILES Parse Error: syntax error for input: 'NA'
[01:22:40] Can't kekulize mol.  Unkekulized atoms: 29 30 31 32 33 34 37 39 40

[01:22:40] SMILES Parse Error: syntax error for input: 'NA'




[01:22:40] Can't kekulize mol.  Unkekulized atoms: 10 11 13 19 21 22 24 25 26 28 29 30 32

[01:22:40] SMILES Parse Error: syntax error for input: 'NA'
[01:22:41] Can't kekulize mol.  Unkekulized atoms: 7 8 10 18 20

[01:22:41] SMILES Parse Error: syntax error for input: 'NA'




[01:22:41] Can't kekulize mol.  Unkekulized atoms: 17 18 19 20 30

[01:22:41] SMILES Parse Error: syntax error for input: 'NA'




[01:22:42] Can't kekulize mol.  Unkekulized atoms: 2 3 5 6 8 15 16 18 19

[01:22:42] SMILES Parse Error: syntax error for input: 'NA'
[01:22:42] Can't kekulize mol.  Unkekulized atoms: 2 3 5 6 8 9 11 12 20

[01:22:42] SMILES Parse Error: syntax error for input: 'NA'
[01:22:42] Can't kekulize mol.  Unkekulized atoms: 2 3 4 5 6 7 10 11 13

[01:22:42] SMILES Parse Error: syntax error for input: 'NA'




[01:22:42] SMILES Parse Error: syntax error for input: 'NA'
[01:22:42] SMILES Parse Error: syntax error for input: 'NA'
[01:22:42] Can't kekulize mol.  Unkekulized atoms: 3 4 5 6 7

[01:22:42] SMILES Parse Error: syntax error for input: 'NA'




[01:22:42] Can't kekulize mol.  Unkekulized atoms: 2 3 4 5 6 7 24 27 28

[01:22:42] SMILES Parse Error: syntax error for input: 'NA'
[01:22:42] Explicit valence for atom # 11 N, 4, is greater than permitted
[01:22:42] Explicit valence for atom # 11 N, 4, is greater than permitted
[01:22:42] SMILES Parse Error: syntax error for input: 'NA'
[01:22:42] Explicit valence for atom # 11 N, 4, is greater than permitted
[01:22:42] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 8 13 14 16

[01:22:42] SMILES Parse Error: syntax error for input: 'NA'
[01:22:42] Can't kekulize mol.  Unkekulized atoms: 2 3 4 5 7 8 11 14 17 20 21 23 24

[01:22:42] SMILES Parse Error: syntax error for input: 'NA'
[01:22:42] Can't kekulize mol.  Unkekulized atoms: 6 8 9 10 13 14 17 18 20

[01:22:42] SMILES Parse Error: syntax error for input: 'NA'




[01:22:42] Can't kekulize mol.  Unkekulized atoms: 1 2 4 14 15 16 18 19 20

[01:22:42] SMILES Parse Error: syntax error for input: 'NA'
[01:22:43] Can't kekulize mol.  Unkekulized atoms: 3 4 5 7 9 13 15 17 19 23

[01:22:43] SMILES Parse Error: syntax error for input: 'NA'
[01:22:43] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 14 16 17 18

[01:22:43] SMILES Parse Error: syntax error for input: 'NA'
[01:22:43] Can't kekulize mol.  Unkekulized atoms: 2 3 4 6 7 8 9 10 11 12 14 15 16

[01:22:43] SMILES Parse Error: syntax error for input: 'NA'




[01:22:43] SMILES Parse Error: syntax error for input: 'NA'
[01:22:43] SMILES Parse Error: syntax error for input: 'NA'
[01:22:43] SMILES Parse Error: syntax error for input: 'NA'
[01:22:43] SMILES Parse Error: syntax error for input: 'NA'
[01:22:43] SMILES Parse Error: syntax error for input: 'NA'
[01:22:43] SMILES Parse Error: syntax error for input: 'NA'




[01:22:43] SMILES Parse Error: syntax error for input: 'NA'


[*] Number of scaffolds in input:
343
[*] Number of unique reference scaffolds:
292


[01:22:43] SMILES Parse Error: syntax error for input: 'NA'


In [8]:
# Embed structures into HCASE space

    
df_embedded_canvass = hcase.embed (df_hcase_space, df_structures_canvass, n_dim)
df_embedded_drugs = hcase.embed (df_hcase_space, df_structures_drugs, n_dim)



[01:22:44] Explicit valence for atom # 2 N, 4, is greater than permitted
[01:22:44] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:44] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:44] Explicit valence for atom # 11 N, 4, is greater than permitted
[01:22:44] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 21 22 23

[01:22:44] SMILES Parse Error: syntax error for input: 'NA'
[01:22:44] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 14 21 22

[01:22:44] SMILES Parse Error: syntax error for input: 'NA'
[01:22:44] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 19 20 21 22

[01:22:44] SMILES Parse Error: syntax error for input: 'NA'
[01:22:44] Can't kekulize mol.  Unkekulized atoms: 1 2 3 18 19 20 28 29 30

[01:22:44] SMILES Parse Error: syntax error for input: 'NA'
[01:22:44] Can't kekulize mol.  Unkekulized atoms: 1 2 18 26 27 28 29 30 31

[01:22:44] SMILES Parse Error: syntax error for input: 'NA'
[01:22:44] Can't kekulize 



[01:22:44] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 14 15 16

[01:22:44] SMILES Parse Error: syntax error for input: 'NA'




[01:22:45] Can't kekulize mol.  Unkekulized atoms: 3 4 5 6 7 8 16 17 19

[01:22:45] SMILES Parse Error: syntax error for input: 'NA'
[01:22:45] Can't kekulize mol.  Unkekulized atoms: 8 9 10 11 12 14 16 17 18

[01:22:45] SMILES Parse Error: syntax error for input: 'NA'




[01:22:45] Can't kekulize mol.  Unkekulized atoms: 9 10 11 12 13 14 16 17 18 19 20 21 24 25 26

[01:22:45] SMILES Parse Error: syntax error for input: 'NA'
[01:22:45] Can't kekulize mol.  Unkekulized atoms: 17 18 19 20 21 22 24 25 33

[01:22:45] SMILES Parse Error: syntax error for input: 'NA'
[01:22:45] Can't kekulize mol.  Unkekulized atoms: 2 3 4 5 6 8 10 11 12

[01:22:45] SMILES Parse Error: syntax error for input: 'NA'
[01:22:45] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 9 10 11 12 13 14

[01:22:45] SMILES Parse Error: syntax error for input: 'NA'
[01:22:45] Can't kekulize mol.  Unkekulized atoms: 2 3 4 11 13

[01:22:45] SMILES Parse Error: syntax error for input: 'NA'




[01:22:45] Can't kekulize mol.  Unkekulized atoms: 1 3 19 20 21

[01:22:45] SMILES Parse Error: syntax error for input: 'NA'




[01:22:46] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 14 15 16

[01:22:46] SMILES Parse Error: syntax error for input: 'NA'




[01:22:46] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 14 15 16

[01:22:46] SMILES Parse Error: syntax error for input: 'NA'
[01:22:46] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 15 16

[01:22:46] SMILES Parse Error: syntax error for input: 'NA'
[01:22:46] Can't kekulize mol.  Unkekulized atoms: 5 6 7 9 11

[01:22:46] SMILES Parse Error: syntax error for input: 'NA'
[01:22:46] Can't kekulize mol.  Unkekulized atoms: 3 4 5 6 7 8 9 10 12

[01:22:46] SMILES Parse Error: syntax error for input: 'NA'




[01:22:46] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 8 9 10

[01:22:46] SMILES Parse Error: syntax error for input: 'NA'




[01:22:47] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 9 10 11 12 13 14

[01:22:47] SMILES Parse Error: syntax error for input: 'NA'
[01:22:47] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 14 15 16

[01:22:47] SMILES Parse Error: syntax error for input: 'NA'
[01:22:47] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 14 15 16

[01:22:47] SMILES Parse Error: syntax error for input: 'NA'
[01:22:47] Can't kekulize mol.  Unkekulized atoms: 2 3 4 5 8 11 13 15 16 17

[01:22:47] SMILES Parse Error: syntax error for input: 'NA'
[01:22:47] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 14 15 16

[01:22:47] SMILES Parse Error: syntax error for input: 'NA'
[01:22:47] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 9 10 11 12 13 14

[01:22:47] SMILES Parse Error: syntax error for input: 'NA'






[*] Number of input structures: 332
[*] Number of structures for which scaffold_key was generated: 304
[*] Finding closest reference scaffold for structure 1 out of 304 .
[*] Finding closest reference scaffold for structure 2 out of 304 .
[*] Finding closest reference scaffold for structure 3 out of 304 .
[*] Finding closest reference scaffold for structure 4 out of 304 .
[*] Finding closest reference scaffold for structure 5 out of 304 .
[*] Finding closest reference scaffold for structure 6 out of 304 .
[*] Finding closest reference scaffold for structure 7 out of 304 .
[*] Finding closest reference scaffold for structure 8 out of 304 .
[*] Finding closest reference scaffold for structure 9 out of 304 .
[*] Finding closest reference scaffold for structure 10 out of 304 .
[*] Finding closest reference scaffold for structure 11 out of 304 .
[*] Finding closest reference scaffold for structure 12 out of 304 .
[*] Finding closest reference scaffold for structure 13 out of 304 .
[*] Findi

[*] Finding closest reference scaffold for structure 122 out of 304 .
[*] Finding closest reference scaffold for structure 123 out of 304 .
[*] Finding closest reference scaffold for structure 124 out of 304 .
[*] Finding closest reference scaffold for structure 125 out of 304 .
[*] Finding closest reference scaffold for structure 126 out of 304 .
[*] Finding closest reference scaffold for structure 127 out of 304 .
[*] Finding closest reference scaffold for structure 128 out of 304 .
[*] Finding closest reference scaffold for structure 129 out of 304 .
[*] Finding closest reference scaffold for structure 130 out of 304 .
[*] Finding closest reference scaffold for structure 131 out of 304 .
[*] Finding closest reference scaffold for structure 132 out of 304 .
[*] Finding closest reference scaffold for structure 133 out of 304 .
[*] Finding closest reference scaffold for structure 134 out of 304 .
[*] Finding closest reference scaffold for structure 135 out of 304 .
[*] Finding closest 

[*] Finding closest reference scaffold for structure 248 out of 304 .
[*] Finding closest reference scaffold for structure 249 out of 304 .
[*] Finding closest reference scaffold for structure 250 out of 304 .
[*] Finding closest reference scaffold for structure 251 out of 304 .
[*] Finding closest reference scaffold for structure 252 out of 304 .
[*] Finding closest reference scaffold for structure 253 out of 304 .
[*] Finding closest reference scaffold for structure 254 out of 304 .
[*] Finding closest reference scaffold for structure 255 out of 304 .
[*] Finding closest reference scaffold for structure 256 out of 304 .
[*] Finding closest reference scaffold for structure 257 out of 304 .
[*] Finding closest reference scaffold for structure 258 out of 304 .
[*] Finding closest reference scaffold for structure 259 out of 304 .
[*] Finding closest reference scaffold for structure 260 out of 304 .
[*] Finding closest reference scaffold for structure 261 out of 304 .
[*] Finding closest 

[01:22:51] Explicit valence for atom # 21 N, 4, is greater than permitted
[01:22:51] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:51] Explicit valence for atom # 6 N, 4, is greater than permitted
[01:22:51] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:51] Explicit valence for atom # 12 N, 4, is greater than permitted
[01:22:51] Explicit valence for atom # 2 N, 4, is greater than permitted
[01:22:51] Explicit valence for atom # 3 O, 3, is greater than permitted
[01:22:52] Explicit valence for atom # 17 N, 4, is greater than permitted
[01:22:52] Explicit valence for atom # 11 N, 4, is greater than permitted
[01:22:52] Explicit valence for atom # 1 N, 4, is greater than permitted
[01:22:52] Explicit valence for atom # 2 N, 4, is greater than permitted
[01:22:52] Explicit valence for atom # 20 N, 4, is greater than permitted
[01:22:52] Explicit valence for atom # 17 N, 4, is greater than permitted
[01:22:52] Explicit valence for atom # 25 N, 

[01:22:53] Explicit valence for atom # 46 N, 4, is greater than permitted
[01:22:53] Explicit valence for atom # 16 N, 4, is greater than permitted
[01:22:53] Explicit valence for atom # 1 O, 3, is greater than permitted
[01:22:53] Explicit valence for atom # 8 N, 4, is greater than permitted
[01:22:53] Explicit valence for atom # 9 N, 4, is greater than permitted
[01:22:53] Explicit valence for atom # 0 N, 4, is greater than permitted
[01:22:53] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6

[01:22:53] SMILES Parse Error: syntax error for input: 'NA'
[01:22:53] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 8 9 10 11 12 13

[01:22:53] SMILES Parse Error: syntax error for input: 'NA'
[01:22:53] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 8 17 18

[01:22:53] SMILES Parse Error: syntax error for input: 'NA'




[01:22:54] Can't kekulize mol.  Unkekulized atoms: 1 3 5 7 8 9

[01:22:54] SMILES Parse Error: syntax error for input: 'NA'
[01:22:54] Can't kekulize mol.  Unkekulized atoms: 1 2 3 20 21 22 24

[01:22:54] SMILES Parse Error: syntax error for input: 'NA'




[01:22:54] Can't kekulize mol.  Unkekulized atoms: 1 2 3 8 9 10 20 21 22

[01:22:54] SMILES Parse Error: syntax error for input: 'NA'
[01:22:54] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 11

[01:22:54] SMILES Parse Error: syntax error for input: 'NA'




[01:22:54] Can't kekulize mol.  Unkekulized atoms: 1 2 3 10

[01:22:54] SMILES Parse Error: syntax error for input: 'NA'
[01:22:54] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 6 7 8 9 10





[01:22:54] SMILES Parse Error: syntax error for input: 'NA'
[01:22:54] Can't kekulize mol.  Unkekulized atoms: 1 3 5 7 8 9

[01:22:54] SMILES Parse Error: syntax error for input: 'NA'
[01:22:54] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 8 16 17

[01:22:54] SMILES Parse Error: syntax error for input: 'NA'
[01:22:55] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 7 8 9

[01:22:55] SMILES Parse Error: syntax error for input: 'NA'




[01:22:55] Can't kekulize mol.  Unkekulized atoms: 1 2 3 10

[01:22:55] SMILES Parse Error: syntax error for input: 'NA'
[01:22:55] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 9

[01:22:55] SMILES Parse Error: syntax error for input: 'NA'
[01:22:55] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 6 7 8

[01:22:55] SMILES Parse Error: syntax error for input: 'NA'
[01:22:55] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 6

[01:22:55] SMILES Parse Error: syntax error for input: 'NA'
[01:22:55] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:22:55] SMILES Parse Error: syntax error for input: 'NA'




[01:22:55] Can't kekulize mol.  Unkekulized atoms: 1 3 4

[01:22:55] SMILES Parse Error: syntax error for input: 'NA'




[01:22:56] Can't kekulize mol.  Unkekulized atoms: 1 2 3 10

[01:22:56] SMILES Parse Error: syntax error for input: 'NA'
[01:22:56] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 8 9

[01:22:56] SMILES Parse Error: syntax error for input: 'NA'
[01:22:56] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:22:56] SMILES Parse Error: syntax error for input: 'NA'
[01:22:56] Can't kekulize mol.  Unkekulized atoms: 7 8 9 10 12 13 15

[01:22:56] SMILES Parse Error: syntax error for input: 'NA'




[01:22:56] Can't kekulize mol.  Unkekulized atoms: 10 13 14 15 16 17 18

[01:22:56] SMILES Parse Error: syntax error for input: 'NA'
[01:22:56] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 14 15 16

[01:22:56] SMILES Parse Error: syntax error for input: 'NA'




[01:22:56] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 14 15 16

[01:22:56] SMILES Parse Error: syntax error for input: 'NA'
[01:22:56] Can't kekulize mol.  Unkekulized atoms: 1 2 3 8 9 10 17 18 19

[01:22:56] SMILES Parse Error: syntax error for input: 'NA'
[01:22:56] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5





[01:22:56] SMILES Parse Error: syntax error for input: 'NA'
[01:22:56] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5

[01:22:56] SMILES Parse Error: syntax error for input: 'NA'
[01:22:56] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 8 10 11 12

[01:22:56] SMILES Parse Error: syntax error for input: 'NA'
[01:22:57] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 7 8 9

[01:22:57] SMILES Parse Error: syntax error for input: 'NA'




[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 14 16

[01:22:58] SMILES Parse Error: syntax error for input: 'NA'
[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 2 3 10

[01:22:58] SMILES Parse Error: syntax error for input: 'NA'
[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 6

[01:22:58] SMILES Parse Error: syntax error for input: 'NA'
[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 3 5 7 8 9

[01:22:58] SMILES Parse Error: syntax error for input: 'NA'
[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 18 19 20 21 22 23

[01:22:58] SMILES Parse Error: syntax error for input: 'NA'




[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 3 4

[01:22:58] SMILES Parse Error: syntax error for input: 'NA'
[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 6 7 8 9 10

[01:22:58] SMILES Parse Error: syntax error for input: 'NA'
[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 20 21 22

[01:22:58] SMILES Parse Error: syntax error for input: 'NA'




[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 3 4

[01:22:58] SMILES Parse Error: syntax error for input: 'NA'
[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:22:58] SMILES Parse Error: syntax error for input: 'NA'
[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 9 10 11 13 14 15





[01:22:58] SMILES Parse Error: syntax error for input: 'NA'
[01:22:58] Can't kekulize mol.  Unkekulized atoms: 1 2 20 21 22

[01:22:58] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 3 4 5 7 9 13 14 15 16 17 33 34 35 36 37

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 3 4

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 8 9 10

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'




[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 7 8 9

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 3 4

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 3 5 7 8 9

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'




[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 14 15 16

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 3 5 7 8 9

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 8 9 10

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 14 15 16 17 18 19 20

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 6 7 8

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 2 3 21 22 23 24

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'




[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:22:59] Can't kekulize mol.  Unkekulized atoms: 1 2 8 9 10 11 12 13 14

[01:22:59] SMILES Parse Error: syntax error for input: 'NA'
[01:23:00] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 8

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'




[01:23:00] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'




[01:23:00] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'
[01:23:00] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 6 7 8 9 10

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'




[01:23:00] Can't kekulize mol.  Unkekulized atoms: 21 22 23 25 26 28 29 30 31 32 60 61 62

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'
[01:23:00] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 8 16

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'
[01:23:00] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 14 15 16

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'
[01:23:00] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'




[01:23:00] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 8 9 26

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'
[01:23:00] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 7 8 9

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'
[01:23:00] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 9 10 11 12 13 14

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'
[01:23:00] Can't kekulize mol.  Unkekulized atoms: 3 4 5 7 9 13 14 15 16 17 18 19 20 21 22

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'
[01:23:00] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 9

[01:23:00] SMILES Parse Error: syntax error for input: 'NA'
[01:23:01] Can't kekulize mol.  Unkekulized atoms: 1 2 3 8 9 10 17 18 19

[01:23:01] SMILES Parse Error: syntax error for input: 'NA'
[01:23:01] Can't kekulize mol.  Unkekulized atoms: 3 4 5 6 7 8 16 17 19

[01:23:01] SMILES Parse Error: syntax error for input: 'NA'
[01:23:01] Can't kekulize mol.  Unkekulized atoms: 1 2 







[01:23:01] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:23:01] SMILES Parse Error: syntax error for input: 'NA'
[01:23:01] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 6 7 8

[01:23:01] SMILES Parse Error: syntax error for input: 'NA'
[01:23:01] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:23:01] SMILES Parse Error: syntax error for input: 'NA'
[01:23:01] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 14 15 16

[01:23:01] SMILES Parse Error: syntax error for input: 'NA'
[01:23:01] Can't kekulize mol.  Unkekulized atoms: 11 12 13 14 15 16 18 19 27

[01:23:01] SMILES Parse Error: syntax error for input: 'NA'
[01:23:01] Can't kekulize mol.  Unkekulized atoms: 1 12 13

[01:23:01] SMILES Parse Error: syntax error for input: 'NA'




[01:23:01] Can't kekulize mol.  Unkekulized atoms: 5 6 7 8 9 11 12 17 18

[01:23:01] SMILES Parse Error: syntax error for input: 'NA'
[01:23:01] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 14 15 16

[01:23:01] SMILES Parse Error: syntax error for input: 'NA'
[01:23:01] Can't kekulize mol.  Unkekulized atoms: 1 3 4

[01:23:01] SMILES Parse Error: syntax error for input: 'NA'




[01:23:02] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 6 7 8

[01:23:02] SMILES Parse Error: syntax error for input: 'NA'
[01:23:02] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:23:02] SMILES Parse Error: syntax error for input: 'NA'
[01:23:02] Can't kekulize mol.  Unkekulized atoms: 1 2 3 8 9 10 17 18 19

[01:23:02] SMILES Parse Error: syntax error for input: 'NA'
[01:23:02] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:23:02] SMILES Parse Error: syntax error for input: 'NA'
[01:23:02] Can't kekulize mol.  Unkekulized atoms: 1 3 4

[01:23:02] SMILES Parse Error: syntax error for input: 'NA'
[01:23:02] Can't kekulize mol.  Unkekulized atoms: 1 2 3 10

[01:23:02] SMILES Parse Error: syntax error for input: 'NA'
[01:23:02] Can't kekulize mol.  Unkekulized atoms: 1 2 20 21 22

[01:23:02] SMILES Parse Error: syntax error for input: 'NA'




[01:23:03] Can't kekulize mol.  Unkekulized atoms: 1 2 3 14 15

[01:23:03] SMILES Parse Error: syntax error for input: 'NA'




[01:23:03] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 8 9

[01:23:03] SMILES Parse Error: syntax error for input: 'NA'




[01:23:03] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 11 12 13 14 15 16

[01:23:03] SMILES Parse Error: syntax error for input: 'NA'
[01:23:03] Can't kekulize mol.  Unkekulized atoms: 3 4 5 6 7 8 10 11 18

[01:23:03] SMILES Parse Error: syntax error for input: 'NA'
[01:23:03] Can't kekulize mol.  Unkekulized atoms: 1 3 5 7 8 9

[01:23:03] SMILES Parse Error: syntax error for input: 'NA'
[01:23:03] Can't kekulize mol.  Unkekulized atoms: 1 2 3

[01:23:03] SMILES Parse Error: syntax error for input: 'NA'




[01:23:03] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 11

[01:23:03] SMILES Parse Error: syntax error for input: 'NA'
[01:23:03] Can't kekulize mol.  Unkekulized atoms: 1 2 3

[01:23:03] SMILES Parse Error: syntax error for input: 'NA'




[01:23:04] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 7 8 9

[01:23:04] SMILES Parse Error: syntax error for input: 'NA'
[01:23:04] Can't kekulize mol.  Unkekulized atoms: 1 2 3 32 33 34 35 36 37 38 39 40

[01:23:04] SMILES Parse Error: syntax error for input: 'NA'
[01:23:04] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5

[01:23:04] SMILES Parse Error: syntax error for input: 'NA'
[01:23:04] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 8 10 11 12

[01:23:04] SMILES Parse Error: syntax error for input: 'NA'
[01:23:04] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 14 15 16

[01:23:04] SMILES Parse Error: syntax error for input: 'NA'








[01:23:04] Can't kekulize mol.  Unkekulized atoms: 8 9 11

[01:23:04] SMILES Parse Error: syntax error for input: 'NA'
[01:23:04] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 6 7 8

[01:23:04] SMILES Parse Error: syntax error for input: 'NA'




[01:23:04] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 9 10 11 12 13 14

[01:23:04] SMILES Parse Error: syntax error for input: 'NA'
[01:23:05] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 18 19 20 21

[01:23:05] SMILES Parse Error: syntax error for input: 'NA'
[01:23:05] Can't kekulize mol.  Unkekulized atoms: 1 2 3 349 350

[01:23:05] SMILES Parse Error: syntax error for input: 'NA'
[01:23:05] Can't kekulize mol.  Unkekulized atoms: 1 2 3 18

[01:23:05] SMILES Parse Error: syntax error for input: 'NA'








[01:23:05] Can't kekulize mol.  Unkekulized atoms: 1 2 3 22 23 24 26

[01:23:05] SMILES Parse Error: syntax error for input: 'NA'
[01:23:06] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6

[01:23:06] SMILES Parse Error: syntax error for input: 'NA'




[01:23:06] Can't kekulize mol.  Unkekulized atoms: 1 2 3

[01:23:06] SMILES Parse Error: syntax error for input: 'NA'




[01:23:06] Can't kekulize mol.  Unkekulized atoms: 1 2 3 8 9 10 18 19 20

[01:23:06] SMILES Parse Error: syntax error for input: 'NA'
[01:23:06] Can't kekulize mol.  Unkekulized atoms: 10 11 12 15 25

[01:23:06] SMILES Parse Error: syntax error for input: 'NA'




[01:23:07] Can't kekulize mol.  Unkekulized atoms: 9 10 12 13 14 15 16 17 18

[01:23:07] SMILES Parse Error: syntax error for input: 'NA'
[01:23:07] Can't kekulize mol.  Unkekulized atoms: 4 5 7

[01:23:07] SMILES Parse Error: syntax error for input: 'NA'
[01:23:07] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6

[01:23:07] SMILES Parse Error: syntax error for input: 'NA'




[01:23:07] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 13 14

[01:23:07] SMILES Parse Error: syntax error for input: 'NA'
[01:23:07] Can't kekulize mol.  Unkekulized atoms: 1 2 9 10 17

[01:23:07] SMILES Parse Error: syntax error for input: 'NA'




[01:23:07] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 14 20

[01:23:07] SMILES Parse Error: syntax error for input: 'NA'
[01:23:07] Can't kekulize mol.  Unkekulized atoms: 10 11 13 14 15

[01:23:07] SMILES Parse Error: syntax error for input: 'NA'
[01:23:07] Can't kekulize mol.  Unkekulized atoms: 1 2 3 21

[01:23:07] SMILES Parse Error: syntax error for input: 'NA'




[01:23:07] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 6

[01:23:07] SMILES Parse Error: syntax error for input: 'NA'
[01:23:07] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 29 30 31

[01:23:07] SMILES Parse Error: syntax error for input: 'NA'
[01:23:07] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15

[01:23:07] SMILES Parse Error: syntax error for input: 'NA'




[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'




[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 2 3 8 9 10 20 21 22

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'
[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 8 9

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'
[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 21 22

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'




[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 3 5 7 8 9

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'
[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6 7 8 16 17

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'




[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 28 29

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'
[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 2 3 10

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'
[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 2 3 21

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'
[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 3 4

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'
[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 3 4 5 18 19 20 21 22 23

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'




[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 2 3 10

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'
[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'
[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 3 5 6 7 8

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'
[01:23:08] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5

[01:23:08] SMILES Parse Error: syntax error for input: 'NA'
[01:23:09] Can't kekulize mol.  Unkekulized atoms: 1 3 10

[01:23:09] SMILES Parse Error: syntax error for input: 'NA'




[01:23:09] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5

[01:23:09] SMILES Parse Error: syntax error for input: 'NA'
[01:23:09] Can't kekulize mol.  Unkekulized atoms: 7 8 9 12

[01:23:09] SMILES Parse Error: syntax error for input: 'NA'
[01:23:09] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6

[01:23:09] SMILES Parse Error: syntax error for input: 'NA'
[01:23:09] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 14 15 16

[01:23:09] SMILES Parse Error: syntax error for input: 'NA'
[



[01:23:09] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 7 11 12 13 21 22 23

[01:23:09] SMILES Parse Error: syntax error for input: 'NA'
[01:23:09] Can't kekulize mol.  Unkekulized atoms: 1 2 3 5 6

[01:23:09] SMILES Parse Error: syntax error for input: 'NA'




[01:23:09] Can't kekulize mol.  Unkekulized atoms: 1 2 3 11 12 13 18 19 20

[01:23:09] SMILES Parse Error: syntax error for input: 'NA'
[01:23:10] Can't kekulize mol.  Unkekulized atoms: 1 2 3 4 5 6 14 15 16

[01:23:10] SMILES Parse Error: syntax error for input: 'NA'






[*] Number of input structures: 1623
[*] Number of structures for which scaffold_key was generated: 1474
[*] Finding closest reference scaffold for structure 1 out of 1474 .
[*] Finding closest reference scaffold for structure 2 out of 1474 .
[*] Finding closest reference scaffold for structure 3 out of 1474 .
[*] Finding closest reference scaffold for structure 4 out of 1474 .
[*] Finding closest reference scaffold for structure 5 out of 1474 .
[*] Finding closest reference scaffold for structure 6 out of 1474 .
[*] Finding closest reference scaffold for structure 7 out of 1474 .
[*] Finding closest reference scaffold for structure 8 out of 1474 .
[*] Finding closest reference scaffold for structure 9 out of 1474 .
[*] Finding closest reference scaffold for structure 10 out of 1474 .
[*] Finding closest reference scaffold for structure 11 out of 1474 .
[*] Finding closest reference scaffold for structure 12 out of 1474 .
[*] Finding closest reference scaffold for structure 13 out of 1

[*] Finding closest reference scaffold for structure 128 out of 1474 .
[*] Finding closest reference scaffold for structure 129 out of 1474 .
[*] Finding closest reference scaffold for structure 130 out of 1474 .
[*] Finding closest reference scaffold for structure 131 out of 1474 .
[*] Finding closest reference scaffold for structure 132 out of 1474 .
[*] Finding closest reference scaffold for structure 133 out of 1474 .
[*] Finding closest reference scaffold for structure 134 out of 1474 .
[*] Finding closest reference scaffold for structure 135 out of 1474 .
[*] Finding closest reference scaffold for structure 136 out of 1474 .
[*] Finding closest reference scaffold for structure 137 out of 1474 .
[*] Finding closest reference scaffold for structure 138 out of 1474 .
[*] Finding closest reference scaffold for structure 139 out of 1474 .
[*] Finding closest reference scaffold for structure 140 out of 1474 .
[*] Finding closest reference scaffold for structure 141 out of 1474 .
[*] Fi

[*] Finding closest reference scaffold for structure 255 out of 1474 .
[*] Finding closest reference scaffold for structure 256 out of 1474 .
[*] Finding closest reference scaffold for structure 257 out of 1474 .
[*] Finding closest reference scaffold for structure 258 out of 1474 .
[*] Finding closest reference scaffold for structure 259 out of 1474 .
[*] Finding closest reference scaffold for structure 260 out of 1474 .
[*] Finding closest reference scaffold for structure 261 out of 1474 .
[*] Finding closest reference scaffold for structure 262 out of 1474 .
[*] Finding closest reference scaffold for structure 263 out of 1474 .
[*] Finding closest reference scaffold for structure 264 out of 1474 .
[*] Finding closest reference scaffold for structure 265 out of 1474 .
[*] Finding closest reference scaffold for structure 266 out of 1474 .
[*] Finding closest reference scaffold for structure 267 out of 1474 .
[*] Finding closest reference scaffold for structure 268 out of 1474 .
[*] Fi

[*] Finding closest reference scaffold for structure 382 out of 1474 .
[*] Finding closest reference scaffold for structure 383 out of 1474 .
[*] Finding closest reference scaffold for structure 384 out of 1474 .
[*] Finding closest reference scaffold for structure 385 out of 1474 .
[*] Finding closest reference scaffold for structure 386 out of 1474 .
[*] Finding closest reference scaffold for structure 387 out of 1474 .
[*] Finding closest reference scaffold for structure 388 out of 1474 .
[*] Finding closest reference scaffold for structure 389 out of 1474 .
[*] Finding closest reference scaffold for structure 390 out of 1474 .
[*] Finding closest reference scaffold for structure 391 out of 1474 .
[*] Finding closest reference scaffold for structure 392 out of 1474 .
[*] Finding closest reference scaffold for structure 393 out of 1474 .
[*] Finding closest reference scaffold for structure 394 out of 1474 .
[*] Finding closest reference scaffold for structure 395 out of 1474 .
[*] Fi

[*] Finding closest reference scaffold for structure 509 out of 1474 .
[*] Finding closest reference scaffold for structure 510 out of 1474 .
[*] Finding closest reference scaffold for structure 511 out of 1474 .
[*] Finding closest reference scaffold for structure 512 out of 1474 .
[*] Finding closest reference scaffold for structure 513 out of 1474 .
[*] Finding closest reference scaffold for structure 514 out of 1474 .
[*] Finding closest reference scaffold for structure 515 out of 1474 .
[*] Finding closest reference scaffold for structure 516 out of 1474 .
[*] Finding closest reference scaffold for structure 517 out of 1474 .
[*] Finding closest reference scaffold for structure 518 out of 1474 .
[*] Finding closest reference scaffold for structure 519 out of 1474 .
[*] Finding closest reference scaffold for structure 520 out of 1474 .
[*] Finding closest reference scaffold for structure 521 out of 1474 .
[*] Finding closest reference scaffold for structure 522 out of 1474 .
[*] Fi

[*] Finding closest reference scaffold for structure 634 out of 1474 .
[*] Finding closest reference scaffold for structure 635 out of 1474 .
[*] Finding closest reference scaffold for structure 636 out of 1474 .
[*] Finding closest reference scaffold for structure 637 out of 1474 .
[*] Finding closest reference scaffold for structure 638 out of 1474 .
[*] Finding closest reference scaffold for structure 639 out of 1474 .
[*] Finding closest reference scaffold for structure 640 out of 1474 .
[*] Finding closest reference scaffold for structure 641 out of 1474 .
[*] Finding closest reference scaffold for structure 642 out of 1474 .
[*] Finding closest reference scaffold for structure 643 out of 1474 .
[*] Finding closest reference scaffold for structure 644 out of 1474 .
[*] Finding closest reference scaffold for structure 645 out of 1474 .
[*] Finding closest reference scaffold for structure 646 out of 1474 .
[*] Finding closest reference scaffold for structure 647 out of 1474 .
[*] Fi

[*] Finding closest reference scaffold for structure 759 out of 1474 .
[*] Finding closest reference scaffold for structure 760 out of 1474 .
[*] Finding closest reference scaffold for structure 761 out of 1474 .
[*] Finding closest reference scaffold for structure 762 out of 1474 .
[*] Finding closest reference scaffold for structure 763 out of 1474 .
[*] Finding closest reference scaffold for structure 764 out of 1474 .
[*] Finding closest reference scaffold for structure 765 out of 1474 .
[*] Finding closest reference scaffold for structure 766 out of 1474 .
[*] Finding closest reference scaffold for structure 767 out of 1474 .
[*] Finding closest reference scaffold for structure 768 out of 1474 .
[*] Finding closest reference scaffold for structure 769 out of 1474 .
[*] Finding closest reference scaffold for structure 770 out of 1474 .
[*] Finding closest reference scaffold for structure 771 out of 1474 .
[*] Finding closest reference scaffold for structure 772 out of 1474 .
[*] Fi

[*] Finding closest reference scaffold for structure 888 out of 1474 .
[*] Finding closest reference scaffold for structure 889 out of 1474 .
[*] Finding closest reference scaffold for structure 890 out of 1474 .
[*] Finding closest reference scaffold for structure 891 out of 1474 .
[*] Finding closest reference scaffold for structure 892 out of 1474 .
[*] Finding closest reference scaffold for structure 893 out of 1474 .
[*] Finding closest reference scaffold for structure 894 out of 1474 .
[*] Finding closest reference scaffold for structure 895 out of 1474 .
[*] Finding closest reference scaffold for structure 896 out of 1474 .
[*] Finding closest reference scaffold for structure 897 out of 1474 .
[*] Finding closest reference scaffold for structure 898 out of 1474 .
[*] Finding closest reference scaffold for structure 899 out of 1474 .
[*] Finding closest reference scaffold for structure 900 out of 1474 .
[*] Finding closest reference scaffold for structure 901 out of 1474 .
[*] Fi

[*] Finding closest reference scaffold for structure 1013 out of 1474 .
[*] Finding closest reference scaffold for structure 1014 out of 1474 .
[*] Finding closest reference scaffold for structure 1015 out of 1474 .
[*] Finding closest reference scaffold for structure 1016 out of 1474 .
[*] Finding closest reference scaffold for structure 1017 out of 1474 .
[*] Finding closest reference scaffold for structure 1018 out of 1474 .
[*] Finding closest reference scaffold for structure 1019 out of 1474 .
[*] Finding closest reference scaffold for structure 1020 out of 1474 .
[*] Finding closest reference scaffold for structure 1021 out of 1474 .
[*] Finding closest reference scaffold for structure 1022 out of 1474 .
[*] Finding closest reference scaffold for structure 1023 out of 1474 .
[*] Finding closest reference scaffold for structure 1024 out of 1474 .
[*] Finding closest reference scaffold for structure 1025 out of 1474 .
[*] Finding closest reference scaffold for structure 1026 out of

[*] Finding closest reference scaffold for structure 1140 out of 1474 .
[*] Finding closest reference scaffold for structure 1141 out of 1474 .
[*] Finding closest reference scaffold for structure 1142 out of 1474 .
[*] Finding closest reference scaffold for structure 1143 out of 1474 .
[*] Finding closest reference scaffold for structure 1144 out of 1474 .
[*] Finding closest reference scaffold for structure 1145 out of 1474 .
[*] Finding closest reference scaffold for structure 1146 out of 1474 .
[*] Finding closest reference scaffold for structure 1147 out of 1474 .
[*] Finding closest reference scaffold for structure 1148 out of 1474 .
[*] Finding closest reference scaffold for structure 1149 out of 1474 .
[*] Finding closest reference scaffold for structure 1150 out of 1474 .
[*] Finding closest reference scaffold for structure 1151 out of 1474 .
[*] Finding closest reference scaffold for structure 1152 out of 1474 .
[*] Finding closest reference scaffold for structure 1153 out of

[*] Finding closest reference scaffold for structure 1262 out of 1474 .
[*] Finding closest reference scaffold for structure 1263 out of 1474 .
[*] Finding closest reference scaffold for structure 1264 out of 1474 .
[*] Finding closest reference scaffold for structure 1265 out of 1474 .
[*] Finding closest reference scaffold for structure 1266 out of 1474 .
[*] Finding closest reference scaffold for structure 1267 out of 1474 .
[*] Finding closest reference scaffold for structure 1268 out of 1474 .
[*] Finding closest reference scaffold for structure 1269 out of 1474 .
[*] Finding closest reference scaffold for structure 1270 out of 1474 .
[*] Finding closest reference scaffold for structure 1271 out of 1474 .
[*] Finding closest reference scaffold for structure 1272 out of 1474 .
[*] Finding closest reference scaffold for structure 1273 out of 1474 .
[*] Finding closest reference scaffold for structure 1274 out of 1474 .
[*] Finding closest reference scaffold for structure 1275 out of

[*] Finding closest reference scaffold for structure 1386 out of 1474 .
[*] Finding closest reference scaffold for structure 1387 out of 1474 .
[*] Finding closest reference scaffold for structure 1388 out of 1474 .
[*] Finding closest reference scaffold for structure 1389 out of 1474 .
[*] Finding closest reference scaffold for structure 1390 out of 1474 .
[*] Finding closest reference scaffold for structure 1391 out of 1474 .
[*] Finding closest reference scaffold for structure 1392 out of 1474 .
[*] Finding closest reference scaffold for structure 1393 out of 1474 .
[*] Finding closest reference scaffold for structure 1394 out of 1474 .
[*] Finding closest reference scaffold for structure 1395 out of 1474 .
[*] Finding closest reference scaffold for structure 1396 out of 1474 .
[*] Finding closest reference scaffold for structure 1397 out of 1474 .
[*] Finding closest reference scaffold for structure 1398 out of 1474 .
[*] Finding closest reference scaffold for structure 1399 out of

In [9]:
df_embedded_canvass.to_csv (fname_out_embedding_canvass, sep = '\t', index = False)
df_embedded_drugs.to_csv (fname_out_embedding_drugs, sep = '\t', index = False)

In [10]:
# References:

# Ref: https://github.com/matplotlib/matplotlib/issues/3466/
# Ref: https://htmlcolorcodes.com/color-picker/
# Ref: https://iwatobipen.wordpress.com/2017/11/03/draw-high-quality-molecular-image-in-rdkit-rdkit/
# Ref: https://matplotlib.org/3.1.0/gallery/subplots_axes_and_figures/subplots_demo.html
# Ref: https://matplotlib.org/3.1.0/tutorials/colors/colormaps.html
# Ref: https://matplotlib.org/3.1.1/api/_as_gen/matplotlib.pyplot.scatter.html
# Ref: https://matplotlib.org/3.1.1/api/_as_gen/matplotlib.pyplot.title.html
# Ref: https://matplotlib.org/3.1.1/api/markers_api.html#module-matplotlib.markers
# Ref: https://matplotlib.org/3.1.1/gallery/shapes_and_collections/scatter.html
# Ref: https://matplotlib.org/3.1.1/tutorials/colors/colors.html
# Ref: https://python-graph-gallery.com/106-seaborn-style-on-matplotlib-plot/
# Ref: https://python-graph-gallery.com/122-multiple-lines-chart/
# Ref: https://python-graph-gallery.com/125-small-multiples-for-line-chart/
# Ref: https://python-graph-gallery.com/197-available-color-palettes-with-matplotlib/
# Ref: https://seaborn.pydata.org/examples/many_facets.html
# Ref: https://stackoverflow.com/questions/14432557/matplotlib-scatter-plot-with-different-text-at-each-data-point
# Ref: https://stackoverflow.com/questions/14827650/pyplot-scatter-plot-marker-size
# Ref: https://stackoverflow.com/questions/17682216/scatter-plot-and-color-mapping-in-python
# Ref: https://stackoverflow.com/questions/31686530/matplotlib-generate-a-new-graph-in-a-new-window-for-subsequent-program-runs/31686783
# Ref: https://stackoverflow.com/questions/39870642/matplotlib-how-to-plot-a-high-resolution-graph
# Ref: https://stackoverflow.com/questions/57568311/matplotlib-scatter-issue-with-python-3-x
# Ref: https://www.nceas.ucsb.edu/~frazier/RSpatialGuides/colorPaletteCheatsheet.pdf
# Ref: https://www.pluralsight.com/guides/choosing-color-palettes
# Ref: https://www.rdkit.org/docs/GettingStartedInPython.html
# Ref: https://www.rdkit.org/docs/source/rdkit.Chem.Draw.html
# Ref: https://www.science-emergence.com/Articles/How-to-create-a-scatter-plot-with-several-colors-in-matplotlib-/
