In [1]:
#imports 
import os
#import openff-qcsubmit
from openff.qcsubmit.factories import TorsiondriveDatasetFactory
from openforcefield.topology import Molecule
from openforcefield.utils.toolkits import RDKitToolkitWrapper, UndefinedStereochemistryError

# Datasets for WBO Interpolation

Lists of all the datasets used for WBO interpolation

In [64]:
#Datasets
enyl = ['CC=Cc1ccc(cc1)O' , 'CC=Cc1ccc(cc1)S' , 'CC=Cc1ccc(cc1)C(=O)O' , 'CC=Cc1ccc(cc1)N' , 'CC=Cc1ccc(cc1)[N+](C)(C)C' , 'CC=Cc1ccc(cc1)NC(=O)N' , 'CC=Cc1ccc(cc1)NC' , 'CC=Cc1ccc(cc1)NON' , 'CC=Cc1ccc(cc1)C#N' , 'CC=Cc1ccc(cc1)C' , 'CC=Cc1ccc(cc1)S(=O)O' , 'CCOc1ccc(cc1)C=CC' , 'CC=Cc1ccc(cc1)[O-]']

styrene= ['C=Cc1ccc(cc1)O' , 'C=Cc1ccc(cc1)S' , 'C=Cc1ccc(cc1)C(=O)O' , 'C=Cc1ccc(cc1)N' , 'C[N+](C)(C)c1ccc(cc1)C=C' , 'C=Cc1ccc(cc1)NC(=O)N' , 'CNc1ccc(cc1)C=C' , 'C=Cc1ccc(cc1)NON' , 'C=Cc1ccc(cc1)C#N' , 'Cc1ccc(cc1)C=C' , 'C=Cc1ccc(cc1)S(=O)O' , 'CCOc1ccc(cc1)C=C' , 'C=Cc1ccc(cc1)[O-]']
         
amide_primary= ['C(=O)(N)O' , 'C(=O)(N)S' , 'C(=O)(C(=O)O)N' , 'C(=O)(N)N' , 'C[N+](C)(C)C(=O)N' , 'C(=O)(N)NC(=O)N' , 'CNC(=O)N(C)C' , 'C(=O)(N)NON' , 'C(#N)C(=O)N' , 'CCC(=O)N' , 'CN(C)C(=O)S(=O)O' , 'CCOC(=O)N', 'C(=O)(N)[O-]']
    
amide_secondary=['CNC(=O)O' , 'CNC(=O)S' , 'CNC(=O)C(=O)O' , 'CNC(=O)N' , 'CNC(=O)[N+](C)(C)C' , 'CNC(=O)NC(=O)N' , 'CNC(=O)NC' , 'CNC(=O)NON' , 'CNC(=O)C#N' , 'CCC(=O)NC' , 'CNC(=O)S(=O)O' , 'CCOC(=O)NC' , 'CNC(=O)[O-]']

amide_tertiary = ['CN(C)C(=O)O' , 'CN(C)C(=O)S' , 'CN(C)C(=O)C(=O)O' , 'CN(C)C(=O)N' , 'CN(C)C(=O)[N+](C)(C)C' , 'CN(C)C(=O)NC(=O)N' , 'CNC(=O)N(C)C' , 'CN(C)C(=O)NON' , 'CN(C)C(=O)C#N' , 'CCC(=O)N(C)C' , 'CN(C)C(=O)S(=O)O' , 'CCOC(=O)N(C)C' , 'CN(C)C(=O)[O-]']

carbonyl=['C=CC(=O)O' , 'C=CC(=O)S' , 'C=CC(=O)C(=O)O' , 'C=CC(=O)N' , 'C[N+](C)(C)C(=O)C=C' , 'C=CC(=O)NC(=O)N' , 'CNC(=O)C=C' , 'C=CC(=O)NON' , 'C=CC(=O)C#N' , 'CCC(=O)C=C' , 'C=CC(=O)S(=O)O' , 'CCOC(=O)C=C' , 'C=CC(=O)[O-]']
   
carbamate= ['CN(C)C(=O)OO' , 'CN(C)C(=O)OS' , 'CN(C)C(=O)OC(=O)O' , 'CN(C)C(=O)ON' , 'CN(C)C(=O)O[N+](C)(C)C' , 'CN(C)C(=O)ONC(=O)N' , 'CNOC(=O)N(C)C' , 'CN(C)C(=O)ONON' , 'CN(C)C(=O)OC#N' , 'CCOC(=O)N(C)C' , 'CN(C)C(=O)OS(=O)O' , 'CCOOC(=O)N(C)C' , 'CN(C)C(=O)O[O-]']

urea = ['CN(C)C(=O)NO' , 'CN(C)C(=O)NS' , 'CN(C)C(=O)NC(=O)O' , 'CN(C)C(=O)NN' , 'CN(C)C(=O)N[N+](C)(C)C' , 'CN(C)C(=O)NNC(=O)N' , 'CNNC(=O)N(C)C' , 'CN(C)C(=O)NNON' , 'CN(C)C(=O)NC#N' , 'CCNC(=O)N(C)C' , 'CN(C)C(=O)NS(=O)O' , 'CCONC(=O)N(C)C' , 'CN(C)C(=O)N[O-]']     
         

## Testing which SMILES strings to use to perform substructure searches with to determine the dihedral for torsion scans

These blocks are used to test which smiles strings to use to determine the dihedral indices of the datasets of molecules 


In [65]:
# find indices for enyl dataset 
for m in enyl: 
    torsion_smarts='[C:1]-[C:2]=[C:3]-[c:4]'
    mol=Molecule.from_smiles(m, allow_undefined_stereo=True)
    #print(mol.find_rotatable_bonds())
    omega = mol.chemical_environment_matches(torsion_smarts)
    print(omega)


Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017c240c0> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017c24a50> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017c24f90> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe013e26480> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe013e26360> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe013e46900> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe013e460f0> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *'

[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(11, 10, 9, 6)]
[(0, 1, 2, 3)]


In [66]:
#styrene 
for m in styrene: 
    torsion_smarts='[H:1]-[C:2]=[C:3]-[c:4]'
    mol=Molecule.from_smiles(m, allow_undefined_stereo=True)
    #print(mol.find_rotatable_bonds())
    omega = mol.chemical_environment_matches(torsion_smarts)
    print(omega)

Problematic atoms are:
Atom atomic num: 16, name: , idx: 8, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 5, aromatic: True, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 9, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 10, aromatic: False, chiral: False



[(9, 0, 1, 2), (10, 0, 1, 2)]
[(9, 0, 1, 2), (10, 0, 1, 2)]
[(11, 0, 1, 2), (12, 0, 1, 2)]
[(9, 0, 1, 2), (10, 0, 1, 2)]
[(26, 11, 10, 7), (27, 11, 10, 7)]
[(12, 0, 1, 2), (13, 0, 1, 2)]
[(19, 9, 8, 5), (20, 9, 8, 5)]
[(11, 0, 1, 2), (12, 0, 1, 2)]
[(10, 0, 1, 2), (11, 0, 1, 2)]
[(17, 8, 7, 4), (18, 8, 7, 4)]
[(11, 0, 1, 2), (12, 0, 1, 2)]
[(21, 10, 9, 6), (22, 10, 9, 6)]
[(9, 0, 1, 2), (10, 0, 1, 2)]


In [67]:
#amide_primary
for m in amide_primary: 
    torsion_smarts='[H:1]-[N:2]-[C:3]=[O:4]'
    mol=Molecule.from_smiles(m, allow_undefined_stereo=True)
    #print(mol.find_rotatable_bonds())
    omega = mol.chemical_environment_matches(torsion_smarts)
    print(omega)

Problematic atoms are:
Atom atomic num: 16, name: , idx: 5, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 3, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False



[(4, 2, 0, 1), (5, 2, 0, 1)]
[(4, 2, 0, 1), (5, 2, 0, 1)]
[(7, 5, 0, 1), (8, 5, 0, 1)]
[(4, 2, 0, 1), (5, 2, 0, 1), (6, 3, 0, 1), (7, 3, 0, 1)]
[(16, 6, 4, 5), (17, 6, 4, 5)]
[(7, 2, 0, 1), (8, 2, 0, 1), (9, 3, 0, 1), (9, 3, 4, 5), (10, 6, 4, 5), (11, 6, 4, 5)]
[(10, 1, 2, 3)]
[(6, 2, 0, 1), (7, 2, 0, 1), (8, 3, 0, 1)]
[(5, 4, 2, 3), (6, 4, 2, 3)]
[(10, 4, 2, 3), (11, 4, 2, 3)]
[]
[(11, 5, 3, 4), (12, 5, 3, 4)]
[(4, 2, 0, 1), (5, 2, 0, 1)]


In [68]:
#amide_secondary
for m in amide_secondary: 
    torsion_smarts='[C:1]-[N:2]-[C:3]=[O:4]'
    mol=Molecule.from_smiles(m, allow_undefined_stereo=True)
    #print(mol.find_rotatable_bonds())
    omega = mol.chemical_environment_matches(torsion_smarts)
    print(omega)

Problematic atoms are:
Atom atomic num: 16, name: , idx: 4, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 2, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 5, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False



[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3), (5, 4, 2, 3), (6, 4, 2, 3), (7, 4, 2, 3)]
[(0, 1, 2, 3), (2, 4, 5, 6), (5, 4, 2, 3)]
[(0, 1, 2, 3), (5, 4, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(5, 4, 2, 3)]
[(0, 1, 2, 3)]
[(6, 5, 3, 4)]
[(0, 1, 2, 3)]


In [69]:
#amide_tertiary
for m in amide_tertiary: 
    torsion_smarts='[C:1]-[N:2]-[C:3]=[O:4]'
    mol=Molecule.from_smiles(m, allow_undefined_stereo=True)
    #print(mol.find_rotatable_bonds())
    omega = mol.chemical_environment_matches(torsion_smarts)
    print(omega)

Problematic atoms are:
Atom atomic num: 16, name: , idx: 5, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 3, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False



[(0, 1, 3, 4), (2, 1, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4), (6, 5, 3, 4), (7, 5, 3, 4), (8, 5, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4), (3, 5, 6, 7), (6, 5, 3, 4)]
[(0, 1, 2, 3), (5, 4, 2, 3), (6, 4, 2, 3)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(5, 4, 2, 3), (6, 4, 2, 3)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(6, 5, 3, 4), (7, 5, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]


In [70]:
# carbonyl
for m in carbonyl: 
    torsion_smarts='[C:1]=[C:2]-[C:3]=[O:4]'
    mol=Molecule.from_smiles(m, allow_undefined_stereo=True)
    #print(mol.find_rotatable_bonds())
    omega = mol.chemical_environment_matches(torsion_smarts)
    print(omega)


Problematic atoms are:
Atom atomic num: 16, name: , idx: 4, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 2, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 5, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False



[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(7, 6, 4, 5)]
[(0, 1, 2, 3)]
[(5, 4, 2, 3)]
[(0, 1, 2, 3)]
[(0, 1, 2, 3)]
[(5, 4, 2, 3)]
[(0, 1, 2, 3)]
[(6, 5, 3, 4)]
[(0, 1, 2, 3)]


In [71]:
#carbamate
for m in carbamate: 
    torsion_smarts='[C:1]-[N:2]-[C:3]=[O:4]'
    mol=Molecule.from_smiles(m, allow_undefined_stereo=True)
    #print(mol.find_rotatable_bonds())
    omega = mol.chemical_environment_matches(torsion_smarts)
    print(omega)

[(0, 1, 3, 4), (2, 1, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(6, 5, 3, 4), (7, 5, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]


Problematic atoms are:
Atom atomic num: 16, name: , idx: 6, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 5, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 8, aromatic: False, chiral: False



[(0, 1, 3, 4), (2, 1, 3, 4)]
[(6, 5, 3, 4), (7, 5, 3, 4)]
[(0, 1, 3, 4), (2, 1, 3, 4)]
[(7, 6, 4, 5), (8, 6, 4, 5)]
[(0, 1, 3, 4), (2, 1, 3, 4)]


In [72]:
#urea
for m in urea: 
    torsion_smarts='[C:1]-[N:2]-[C:3]-[N:4]'
    mol=Molecule.from_smiles(m, allow_undefined_stereo=True)
    #print(mol.find_rotatable_bonds())
    omega = mol.chemical_environment_matches(torsion_smarts)
    print(omega)

[(0, 1, 3, 5), (2, 1, 3, 5)]
[(0, 1, 3, 5), (2, 1, 3, 5)]
[(0, 1, 3, 5), (2, 1, 3, 5), (6, 5, 3, 1)]
[(0, 1, 3, 5), (2, 1, 3, 5)]
[(0, 1, 3, 5), (2, 1, 3, 5)]


Problematic atoms are:
Atom atomic num: 16, name: , idx: 6, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 7, name: , idx: 5, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 8, aromatic: False, chiral: False



[(0, 1, 3, 5), (2, 1, 3, 5)]
[(6, 5, 3, 2), (7, 5, 3, 2)]
[(0, 1, 3, 5), (2, 1, 3, 5)]
[(0, 1, 3, 5), (2, 1, 3, 5), (6, 5, 3, 1)]
[(1, 2, 3, 5), (6, 5, 3, 2), (7, 5, 3, 2)]
[(0, 1, 3, 5), (2, 1, 3, 5)]
[(7, 6, 4, 3), (8, 6, 4, 3)]
[(0, 1, 3, 5), (2, 1, 3, 5)]


## Preparing the .json for the dataset submission

In [74]:


factory = TorsiondriveDatasetFactory()

factory.scf_properties


dataset = factory.create_dataset(dataset_name="OpenFF WBO TorsionDrives v1.0",
                                 tagline="Torsiondrives for selected dihedrals of varying WBO",
                                 description="Torsiondrives for selected dihedrals of varying WBO",
                                 molecules=[])

dataset.metadata.long_description_url = "https://github.com/openforcefield/qca-dataset-submission/"

dataset.metadata.submitter = 'jmaat'
dataset.dict()




def populate_dataset(dataset, moleculesDict):
    """
    moleculesDict: key are dataset names and the items are the smiles datasets in a list and also the smiles for the dihedral substrucutres search
    """
    failed=[]
    count=0
    keys=0
    smiles=[]
    for key, item in moleculesDict.items():
        keys+=1
        for s in item[0]:
                smiles.append(s)
                count+=1

                mol=Molecule.from_smiles(s, allow_undefined_stereo=True)
                dihedral_indices = mol.chemical_environment_matches(item[1])
                attributes = factory.create_cmiles_metadata(mol)
                
                print("here")
                
                
                keywords = {"dihedral_ranges": [(-180, 180)]}
                dihedral_indices = [list(indices) for indices in dihedral_indices]
                index=key+ "_" + s
                
                print(mol)
                print(dihedral_indices)
                print(attributes)
                print(keywords)
                
                try: 
                    dataset.add_molecule(index=index,
                         molecule=mol,
                         dihedrals=dihedral_indices,
                         attributes=attributes,
                         keywords=keywords)
                except:
                    print("error")
                    failed.append(s)
                    

    print(failed)   
    print(count)
    print(keys)
    print(smiles)
    print(len(smiles))
    return dataset



Deduplication                 : 0it [00:00, ?it/s]
Preparation                   : 0it [00:00, ?it/s]


In [None]:
#generate the dataset 
moleculesDict={ 'enyl' : [enyl, '[C:1]-[C:2]=[C:3]-[c:4]'], 
                'styrene' : [styrene, '[H:1]-[C:2]=[C:3]-[c:4]'], 
                'amide_primary' :[amide_primary, '[H:1]-[N:2]-[C:3]=[O:4]'], 
                'amide_secondary' :[amide_secondary, '[C:1]-[N:2]-[C:3]=[O:4]'], 
                'amide_tertiary' :[amide_tertiary, '[C:1]-[N:2]-[C:3]=[O:4]'], 
                'carbonyl' :[carbonyl, '[C:1]=[C:2]-[C:3]=[O:4]'], 
                'carbamate' :[carbamate,'[C:1]-[N:2]-[C:3]=[O:4]'], 
                'urea' : [urea,'[C:1]-[N:2]-[C:3]-[N:4]']}


ds=populate_dataset(dataset, moleculesDict)




ds.export_dataset('dataset.json')

#! bzip2 dataset.json
ds.molecules_to_file('molecules_wbo.smi', 'smi')

# deduplicate lines in smiles file
! cat molecules_wbo.smi | uniq > molecules-dedup.smi
! mv molecules-dedup.smi molecules_wbo.smi

ds.visualize('torsions.pdf')


Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017a82ea0> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017a21570> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017a9ef30> >]



here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])O[H])[H]'
[[0, 1, 2, 3]]
canonical_smiles='CC=Cc1ccc(cc1)O' canonical_isomeric_smiles='CC=Cc1ccc(cc1)O' canonical_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])O[H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])O[H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:16][c:5]1[c:6]([c:7]([c:8]([c:9]([c:4]1[C:3](=[C:2]([H:14])[C:1]([H:11])([H:12])[H:13])[H:15])[H:19])[H:18])[O:10][H:20])[H:17]' molecular_formula='C9H10O' standard_inchi='InChI=1S/C9H10O/c1-2-3-8-4-6-9(10)7-5-8/h2-7,10H,1H3' inchi_key='UMFCIIBZHQXRCJ-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])S[H])[H]'
[[0, 1, 2, 3]]
canonical_smiles='CC=Cc1ccc(cc1)S' canonical_isomeric_smiles='CC=Cc1ccc(cc1)S' canonical_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017a9e3f0> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017c24030> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe0179fdc90> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe01799f8a0> >]



here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])C(=O)O[H])[H]'
[[0, 1, 2, 3]]
canonical_smiles='CC=Cc1ccc(cc1)C(=O)O' canonical_isomeric_smiles='CC=Cc1ccc(cc1)C(=O)O' canonical_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])C(=O)O[H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])C(=O)O[H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:18][c:5]1[c:6]([c:7]([c:8]([c:9]([c:4]1[C:3](=[C:2]([H:16])[C:1]([H:13])([H:14])[H:15])[H:17])[H:21])[H:20])[C:10](=[O:11])[O:12][H:22])[H:19]' molecular_formula='C10H10O2' standard_inchi='InChI=1S/C10H10O2/c1-2-3-8-4-6-9(7-5-8)10(11)12/h2-7H,1H3,(H,11,12)' inchi_key='YSJQODKIOLHJOC-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])N([H])[H])[H]'
[[0, 1, 2, 3]]
canonical_smiles='CC=Cc1ccc(cc1)N' canonical_isomeric_smiles='CC=Cc1cc

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe01799f3c0> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe015a81e70> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe015a81780> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017a9eae0> >]



here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])[N+](C([H])([H])[H])(C([H])([H])[H])C([H])([H])[H])[H]'
[[0, 1, 2, 3]]
canonical_smiles='CC=Cc1ccc(cc1)[N+](C)(C)C' canonical_isomeric_smiles='CC=Cc1ccc(cc1)[N+](C)(C)C' canonical_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])[N+](C([H])([H])[H])(C([H])([H])[H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])[N+](C([H])([H])[H])(C([H])([H])[H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:19][c:5]1[c:6]([c:7]([c:8]([c:9]([c:4]1[C:3](=[C:2]([H:17])[C:1]([H:14])([H:15])[H:16])[H:18])[H:22])[H:21])[N+:10]([C:11]([H:23])([H:24])[H:25])([C:12]([H:26])([H:27])[H:28])[C:13]([H:29])([H:30])[H:31])[H:20]' molecular_formula='C12H18N' standard_inchi='InChI=1S/C12H18N/c1-5-6-11-7-9-12(10-8-11)13(2,3)4/h5-10H,1-4H3/q+1' inchi_key='KWNXUIQDSPKVJP-UHFFFAOYSA-N'
{'dihedral_ranges': [(-18

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe015a816f0> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe015a81bd0> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017c24d20> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe015d4bea0> >]



here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])N([H])C([H])([H])[H])[H]'
[[0, 1, 2, 3]]
canonical_smiles='CC=Cc1ccc(cc1)NC' canonical_isomeric_smiles='CC=Cc1ccc(cc1)NC' canonical_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])N([H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])N([H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:17][c:5]1[c:6]([c:7]([c:8]([c:9]([c:4]1[C:3](=[C:2]([H:15])[C:1]([H:12])([H:13])[H:14])[H:16])[H:20])[H:19])[N:10]([H:21])[C:11]([H:22])([H:23])[H:24])[H:18]' molecular_formula='C10H13N' standard_inchi='InChI=1S/C10H13N/c1-3-4-9-5-7-10(11-2)8-6-9/h3-8,11H,1-2H3' inchi_key='KJJDBVRTBKXDIV-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])N([H])ON([H])[H])[H]'
[[0, 1, 2, 3]]
canonical_smiles='CC=Cc1ccc(cc1)N

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe015a354e0> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe015d4b7b0> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017a82240> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017a21270> >]



here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C#N)[H])[H])C(=C([H])C([H])([H])[H])[H])[H]'
[[0, 1, 2, 3]]
canonical_smiles='CC=Cc1ccc(cc1)C#N' canonical_isomeric_smiles='CC=Cc1ccc(cc1)C#N' canonical_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C#N)[H])[H])C(=C([H])C([H])([H])[H])[H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C#N)[H])[H])C(=C([H])C([H])([H])[H])[H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:18][c:6]1[c:5]([c:4]([c:9]([c:8]([c:7]1[C:10]#[N:11])[H:19])[H:20])[C:3](=[C:2]([H:15])[C:1]([H:12])([H:13])[H:14])[H:16])[H:17]' molecular_formula='C10H9N' standard_inchi='InChI=1S/C10H9N/c1-2-3-9-4-6-10(8-11)7-5-9/h2-7H,1H3' inchi_key='DTFJDKQVJTWWAB-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])C([H])([H])[H])[H]'
[[0, 1, 2, 3]]
canonical_smiles='CC=Cc1ccc(cc1)C' canonical_isomeric_smiles='CC=Cc1ccc(cc1)C' canonical_explicit_hydrogen_smiles='[H]c1

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe015ad0e10> >]

Problematic atoms are:
Atom atomic num: 16, name: , idx: 9, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 6, aromatic: True, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 10, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 11, aromatic: False, chiral: False
Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe0179fdcf0> >]

Problematic atoms are:
Atom atomic num: 16, name: , idx: 9, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 6, aromatic: True, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 10, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic 

here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])S(=O)O[H])[H]'
[[0, 1, 2, 3]]
canonical_smiles='CC=Cc1ccc(cc1)S(=O)O' canonical_isomeric_smiles='CC=Cc1ccc(cc1)S(=O)O' canonical_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])S(=O)O[H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])S(=O)O[H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:18][c:5]1[c:6]([c:7]([c:8]([c:9]([c:4]1[C:3](=[C:2]([H:16])[C:1]([H:13])([H:14])[H:15])[H:17])[H:21])[H:20])[S:10](=[O:11])[O:12][H:22])[H:19]' molecular_formula='C9H10O2S' standard_inchi='InChI=1S/C9H10O2S/c1-2-3-8-4-6-9(7-5-8)12(10)11/h2-7H,1H3,(H,10,11)' inchi_key='ZEHBEWKQJLBGOQ-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])OC([H])([H])C([H])([H])[H])[H]'
[[11, 10, 9, 6]]
canonical_smiles='CCOc1ccc(cc1)C=CC' canonical_isom

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017cc4ae0> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017cc4570> >]

Problematic bonds are: [<openeye.oechem.OEBondBase; proxy of <Swig Object of type 'OEChem::OEBondBase *' at 0x7fe017cc42d0> >]



here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])[O-])[H]'
[[0, 1, 2, 3]]
canonical_smiles='CC=Cc1ccc(cc1)[O-]' canonical_isomeric_smiles='CC=Cc1ccc(cc1)[O-]' canonical_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])[O-])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])C([H])([H])[H])[H])[H])[H])[O-])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:16][c:5]1[c:6]([c:7]([c:8]([c:9]([c:4]1[C:3](=[C:2]([H:14])[C:1]([H:11])([H:12])[H:13])[H:15])[H:19])[H:18])[O-:10])[H:17]' molecular_formula='C9H9O' standard_inchi='InChI=1S/C9H10O/c1-2-3-8-4-6-9(10)7-5-8/h2-7,10H,1H3/p-1' inchi_key='UMFCIIBZHQXRCJ-UHFFFAOYSA-M'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])[H])[H])[H])[H])O[H])[H]'
[[9, 0, 1, 2], [10, 0, 1, 2]]
canonical_smiles='C=Cc1ccc(cc1)O' canonical_isomeric_smiles='C=Cc1ccc(cc1)O' canonical_explicit_hydrogen_smiles='[H]c1c(c(c(

Problematic atoms are:
Atom atomic num: 16, name: , idx: 8, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 5, aromatic: True, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 9, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 10, aromatic: False, chiral: False



here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])[H])[H])[H])[H])C([H])([H])[H])[H]'
[[17, 8, 7, 4], [18, 8, 7, 4]]
canonical_smiles='Cc1ccc(cc1)C=C' canonical_isomeric_smiles='Cc1ccc(cc1)C=C' canonical_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])[H])[H])[H])[H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])[H])[H])[H])[H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:14][c:4]1[c:3]([c:2]([c:7]([c:6]([c:5]1[C:8](=[C:9]([H:18])[H:19])[H:17])[H:15])[H:16])[C:1]([H:10])([H:11])[H:12])[H:13]' molecular_formula='C9H10' standard_inchi='InChI=1S/C9H10/c1-3-9-6-4-8(2)5-7-9/h3-7H,1H2,2H3' inchi_key='JLBJTVDPSNHSKJ-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])[H])[H])[H])[H])S(=O)O[H])[H]'
[[11, 0, 1, 2], [12, 0, 1, 2]]
canonical_smiles='C=Cc1ccc(cc1)S(=O)O' canonical_isomeric_smiles='C=Cc1ccc(cc1)S(=O)O' canonical_explicit_hydrogen_smiles

Problematic atoms are:
Atom atomic num: 16, name: , idx: 8, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 5, aromatic: True, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 9, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 10, aromatic: False, chiral: False

Problematic atoms are:
Atom atomic num: 16, name: , idx: 14, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 3, aromatic: True, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 15, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 16, aromatic: False, chiral: False



here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])[H])[H])[H])[H])OC([H])([H])C([H])([H])[H])[H]'
[[21, 10, 9, 6], [22, 10, 9, 6]]
canonical_smiles='CCOc1ccc(cc1)C=C' canonical_isomeric_smiles='CCOc1ccc(cc1)C=C' canonical_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])[H])[H])[H])[H])OC([H])([H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]c1c(c(c(c(c1C(=C([H])[H])[H])[H])[H])OC([H])([H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:18][c:6]1[c:5]([c:4]([c:9]([c:8]([c:7]1[C:10](=[C:11]([H:22])[H:23])[H:21])[H:19])[H:20])[O:3][C:2]([H:15])([H:16])[C:1]([H:12])([H:13])[H:14])[H:17]' molecular_formula='C10H12O' standard_inchi='InChI=1S/C10H12O/c1-3-9-5-7-10(8-6-9)11-4-2/h3,5-8H,1,4H2,2H3' inchi_key='OBRYRJYZWVLVLF-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]c1c(c(c(c(c1C(=C([H])[H])[H])[H])[H])[O-])[H]'
[[9, 0, 1, 2], [10, 0, 1, 2]]
canonical_smiles='C=Cc1ccc(cc1)[O-]' canoni

Problematic atoms are:
Atom atomic num: 16, name: , idx: 5, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 3, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False

Problematic atoms are:
Atom atomic num: 16, name: , idx: 5, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 3, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False

Problematic atoms are:
Atom atomic num: 16, name: , idx: 7, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 5, aromatic: False, chiral: False

here
Molecule with name '' and SMILES '[H]C([H])([H])N(C(=O)S(=O)O[H])C([H])([H])[H]'
[]
canonical_smiles='CN(C)C(=O)S(=O)O' canonical_isomeric_smiles='CN(C)C(=O)S(=O)O' canonical_explicit_hydrogen_smiles='[H]C([H])([H])N(C(=O)S(=O)O[H])C([H])([H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]C([H])([H])N(C(=O)S(=O)O[H])C([H])([H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:9][C:1]([H:10])([H:11])[N:2]([C:4](=[O:5])[S:6](=[O:7])[O:8][H:15])[C:3]([H:12])([H:13])[H:14]' molecular_formula='C3H7NO3S' standard_inchi='InChI=1S/C3H7NO3S/c1-4(2)3(5)8(6)7/h1-2H3,(H,6,7)' inchi_key='ZGFSFYSTJWNFMV-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]C([H])([H])C([H])([H])OC(=O)N([H])[H]'
[[11, 5, 3, 4], [12, 5, 3, 4]]
canonical_smiles='CCOC(=O)N' canonical_isomeric_smiles='CCOC(=O)N' canonical_explicit_hydrogen_smiles='[H]C([H])([H])C([H])([H])OC(=O)N([H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]C([H])([H])C([H])([H])OC(=O)

Problematic atoms are:
Atom atomic num: 16, name: , idx: 4, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 2, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 5, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False



here
Molecule with name '' and SMILES '[H]C([H])([H])C([H])([H])C(=O)N([H])C([H])([H])[H]'
[[5, 4, 2, 3]]
canonical_smiles='CCC(=O)NC' canonical_isomeric_smiles='CCC(=O)NC' canonical_explicit_hydrogen_smiles='[H]C([H])([H])C([H])([H])C(=O)N([H])C([H])([H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]C([H])([H])C([H])([H])C(=O)N([H])C([H])([H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:7][C:1]([H:8])([H:9])[C:2]([H:10])([H:11])[C:3](=[O:4])[N:5]([H:12])[C:6]([H:13])([H:14])[H:15]' molecular_formula='C4H9NO' standard_inchi='InChI=1S/C4H9NO/c1-3-4(6)5-2/h3H2,1-2H3,(H,5,6)' inchi_key='QJQAMHYHNCADNR-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]C([H])([H])N([H])C(=O)S(=O)O[H]'
[[0, 1, 2, 3]]
canonical_smiles='CNC(=O)S(=O)O' canonical_isomeric_smiles='CNC(=O)S(=O)O' canonical_explicit_hydrogen_smiles='[H]C([H])([H])N([H])C(=O)S(=O)O[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]C([H])([H])N([H])C(=O)S(=O)O[H]' canon

Problematic atoms are:
Atom atomic num: 16, name: , idx: 4, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 2, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 5, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False

Problematic atoms are:
Atom atomic num: 16, name: , idx: 8, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 6, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 9, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 10, aromatic: False, chiral: False



here
Molecule with name '' and SMILES '[H]C([H])([H])C([H])([H])OC(=O)N([H])C([H])([H])[H]'
[[6, 5, 3, 4]]
canonical_smiles='CCOC(=O)NC' canonical_isomeric_smiles='CCOC(=O)NC' canonical_explicit_hydrogen_smiles='[H]C([H])([H])C([H])([H])OC(=O)N([H])C([H])([H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]C([H])([H])C([H])([H])OC(=O)N([H])C([H])([H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:8][C:1]([H:9])([H:10])[C:2]([H:11])([H:12])[O:3][C:4](=[O:5])[N:6]([H:13])[C:7]([H:14])([H:15])[H:16]' molecular_formula='C4H9NO2' standard_inchi='InChI=1S/C4H9NO2/c1-3-7-4(6)5-2/h3H2,1-2H3,(H,5,6)' inchi_key='SURZCVYFPAXNGN-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]C([H])([H])N([H])C(=O)[O-]'
[[0, 1, 2, 3]]
canonical_smiles='CNC(=O)[O-]' canonical_isomeric_smiles='CNC(=O)[O-]' canonical_explicit_hydrogen_smiles='[H]C([H])([H])N([H])C(=O)[O-]' canonical_isomeric_explicit_hydrogen_smiles='[H]C([H])([H])N([H])C(=O)[O-]' canonical

Problematic atoms are:
Atom atomic num: 16, name: , idx: 5, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 3, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False

Problematic atoms are:
Atom atomic num: 16, name: , idx: 5, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 3, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False

Problematic atoms are:
Atom atomic num: 16, name: , idx: 7, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 5, aromatic: False, chiral: False

here
Molecule with name '' and SMILES '[H]C([H])([H])N(C(=O)S(=O)O[H])C([H])([H])[H]'
[[0, 1, 3, 4], [2, 1, 3, 4]]
canonical_smiles='CN(C)C(=O)S(=O)O' canonical_isomeric_smiles='CN(C)C(=O)S(=O)O' canonical_explicit_hydrogen_smiles='[H]C([H])([H])N(C(=O)S(=O)O[H])C([H])([H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]C([H])([H])N(C(=O)S(=O)O[H])C([H])([H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:9][C:1]([H:10])([H:11])[N:2]([C:4](=[O:5])[S:6](=[O:7])[O:8][H:15])[C:3]([H:12])([H:13])[H:14]' molecular_formula='C3H7NO3S' standard_inchi='InChI=1S/C3H7NO3S/c1-4(2)3(5)8(6)7/h1-2H3,(H,6,7)' inchi_key='ZGFSFYSTJWNFMV-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]C([H])([H])C([H])([H])OC(=O)N(C([H])([H])[H])C([H])([H])[H]'
[[6, 5, 3, 4], [7, 5, 3, 4]]
canonical_smiles='CCOC(=O)N(C)C' canonical_isomeric_smiles='CCOC(=O)N(C)C' canonical_explicit_hydrogen_smiles='[H]C([H])([H])C([H])([H])OC(=O)N(C([H])([H])[H])C([H])([H])[H]' 

Problematic atoms are:
Atom atomic num: 16, name: , idx: 4, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 2, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 5, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False



here
Molecule with name '' and SMILES '[H]C(=C([H])C(=O)C([H])([H])C([H])([H])[H])[H]'
[[5, 4, 2, 3]]
canonical_smiles='CCC(=O)C=C' canonical_isomeric_smiles='CCC(=O)C=C' canonical_explicit_hydrogen_smiles='[H]C(=C([H])C(=O)C([H])([H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]C(=C([H])C(=O)C([H])([H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:13][C:6](=[C:5]([H:12])[C:3](=[O:4])[C:2]([H:10])([H:11])[C:1]([H:7])([H:8])[H:9])[H:14]' molecular_formula='C5H8O' standard_inchi='InChI=1S/C5H8O/c1-3-5(6)4-2/h3H,1,4H2,2H3' inchi_key='JLIDVCMBCGBIEY-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]C(=C([H])C(=O)S(=O)O[H])[H]'
[[0, 1, 2, 3]]
canonical_smiles='C=CC(=O)S(=O)O' canonical_isomeric_smiles='C=CC(=O)S(=O)O' canonical_explicit_hydrogen_smiles='[H]C(=C([H])C(=O)S(=O)O[H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]C(=C([H])C(=O)S(=O)O[H])[H]' canonical_isomeric_explicit_hydrogen_ma

Problematic atoms are:
Atom atomic num: 16, name: , idx: 4, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 2, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 5, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 6, aromatic: False, chiral: False

Problematic atoms are:
Atom atomic num: 16, name: , idx: 6, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 6, name: , idx: 4, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 8, aromatic: False, chiral: False



here
Molecule with name '' and SMILES '[H]C(=C([H])C(=O)OC([H])([H])C([H])([H])[H])[H]'
[[6, 5, 3, 4]]
canonical_smiles='CCOC(=O)C=C' canonical_isomeric_smiles='CCOC(=O)C=C' canonical_explicit_hydrogen_smiles='[H]C(=C([H])C(=O)OC([H])([H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]C(=C([H])C(=O)OC([H])([H])C([H])([H])[H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:14][C:7](=[C:6]([H:13])[C:4](=[O:5])[O:3][C:2]([H:11])([H:12])[C:1]([H:8])([H:9])[H:10])[H:15]' molecular_formula='C5H8O2' standard_inchi='InChI=1S/C5H8O2/c1-3-5(6)7-4-2/h3H,1,4H2,2H3' inchi_key='JIGUQPWFLRLWPJ-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]C(=C([H])C(=O)[O-])[H]'
[[0, 1, 2, 3]]
canonical_smiles='C=CC(=O)[O-]' canonical_isomeric_smiles='C=CC(=O)[O-]' canonical_explicit_hydrogen_smiles='[H]C(=C([H])C(=O)[O-])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]C(=C([H])C(=O)[O-])[H]' canonical_isomeric_explicit_hydrogen_mapped

Problematic atoms are:
Atom atomic num: 16, name: , idx: 6, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 5, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 8, aromatic: False, chiral: False

Problematic atoms are:
Atom atomic num: 16, name: , idx: 6, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 5, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 8, aromatic: False, chiral: False

Problematic atoms are:
Atom atomic num: 16, name: , idx: 8, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False

here
Molecule with name '' and SMILES '[H]C([H])([H])N(C(=O)OS(=O)O[H])C([H])([H])[H]'
[[0, 1, 3, 4], [2, 1, 3, 4]]
canonical_smiles='CN(C)C(=O)OS(=O)O' canonical_isomeric_smiles='CN(C)C(=O)OS(=O)O' canonical_explicit_hydrogen_smiles='[H]C([H])([H])N(C(=O)OS(=O)O[H])C([H])([H])[H]' canonical_isomeric_explicit_hydrogen_smiles='[H]C([H])([H])N(C(=O)OS(=O)O[H])C([H])([H])[H]' canonical_isomeric_explicit_hydrogen_mapped_smiles='[H:10][C:1]([H:11])([H:12])[N:2]([C:4](=[O:5])[O:6][S:7](=[O:8])[O:9][H:16])[C:3]([H:13])([H:14])[H:15]' molecular_formula='C3H7NO4S' standard_inchi='InChI=1S/C3H7NO4S/c1-4(2)3(5)8-9(6)7/h1-2H3,(H,6,7)' inchi_key='QTWPFTUNHADFQB-UHFFFAOYSA-N'
{'dihedral_ranges': [(-180, 180)]}
here
Molecule with name '' and SMILES '[H]C([H])([H])C([H])([H])OOC(=O)N(C([H])([H])[H])C([H])([H])[H]'
[[7, 6, 4, 5], [8, 6, 4, 5]]
canonical_smiles='CCOOC(=O)N(C)C' canonical_isomeric_smiles='CCOOC(=O)N(C)C' canonical_explicit_hydrogen_smiles='[H]C([H])([H])C([H])([H])OOC(=O)N(C([H])([H])[H]

Problematic atoms are:
Atom atomic num: 16, name: , idx: 6, aromatic: False, chiral: True with bonds:
bond order: 1, chiral: False to atom atomic num: 7, name: , idx: 5, aromatic: False, chiral: False
bond order: 2, chiral: False to atom atomic num: 8, name: , idx: 7, aromatic: False, chiral: False
bond order: 1, chiral: False to atom atomic num: 8, name: , idx: 8, aromatic: False, chiral: False



In [None]:
#get dataset metadata
print(ds.n_molecules)
print(ds.n_records)