In [1]:
from rdkit import Chem
import gzip
from rdkit.Chem import rdDistGeom
import pickle
import rdkit
import os
print(f'RDKit version: {rdkit.__version__}')

from tqdm import tqdm

import time
# Number of conformers requested per molecule; read by generate_confs() when it
# calls rdDistGeom.EmbedMultipleConfs.
numConfs=1
def generate_confs(smiles, num_confs=None):
    """Embed conformers for each SMILES string and count how many were produced.

    Each SMILES is parsed, explicit hydrogens are added, and
    ``rdDistGeom.EmbedMultipleConfs`` is run with a shared ETKDGv3 parameter
    object configured below.

    Args:
        smiles: Iterable of SMILES strings.
        num_confs: Number of conformers to request per molecule. When ``None``
            (the default) the module-level ``numConfs`` value is used, which
            matches the previous behaviour.

    Returns:
        list[int]: ``m.GetNumConformers()`` for every molecule that was parsed
        and embedded without raising. Entries whose SMILES cannot be parsed, or
        whose embedding raises, are skipped (a message is printed), so the
        result may be shorter than ``smiles`` and is not index-aligned with it.
    """
    if num_confs is None:
        # Resolved at call time so later edits to the notebook-level constant
        # are picked up.
        num_confs = numConfs

    etkdg = rdDistGeom.ETKDGv3()
    etkdg.randomSeed = 0xa700f  # fixed seed for the embedding parameters
    etkdg.verbose = False
    etkdg.numThreads = 4
    # Failure tracking is switched on in the parameters; the counts are not
    # read back inside this function.
    etkdg.trackFailures = True
    etkdg.useRandomCoords = True
    etkdg.pruneRmsThresh = 0.1
    confs_generated = []

    for smi in tqdm(smiles):
        m = Chem.MolFromSmiles(smi)
        if m is None:
            print(f'Failed to create mol from SMILES: {smi}')
            continue
        m = Chem.AddHs(m)
        try:
            rdDistGeom.EmbedMultipleConfs(m, numConfs=num_confs, params=etkdg)
        except Exception as exc:
            # Catch Exception rather than using a bare except, so that
            # KeyboardInterrupt/SystemExit can still stop a long run; also
            # report why the embedding failed.
            print(f'Failed to generate conformers for SMILES: {smi} ({exc})')
            continue
        confs_generated.append(m.GetNumConformers())
    return confs_generated

RDKit version: 2023.03.3


In [2]:
import pandas as pd
# Load the training table and convert each stored molblock to a SMILES string.
df = pd.read_csv('OPERA_Naef_Training.csv')
molblocks = df['molblock'].tolist()

# Chem.MolFromMolBlock returns None for a block it cannot parse, and passing
# None to Chem.MolToSmiles raises. Drop those entries and report how many were
# skipped instead of failing the whole cell.
mols_parsed = [Chem.MolFromMolBlock(mb) for mb in molblocks]
mols = [m for m in mols_parsed if m is not None]
if len(mols) != len(mols_parsed):
    print(f'Skipped {len(mols_parsed) - len(mols)} molblocks that could not be parsed')
smiles = [Chem.MolToSmiles(m) for m in mols]

# start/end hold wall-clock timestamps taken around the conformer generation call.
start = time.time()
confs_generated = generate_confs(smiles)
end = time.time()
print(confs_generated)


 70%|██████▉   | 2112/3018 [00:30<00:18, 49.24it/s] [21:26:37] UFFTYPER: Unrecognized atom type: S_6+6 (5)
[21:26:37] UFFTYPER: Unrecognized atom type: S_5+4 (7)
 71%|███████   | 2138/3018 [00:30<00:10, 82.04it/s][21:26:37] UFFTYPER: Unrecognized atom type: S_5+4 (4)
 73%|███████▎  | 2191/3018 [00:30<00:06, 131.08it/s][21:26:38] UFFTYPER: Unrecognized atom type: S_6+6 (4)
[21:26:38] UFFTYPER: Unrecognized atom type: S_6+6 (11)
 73%|███████▎  | 2215/3018 [00:30<00:05, 157.20it/s][21:26:38] UFFTYPER: Unrecognized atom type: S_5+4 (7)
[21:26:38] UFFTYPER: Unrecognized atom type: S_6+6 (3)
[21:26:38] UFFTYPER: Unrecognized atom type: S_6+6 (11)
[21:26:38] UFFTYPER: Unrecognized atom type: S_6+6 (9)
 74%|███████▍  | 2241/3018 [00:31<00:04, 183.09it/s][21:26:38] UFFTYPER: Unrecognized atom type: S_5+4 (5)
[21:26:38] UFFTYPER: Unrecognized atom type: S_6+6 (1)
[21:26:38] UFFTYPER: Unrecognized atom type: S_6+6 (7)
[21:26:38] UFFTYPER: Unrecognized atom type: S_6+6 (13)
 76%|███████▌  | 2295/3

[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 


