In [None]:
import os
import numpy as np
from rdkit import Chem
import selfies as sf

# ---------- CONFIG ----------
# Input SDF with the molecules to convert, and the directory that receives
# the compressed NumPy archive produced at the end of this cell.
sdf_file = r"D:\molecule3d\data\data\raw\combined_mols_0_to_1000000.sdf"
output_dir = r"D:\molecule3d\data\processed"
os.makedirs(output_dir, exist_ok=True)

# Run every sanitization step except kekulization.
SANITIZE_OPS = Chem.SanitizeFlags.SANITIZE_ALL ^ Chem.SanitizeFlags.SANITIZE_KEKULIZE
# Print a progress line every this many SDF records.
PROGRESS_EVERY = 10000


def _as_object_array(items):
    """Return a 1-D object array whose i-th element is ``items[i]`` itself.

    ``np.array(items, dtype=object)`` only yields this layout when the nested
    lists are ragged; if every entry happens to have the same length NumPy
    builds a 2-D/3-D object array instead. Filling a pre-allocated array keeps
    the saved layout identical regardless of the molecule sizes.
    """
    arr = np.empty(len(items), dtype=object)
    for idx, item in enumerate(items):
        arr[idx] = item
    return arr


# ---------- STORAGE LISTS ----------
# Parallel lists: entry k of each list describes the k-th *kept* molecule.
all_atom_types = []
all_coords = []
all_smiles = []
all_selfies = []

# Failure counters, reported once the loop is done.
n_unparsed = 0
n_no_conformer = 0
n_sanitize_failed = 0
n_smiles_failed = 0
n_selfies_failed = 0

# ---------- PROCESS SDF ----------
# sanitize=False: sanitization is done manually below so that kekulization
# can be left out.
supplier = Chem.SDMolSupplier(sdf_file, sanitize=False)
for i, mol in enumerate(supplier):
    if mol is None:
        # Record could not be parsed by RDKit; nothing to extract.
        n_unparsed += 1
        continue

    try:
        Chem.SanitizeMol(mol, sanitizeOps=SANITIZE_OPS)
    except Exception:
        # Best effort: keep the molecule even if sanitization fails.
        # `Exception` (not a bare except) so a kernel interrupt still stops the loop.
        n_sanitize_failed += 1

    # Explicit hydrogens are kept. Uncomment to strip them:
    # mol = Chem.RemoveHs(mol)

    if mol.GetNumConformers() == 0:
        # Without a conformer there are no coordinates; skip the record
        # instead of letting GetConformer() abort the whole run.
        n_no_conformer += 1
        continue

    # Atom symbols and coordinates, both in RDKit atom-index order.
    atom_types = [atom.GetSymbol() for atom in mol.GetAtoms()]
    # GetPositions() returns an (n_atoms, 3) array; tolist() gives the same
    # [[x, y, z], ...] nested-list form as reading each atom position in turn.
    coords = mol.GetConformer().GetPositions().tolist()

    all_atom_types.append(atom_types)
    all_coords.append(coords)

    # SMILES ("" when RDKit cannot write one for this molecule)
    try:
        smiles = Chem.MolToSmiles(mol, kekuleSmiles=False)
    except Exception:
        smiles = ""
        n_smiles_failed += 1
    all_smiles.append(smiles)

    # SELFIES ("" when there is no SMILES or the encoder rejects it)
    try:
        selfies_str = sf.encoder(smiles) if smiles else ""
    except Exception:
        selfies_str = ""
        n_selfies_failed += 1
    all_selfies.append(selfies_str)

    if (i+1) % PROGRESS_EVERY == 0:
        print(f"Processed {i+1} molecules...")

print(
    f"Kept {len(all_smiles)} molecules "
    f"(unparsed records: {n_unparsed}, no conformer: {n_no_conformer}, "
    f"sanitization failures: {n_sanitize_failed}, "
    f"SMILES failures: {n_smiles_failed}, SELFIES failures: {n_selfies_failed})"
)

# ---------- SAVE TO NPZ ----------
# All four arrays have dtype=object, so readers must call
# np.load(path, allow_pickle=True).
np.savez_compressed(
    os.path.join(output_dir, "molecules_last_.9_million.npz"),
    atom_types=_as_object_array(all_atom_types),
    coords=_as_object_array(all_coords),
    smiles=np.array(all_smiles, dtype=object),
    selfies=np.array(all_selfies, dtype=object)
)

print("Finished processing and saved to NPZ!")

[22:45:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0


Processed 10000 molecules...
Processed 20000 molecules...
Processed 30000 molecules...
Processed 40000 molecules...
Processed 50000 molecules...
Processed 60000 molecules...
Processed 70000 molecules...
Processed 80000 molecules...
Processed 90000 molecules...
Processed 100000 molecules...
Processed 110000 molecules...
Processed 120000 molecules...
Processed 130000 molecules...


[22:48:14] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3


Processed 140000 molecules...


[22:48:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1


Processed 150000 molecules...
Processed 160000 molecules...


[22:49:01] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 4
[22:49:04] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0


Processed 170000 molecules...
Processed 180000 molecules...
Processed 190000 molecules...
Processed 200000 molecules...
Processed 210000 molecules...
Processed 220000 molecules...


[22:50:13] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 5


Processed 230000 molecules...
Processed 240000 molecules...
Processed 250000 molecules...


[22:50:44] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 4
[22:50:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:50:49] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0


Processed 260000 molecules...
Processed 270000 molecules...
Processed 280000 molecules...
Processed 290000 molecules...
Processed 300000 molecules...
Processed 310000 molecules...
Processed 320000 molecules...


[22:52:06] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 4


Processed 330000 molecules...


[22:52:24] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0


Processed 340000 molecules...


[22:52:28] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 4


Processed 350000 molecules...


[22:52:50] Both bonds on one end of an atropisomer are on the same side - atoms are: 2 0


Processed 360000 molecules...


[22:52:53] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 3
[22:52:53] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 3
[22:52:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 6
[22:52:57] Both bonds on one end of an atropisomer are on the same side - atoms are: 13 10
[22:52:57] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 5
[22:52:57] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 4
[22:52:59] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1
[22:53:00] The 2 defining bonds for an atropisomer are co-planar - atoms are: 7 4
[22:53:00] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 3
[22:53:01] Both bonds on one end of an atropisomer are on the same side - atoms are: 12 13
[22:53:02] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 7


Processed 370000 molecules...


[22:53:03] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 10
[22:53:04] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 8
[22:53:04] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 8
[22:53:04] Explicit valence for atom # 7 Si, 5, is greater than permitted
[22:53:07] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 6
[22:53:07] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 4
[22:53:10] The 2 defining bonds for an atropisomer are co-planar - atoms are: 7 10
[22:53:12] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[22:53:12] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[22:53:12] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[22:53:12] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[22:53:12] Both bonds on one end of an 

Processed 380000 molecules...


[22:53:15] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 6
[22:53:17] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:53:18] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 6
[22:53:18] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 7
[22:53:19] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:53:21] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 3


Processed 390000 molecules...


[22:53:24] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:53:26] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 2
[22:53:26] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 1
[22:53:26] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 0
[22:53:26] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 2
[22:53:29] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 10
[22:53:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 4
[22:53:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 5
[22:53:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 6
[22:53:30] The 2 defining bonds for an atropisomer are co-planar - atoms are: 7 6
[22:53:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 3
[22:53:31] Both bonds on on

Processed 400000 molecules...


[22:53:33] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:53:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:53:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:53:39] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:53:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 6
[22:53:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 8
[22:53:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 10
[22:53:41] Both bonds on one end of an atropisomer are on the same side - atoms are: 12 11
[22:53:42] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 8
[22:53:43] The 2 defining bonds for an atropisomer are co-planar - atoms are: 13 11
[22:53:43] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 3


Processed 410000 molecules...


[22:53:49] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:53:49] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:53:50] The 2 defining bonds for an atropisomer are co-planar - atoms are: 4 2
[22:53:51] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 6
[22:53:51] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 1
[22:53:52] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0


Processed 420000 molecules...


[22:53:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 3
[22:53:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 5
[22:53:56] The 2 defining bonds for an atropisomer are co-planar - atoms are: 6 4
[22:53:57] The 2 defining bonds for an atropisomer are co-planar - atoms are: 7 6
[22:53:59] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:54:02] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:54:03] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 11
[22:54:03] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 8
[22:54:03] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 8


Processed 430000 molecules...


[22:54:06] The 2 defining bonds for an atropisomer are co-planar - atoms are: 9 8
[22:54:06] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 7
[22:54:06] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 2
[22:54:08] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 3
[22:54:08] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 2
[22:54:08] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 3
[22:54:08] The 2 defining bonds for an atropisomer are co-planar - atoms are: 8 6
[22:54:09] The 2 defining bonds for an atropisomer are co-planar - atoms are: 10 11
[22:54:10] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 3
[22:54:12] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 14
[22:54:12] Both bonds on one end of an atropisomer are on the same side - atoms are: 14 15
[22:54:12] Both bonds on one end of a

Processed 440000 molecules...


[22:54:14] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 8
[22:54:15] The 2 defining bonds for an atropisomer are co-planar - atoms are: 4 5
[22:54:15] The 2 defining bonds for an atropisomer are co-planar - atoms are: 3 4
[22:54:16] The 2 defining bonds for an atropisomer are co-planar - atoms are: 8 2
[22:54:16] The 2 defining bonds for an atropisomer are co-planar - atoms are: 0 2
[22:54:19] The 2 defining bonds for an atropisomer are co-planar - atoms are: 0 9
[22:54:19] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:54:21] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 7
[22:54:22] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:54:22] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 6
[22:54:26] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 5
[22:54:26] Both bonds on one end of an atropisomer are on the 

Processed 450000 molecules...


[22:54:28] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 0
[22:54:28] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 1
[22:54:28] The 2 defining bonds for an atropisomer are co-planar - atoms are: 1 0
[22:54:28] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 1
[22:54:30] The 2 defining bonds for an atropisomer are co-planar - atoms are: 12 10
[22:54:32] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 1
[22:54:32] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 6
[22:54:33] Explicit valence for atom # 6 Si, 5, is greater than permitted
[22:54:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 8
[22:54:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:54:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:54:35] Both bonds on one end of an atropisomer are on the same si

Processed 460000 molecules...


[22:54:37] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 5
[22:54:37] Both bonds on one end of an atropisomer are on the same side - atoms are: 2 0
[22:54:37] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 3
[22:54:38] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 8
[22:54:39] The 2 defining bonds for an atropisomer are co-planar - atoms are: 4 3
[22:54:39] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 7
[22:54:39] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 12
[22:54:39] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 7
[22:54:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 4
[22:54:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 7
[22:54:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 5
[22:54:41] Both bonds on one en

Processed 470000 molecules...


[22:54:47] The 2 defining bonds for an atropisomer are co-planar - atoms are: 3 2
[22:54:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 3
[22:54:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 2 0
[22:54:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 6
[22:54:49] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 2
[22:54:49] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 3
[22:54:50] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:54:57] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3


Processed 480000 molecules...


[22:54:58] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 0
[22:54:58] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 5
[22:54:59] The 2 defining bonds for an atropisomer are co-planar - atoms are: 8 10
[22:55:00] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:55:01] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 6
[22:55:01] The 2 defining bonds for an atropisomer are co-planar - atoms are: 3 4
[22:55:01] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 1
[22:55:03] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 7
[22:55:03] The 2 defining bonds for an atropisomer are co-planar - atoms are: 6 2
[22:55:03] The 2 defining bonds for an atropisomer are co-planar - atoms are: 6 5
[22:55:03] The 2 defining bonds for an atropisomer are co-planar - atoms are: 6 4
[22:55:03] The 2 defining bonds for an atropisomer are 

Processed 490000 molecules...


[22:55:11] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:55:13] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1
[22:55:14] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 1
[22:55:18] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 4
[22:55:18] The 2 defining bonds for an atropisomer are co-planar - atoms are: 4 2


Processed 500000 molecules...


[22:55:21] Both bonds on one end of an atropisomer are on the same side - atoms are: 13 12
[22:55:27] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 6
[22:55:28] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 0


Processed 510000 molecules...


[22:55:29] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 7
[22:55:29] The 2 defining bonds for an atropisomer are co-planar - atoms are: 8 12
[22:55:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:55:30] The 2 defining bonds for an atropisomer are co-planar - atoms are: 10 3
[22:55:31] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:55:31] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 7
[22:55:31] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 5
[22:55:33] Both bonds on one end of an atropisomer are on the same side - atoms are: 12 7
[22:55:33] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 8
[22:55:33] The 2 defining bonds for an atropisomer are co-planar - atoms are: 12 11
[22:55:33] Both bonds on one end of an atropisomer are on the same side - atoms are: 14 7
[22:55:33] Both bonds on one end of

Processed 520000 molecules...


[22:55:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 7
[22:55:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 8
[22:55:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 4
[22:55:42] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 7
[22:55:42] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 7
[22:55:42] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:55:43] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 4
[22:55:43] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 6
[22:55:43] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 3
[22:55:44] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 9
[22:55:44] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 9
[22:55:46] Both bonds

Processed 530000 molecules...


[22:55:51] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 3
[22:55:53] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 2
[22:55:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 4
[22:55:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 0
[22:55:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 0
[22:55:56] The 2 defining bonds for an atropisomer are co-planar - atoms are: 3 4
[22:55:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 2
[22:55:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 7
[22:55:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 2
[22:55:57] The 2 defining bonds for an atropisomer are co-planar - atoms are: 8 7
[22:55:57] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 5
[22:55:57] Both bonds on one end of

Processed 540000 molecules...


[22:56:00] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 0
[22:56:00] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 4
[22:56:02] The 2 defining bonds for an atropisomer are co-planar - atoms are: 9 10
[22:56:02] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 12
[22:56:02] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 13
[22:56:02] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 10
[22:56:03] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 1
[22:56:03] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 6
[22:56:04] The 2 defining bonds for an atropisomer are co-planar - atoms are: 4 3
[22:56:05] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 6
[22:56:05] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[22:56:06] The 2 defining bond

Processed 550000 molecules...


[22:56:11] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 0
[22:56:11] The 2 defining bonds for an atropisomer are co-planar - atoms are: 3 4
[22:56:11] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 2
[22:56:11] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 3
[22:56:11] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 9
[22:56:11] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:56:11] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 0
[22:56:11] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 7
[22:56:12] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 3
[22:56:14] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 5
[22:56:14] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 6
[22:56:14] Both bonds on one end of

Processed 560000 molecules...


[22:56:20] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 8
[22:56:20] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 4
[22:56:20] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 7
[22:56:20] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 3
[22:56:21] Both bonds on one end of an atropisomer are on the same side - atoms are: 14 12
[22:56:21] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1
[22:56:23] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 6
[22:56:24] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 0
[22:56:24] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 6
[22:56:25] The 2 defining bonds for an atropisomer are co-planar - atoms are: 1 3
[22:56:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 8
[22:56:30] Both bonds on 

Processed 570000 molecules...


[22:56:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 2 3
[22:56:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 4
[22:56:35] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 4
[22:56:35] The 2 defining bonds for an atropisomer are co-planar - atoms are: 6 4
[22:56:36] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 6
[22:56:36] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 10
[22:56:36] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[22:56:38] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1
[22:56:41] Unexpected error hit on line 39761047
[22:56:41] ERROR: moving to the beginning of the next molecule


Processed 580000 molecules...


[22:56:42] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 7
[22:56:42] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 2
[22:56:42] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 4
[22:56:45] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 13
[22:56:46] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 1
[22:56:46] The 2 defining bonds for an atropisomer are co-planar - atoms are: 3 4
[22:56:46] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 5
[22:56:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 2
[22:56:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 3
[22:56:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 6
[22:56:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 7
[22:56:51] Both bonds on one en

Processed 590000 molecules...


[22:56:53] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 4
[22:56:53] The 2 defining bonds for an atropisomer are co-planar - atoms are: 4 3
[22:56:54] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 4
[22:56:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 14 12
[22:56:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 13 11
[22:56:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 16 14
[22:56:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 15 13
[22:56:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 15 13
[22:56:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 16 14
[22:56:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 16 14
[22:56:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 13 15
[22:56:55] Both bon

Processed 600000 molecules...


[22:57:03] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 6
[22:57:03] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 7
[22:57:03] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 9
[22:57:04] Both bonds on one end of an atropisomer are on the same side - atoms are: 12 8
[22:57:04] Both bonds on one end of an atropisomer are on the same side - atoms are: 13 11
[22:57:09] The 2 defining bonds for an atropisomer are co-planar - atoms are: 9 6
[22:57:09] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 5
[22:57:12] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 3
[22:57:13] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 5
[22:57:13] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 5


Processed 610000 molecules...


[22:57:13] The 2 defining bonds for an atropisomer are co-planar - atoms are: 3 7
[22:57:13] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 1
[22:57:13] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 6
[22:57:14] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 4
[22:57:14] Both bonds on one end of an atropisomer are on the same side - atoms are: 12 15
[22:57:15] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1
[22:57:16] Both bonds on one end of an atropisomer are on the same side - atoms are: 15 14
[22:57:17] Both bonds on one end of an atropisomer are on the same side - atoms are: 2 1
[22:57:17] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 4
[22:57:18] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 7
[22:57:18] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 8
[22:57:18] Both bonds on

Processed 620000 molecules...


[22:57:26] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[22:57:26] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1
[22:57:26] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:57:27] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 9
[22:57:28] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 4
[22:57:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 0
[22:57:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 6
[22:57:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 8
[22:57:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 8
[22:57:31] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:57:33] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1
[22:57:34] Both bonds

Processed 630000 molecules...


[22:57:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[22:57:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:57:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 3
[22:57:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 7
[22:57:35] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 3
[22:57:35] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 1
[22:57:35] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 6
[22:57:35] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 3
[22:57:35] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 6
[22:57:35] Both bonds on one end of an atropisomer are on the same side - atoms are: 2 1
[22:57:35] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 7
[22:57:36] Both bonds on one

Processed 640000 molecules...


[22:57:45] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:57:46] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 10
[22:57:46] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 10
[22:57:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1
[22:57:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 2
[22:57:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 12 14
[22:57:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 11
[22:57:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 13 7
[22:57:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 10
[22:57:47] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 0
[22:57:47] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 10
[22:57:47] Both b

Processed 650000 molecules...


[22:57:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 2
[22:57:55] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 7
[22:57:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 3
[22:57:56] The 2 defining bonds for an atropisomer are co-planar - atoms are: 3 2
[22:57:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:58:00] The 2 defining bonds for an atropisomer are co-planar - atoms are: 8 7
[22:58:01] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 4
[22:58:01] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1
[22:58:02] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 4
[22:58:02] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 1
[22:58:02] The 2 defining bonds for an atropisomer are co-planar - atoms are: 7 5
[22:58:02] The 2 defining bonds for an atropisome

Processed 660000 molecules...


[22:58:07] Both bonds on one end of an atropisomer are on the same side - atoms are: 15 14
[22:58:07] Both bonds on one end of an atropisomer are on the same side - atoms are: 13 14
[22:58:07] Both bonds on one end of an atropisomer are on the same side - atoms are: 12 15
[22:58:07] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 5
[22:58:07] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 9
[22:58:10] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 10
[22:58:10] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[22:58:11] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 3
[22:58:11] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 3
[22:58:11] The 2 defining bonds for an atropisomer are co-planar - atoms are: 7 8
[22:58:12] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 4
[22:58:13] Both bo

Processed 670000 molecules...


[22:58:16] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 8
[22:58:17] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 4
[22:58:17] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:58:18] Both bonds on one end of an atropisomer are on the same side - atoms are: 2 4
[22:58:18] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:58:19] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 3
[22:58:20] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 6
[22:58:20] Both bonds on one end of an atropisomer are on the same side - atoms are: 13 6
[22:58:23] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 12
[22:58:23] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 12
[22:58:24] The 2 defining bonds for an atropisomer are co-planar - atoms are: 4 5
[22:58:24] Both bonds on one e

Processed 680000 molecules...


[22:58:28] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 10
[22:58:28] Both bonds on one end of an atropisomer are on the same side - atoms are: 8 0
[22:58:29] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 7
[22:58:29] Both bonds on one end of an atropisomer are on the same side - atoms are: 7 1
[22:58:30] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:58:32] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 13


Processed 690000 molecules...


[22:58:40] Explicit valence for atom # 7 Si, 5, is greater than permitted
[22:58:44] Both bonds on one end of an atropisomer are on the same side - atoms are: 12 9
[22:58:45] The 2 defining bonds for an atropisomer are co-planar - atoms are: 13 7


Processed 700000 molecules...


[22:58:50] The 2 defining bonds for an atropisomer are co-planar - atoms are: 12 13
[22:58:50] The 2 defining bonds for an atropisomer are co-planar - atoms are: 11 12


Processed 710000 molecules...


[22:59:01] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:59:04] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 0
[22:59:08] The 2 defining bonds for an atropisomer are co-planar - atoms are: 11 10
[22:59:10] The 2 defining bonds for an atropisomer are co-planar - atoms are: 1 2
[22:59:10] The 2 defining bonds for an atropisomer are co-planar - atoms are: 0 2
[22:59:12] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 1


Processed 720000 molecules...


[22:59:13] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 2
[22:59:15] The 2 defining bonds for an atropisomer are co-planar - atoms are: 9 8
[22:59:15] The 2 defining bonds for an atropisomer are co-planar - atoms are: 1 0
[22:59:15] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 3
[22:59:15] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:59:16] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 8
[22:59:16] The 2 defining bonds for an atropisomer are co-planar - atoms are: 10 7
[22:59:16] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 10
[22:59:16] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 11
[22:59:17] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 5
[22:59:17] Both bonds on one end of an atropisomer are on the same side - atoms are: 14 11
[22:59:17] Both bonds on one end of a

Processed 730000 molecules...


[22:59:23] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 6
[22:59:25] Explicit valence for atom # 3 Si, 5, is greater than permitted
[22:59:25] Explicit valence for atom # 14 Si, 5, is greater than permitted
[22:59:25] Explicit valence for atom # 5 Si, 5, is greater than permitted
[22:59:25] Explicit valence for atom # 4 Si, 5, is greater than permitted
[22:59:25] Explicit valence for atom # 3 Si, 5, is greater than permitted
[22:59:31] The 2 defining bonds for an atropisomer are co-planar - atoms are: 3 4
[22:59:31] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 0
[22:59:31] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 0


Processed 740000 molecules...


[22:59:33] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 2
[22:59:38] Explicit valence for atom # 2 Si, 5, is greater than permitted
[22:59:38] The 2 defining bonds for an atropisomer are co-planar - atoms are: 4 6
[22:59:38] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 4
[22:59:38] The 2 defining bonds for an atropisomer are co-planar - atoms are: 3 5
[22:59:38] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:59:40] The 2 defining bonds for an atropisomer are co-planar - atoms are: 0 10
[22:59:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[22:59:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:59:41] Both bonds on one end of an atropisomer are on the same side - atoms are: 2 4
[22:59:41] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 1
[22:59:41] Both bonds on one end of an atropisomer are on the s

Processed 750000 molecules...


[22:59:43] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[22:59:44] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 5
[22:59:50] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0
[22:59:50] The 2 defining bonds for an atropisomer are co-planar - atoms are: 14 7
[22:59:50] Both bonds on one end of an atropisomer are on the same side - atoms are: 11 7


Processed 760000 molecules...


[22:59:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 2
[22:59:55] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 6
[22:59:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 2 1
[22:59:56] The 2 defining bonds for an atropisomer are co-planar - atoms are: 2 3
[22:59:56] The 2 defining bonds for an atropisomer are co-planar - atoms are: 3 4
[22:59:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 2
[22:59:56] Both bonds on one end of an atropisomer are on the same side - atoms are: 3 1
[22:59:57] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 0


Processed 770000 molecules...
Processed 780000 molecules...


[23:00:20] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 10
[23:00:20] The 2 defining bonds for an atropisomer are co-planar - atoms are: 16 8
[23:00:21] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 10
[23:00:23] The 2 defining bonds for an atropisomer are co-planar - atoms are: 14 7
[23:00:23] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 10
[23:00:23] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 11
[23:00:23] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 11
[23:00:24] The 2 defining bonds for an atropisomer are co-planar - atoms are: 12 8
[23:00:24] The 2 defining bonds for an atropisomer are co-planar - atoms are: 10 15
[23:00:24] The 2 defining bonds for an atropisomer are co-planar - atoms are: 9 16


Processed 790000 molecules...


[23:00:26] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 11
[23:00:27] Unexpected error hit on line 53128557
[23:00:27] ERROR: moving to the beginning of the next molecule
[23:00:27] The 2 defining bonds for an atropisomer are co-planar - atoms are: 11 5
[23:00:27] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 10
[23:00:28] The 2 defining bonds for an atropisomer are co-planar - atoms are: 9 13
[23:00:28] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[23:00:28] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[23:00:28] The 2 defining bonds for an atropisomer are co-planar - atoms are: 1 2
[23:00:28] The 2 defining bonds for an atropisomer are co-planar - atoms are: 5 12
[23:00:29] The 2 defining bonds for an atropisomer are co-planar - atoms are: 4 9
[23:00:29] The 2 defining bonds for an atropisomer are co-planar - atoms are: 9 4
[23:00:30] The 2 defining bonds for an atropisome

Processed 800000 molecules...


[23:00:36] The 2 defining bonds for an atropisomer are co-planar - atoms are: 15 11
[23:00:38] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 8


Processed 810000 molecules...


[23:00:55] The 2 defining bonds for an atropisomer are co-planar - atoms are: 6 5


Processed 820000 molecules...
Processed 830000 molecules...


[23:01:12] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1
[23:01:13] Explicit valence for atom # 12 Si, 5, is greater than permitted
[23:01:16] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 7


Processed 840000 molecules...


[23:01:17] Both bonds on one end of an atropisomer are on the same side - atoms are: 2 9
[23:01:18] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 5
[23:01:18] Explicit valence for atom # 5 Si, 5, is greater than permitted
[23:01:21] Unexpected error hit on line 56391017
[23:01:21] ERROR: moving to the beginning of the next molecule
[23:01:22] The 2 defining bonds for an atropisomer are co-planar - atoms are: 10 6


Processed 850000 molecules...


[23:01:34] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 8


Processed 860000 molecules...


[23:01:37] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 7
[23:01:39] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 5
[23:01:39] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 5
[23:01:39] The 2 defining bonds for an atropisomer are co-planar - atoms are: 10 9
[23:01:39] Both bonds on one end of an atropisomer are on the same side - atoms are: 9 5
[23:01:39] The 2 defining bonds for an atropisomer are co-planar - atoms are: 10 9
[23:01:39] Both bonds on one end of an atropisomer are on the same side - atoms are: 10 5
[23:01:39] Both bonds on one end of an atropisomer are on the same side - atoms are: 1 3
[23:01:40] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 2
[23:01:40] The 2 defining bonds for an atropisomer are co-planar - atoms are: 0 9
[23:01:40] The 2 defining bonds for an atropisomer are co-planar - atoms are: 14 9
[23:01:43] Explicit valence for atom # 14 Si

Processed 870000 molecules...
Processed 880000 molecules...


[23:02:00] Both bonds on one end of an atropisomer are on the same side - atoms are: 5 3


Processed 890000 molecules...


[23:02:10] Both bonds on one end of an atropisomer are on the same side - atoms are: 6 2
[23:02:12] The 2 defining bonds for an atropisomer are co-planar - atoms are: 6 5
[23:02:12] Both bonds on one end of an atropisomer are on the same side - atoms are: 4 8
[23:02:14] Both bonds on one end of an atropisomer are on the same side - atoms are: 0 1


Finished processing and saved to NPZ!


In [16]:
import numpy as np

# Open the processed molecule archive for a quick sanity check.
# allow_pickle=True lets NumPy unpickle object-dtype arrays; unpickling can
# execute arbitrary code, so only load archives from a trusted source.
# NOTE(review): presumably this file was written by the processing cell with
# dtype=object arrays — confirm, since that cell saves under a different name.
data = np.load(
    r"D:\molecule3d\data\processed\molecules_1st_million.npz",
    allow_pickle=True,
)

# Names of the arrays stored in the archive.
print(data.files)

# Print each stored field for the molecule at index n.
n = 42
for field in ("atom_types", "coords", "smiles", "selfies"):
    print(data[field][n])

['atom_types', 'coords', 'smiles', 'selfies']
['C', 'C', 'O', 'O', 'C', 'O', 'O', 'O', 'H', 'H', 'H', 'H']
[[0.7266, -0.0447, -0.0413], [0.1404, -0.6432, -1.3245], [-1.0468, -0.8979, -1.4122], [1.017, -0.8491, -2.2972], [0.3713, -0.9147, 1.1829], [1.2331, -1.1713, 1.9948], [-0.8935, -1.3019, 1.2849], [2.1213, 0.0962, -0.1485], [0.2426, 0.9341, 0.1009], [1.896, -0.593, -1.9344], [-1.3508, -1.1242, 0.4253], [2.4855, -0.3245, 0.6604]]
[H]OC(=O)C([H])(O[H])C(=O)O[H]
[H][O][C][=Branch1][C][=O][C][Branch1][C][H][Branch1][Ring1][O][H][C][=Branch1][C][=O][O][H]
