# Building POM-Terphenyl Polymers using mbuild

Here we use `mbuild` to read in a SMILES string of a terphenyl monomer and build an n-residue polymer from the monomer.

In [1]:
import mbuild as mb
import numpy as np
from mbuild.lib.recipes.polymer import Polymer
import subprocess



First we get the POM-terphenyl monomer from a smiles string.

In [2]:
comp = mb.load('COc3ccc(c1cccc(C=O)c1)c(c2ccc([C@@H](C)N)cc2)c3', smiles = True, name="POM")

I output all the indexes of hydrogen atoms because we will uses these indexes for extending the polymer later on.

In [3]:
for i, atom in enumerate(comp):
    if atom.name == "H":
        print(i, atom)

25 <H pos=([-0.2619 -0.6738 -0.1057]), 1 bonds, id: 139769099224256>
26 <H pos=([-0.3272 -0.5848  0.0369]), 1 bonds, id: 139769099223536>
27 <H pos=([-0.3757 -0.5363 -0.1318]), 1 bonds, id: 139769099223488>
28 <H pos=([-0.3936 -0.3462  0.0261]), 1 bonds, id: 139769105986896>
29 <H pos=([-0.3904 -0.1125  0.0952]), 1 bonds, id: 139769105986176>
30 <H pos=([-0.0188  0.0341  0.2297]), 1 bonds, id: 139769105988288>
31 <H pos=([-0.0211  0.2676  0.3082]), 1 bonds, id: 139769105989008>
32 <H pos=([-0.1868  0.4276  0.2205]), 1 bonds, id: 139769099224112>
33 <H pos=([-0.3797  0.483   0.0736]), 1 bonds, id: 139769099225216>
34 <H pos=([-0.3514  0.1181 -0.0307]), 1 bonds, id: 139769099226080>
35 <H pos=([ 0.1831 -0.1982  0.0834]), 1 bonds, id: 139769099227136>
36 <H pos=([ 0.3893 -0.0704  0.0507]), 1 bonds, id: 139769105988192>
37 <H pos=([ 0.4012  0.2527 -0.1548]), 1 bonds, id: 139769105989104>
38 <H pos=([0.5627 0.2867 0.0274]), 1 bonds, id: 139769105986752>
39 <H pos=([0.5016 0.1413 0.115 ]), 1

`mbuild` comes with a nice tool to visualize Compounds built into jupyter-notebooks. Using the object from `py3Dmol` we can coloro the atoms to identify the indices needed to make substiutions when building the polymer.

In [4]:
view = comp.visualize(show_ports=True)
style = {
                "stick": {"radius": 0.2, "color": "grey"},
                "sphere": {"scale": 0.3, "color" : "black"},
    }
view.setStyle({'model': -1, 'serial':43},style)
view.setStyle({'model': -1, 'serial':34},style)

  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(


<py3Dmol.view at 0x7f1e87e2e3e0>

We also make the two capping compounds using SMILES strings:

In [5]:
cap_o = mb.load('CO', smiles = True)
cap_o.visualize()

  warn(
  warn(
  warn(
  warn(
  warn(
  warn(


<py3Dmol.view at 0x7f1e8785e410>

In [6]:
cap_n = mb.load('CC(C)(C)OC=O', smiles = True)
cap_n.visualize()

  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(


<py3Dmol.view at 0x7f1e8785f0a0>

Here we use the `Polymer` object to build a hexamer from the molecules we built in the previous cells. `Polymer.add_monomer()` is used to add the monomers to the polymer object. `Polymer.add_end_groups()` adds the capping groups to the object with `"head"` and `"tail"` labels for the each end of the polymer. `replace = True` will replace the specified atoms with the next residue. `indices` is used to specify which atom will be replaced in each group. Finally, when we call `Polymer.build()`, the polymer is built with the specified `n` residues and the provided capping residues. `sequence` is used if multiple monomers are provided.

In [7]:
chain = Polymer()
chain.add_monomer(compound=comp,
                  indices=[33, 42],
                  separation=.15,
                  replace=True,
                  # orientation = [[1,0,0],[1,0,0]]
                 )
chain.add_end_groups(compound = cap_o,
                     index = -1,
                     separation=0.15,
                     label="head",
                     duplicate = False
                    )

chain.add_end_groups(compound = cap_n,
                     index = -1,
                     separation=0.15,
                     label="tail",
                     duplicate = False
                    )

chain.build(n=6, sequence='A')

In [8]:
chain.visualize(show_ports=True)

  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(


<py3Dmol.view at 0x7f1e855bd480>

Next we add specific residue labels for the componenets of the `Polymer` object. Here we label the monomers as HEX and the capping moieties as CAP.

In [9]:
print(chain.labels)
for label in chain.labels["monomer"]:
    label.name = "HEX"
    print(label)
for label in chain.labels["Compound"]:
    label.name = "CAP"
    print(label)

OrderedDict([('monomer', [<Compound 44 particles, 46 bonds, non-periodic, id: 139769063334832>, <Compound 44 particles, 46 bonds, non-periodic, id: 139769063504864>, <Compound 44 particles, 46 bonds, non-periodic, id: 139769099439216>, <Compound 44 particles, 46 bonds, non-periodic, id: 139769099440080>, <Compound 44 particles, 46 bonds, non-periodic, id: 139769063911104>, <Compound 44 particles, 46 bonds, non-periodic, id: 139769064136976>]), ('monomer[0]', <Compound 44 particles, 46 bonds, non-periodic, id: 139769063334832>), ('monomer[1]', <Compound 44 particles, 46 bonds, non-periodic, id: 139769063504864>), ('monomer[2]', <Compound 44 particles, 46 bonds, non-periodic, id: 139769099439216>), ('monomer[3]', <Compound 44 particles, 46 bonds, non-periodic, id: 139769099440080>), ('monomer[4]', <Compound 44 particles, 46 bonds, non-periodic, id: 139769063911104>), ('monomer[5]', <Compound 44 particles, 46 bonds, non-periodic, id: 139769064136976>), ('Compound', [<Compound 5 particles,

We save these as a pdb file and provide the names of the residues to include in the file.

In [10]:
chain.save("pom_hexamer_mbuild.pdb", overwrite=True, residues=["HEX", "CAP"])

  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(


Using Gromacs I generate a new gro file with the correct residue labels. `mbuild` doesn't seem to label residues correctly when writing `.gro` files.

In [11]:
! gmx editconf -f pom_hexamer_mbuild.pdb -o pom_hexamer_mbuild.gro

                     :-) GROMACS - gmx editconf, 2022.4 (-:

Executable:   /usr/local/bin/gmx
Data prefix:  /usr/local
Working dir:  /home/tfobe/Research/heteropolymer_simulations/examples/build_polymer/pom
Command line:
  gmx editconf -f pom_hexamer_mbuild.pdb -o pom_hexamer_mbuild.gro

Note that major changes are planned in future for editconf, to improve usability and utility.
Read 285 atoms
Volume: 66.981 nm^3, corresponds to roughly 30100 electrons
No velocities found

Back Off! I just backed up pom_hexamer_mbuild.gro to ./#pom_hexamer_mbuild.gro.2#

GROMACS reminds you: "Misslycka kan man med all kod" (Mats Nylen)



Lastly, I use openBabel to generate a `.mol` file for use in the OpenFF parameter assignment workflow.

In [12]:
! obabel -ipdb pom_hexamer_mbuild.pdb -omol pom_hexamer_mbuild.mol -O pom_hexamer_mbuild.mol

*** Open Babel Error  in ReadMolecule
  ERROR: not a valid PDB file

1 molecule converted


In [14]:
n_residues = [4,6,8,10]
residue_labels = ["TET", "HEX", "OCT", "DEC"]
file_names = ["pom_tetramer_mbuild", "pom_hexamer_mbuild", "pom_octamer_mbuild", "pom_decamer_mbuild"]
for i in range(len(n_residues)):
    # Generate polymer
    chain = Polymer()
    chain.add_monomer(compound=comp,
                      indices=[25, 40],
                      separation=.15,
                      replace=True,
                      # orientation = [[0,-1,0],[1,0,0]]
                     )
    chain.add_end_groups(compound = cap_o,
                         index = -1,
                         separation=0.15,
                         label="head",
                         duplicate = False
                        )

    chain.add_end_groups(compound = cap_n,
                         index = -1,
                         separation=0.15,
                         label="tail",
                         duplicate = False
                        )

    chain.build(n=n_residues[i], sequence='A')

    # Rotate peptide bond
    for bond in chain.bonds():
        if bond[0].name == "N":
            if bond[1].n_direct_bonds == 3:
                print("Rotating bond:", bond, "by", np.pi/2)
                chain.rotate_dihedral(bond, np.pi/2)

        if bond[1].name == "N":
            if bond[0].n_direct_bonds == 3:
                print("Rotating bond:", bond, "by", np.pi/2)
                chain.rotate_dihedral(bond, np.pi/2)  


    # Relabel chains
    for label in chain.labels["monomer"]:
        label.name = residue_labels[i]
        print(label)
    for label in chain.labels["Compound"]:
        label.name = "CAP"
        print(label)
            
            
    chain.save(file_names[i] + ".pdb", overwrite=True, residues=[residue_labels[i], "CAP"])
    
    subprocess.run(["gmx", "editconf", "-f", file_names[i] + ".pdb", "-o", file_names[i]+ ".gro"])
    subprocess.run(["obabel", "-ipdb", file_names[i] + ".pdb", "-omol", file_names[i] + ".mol",  "-O", file_names[i] + ".mol"])
    subprocess.run(["renumber_pdb_atoms", "-f", file_names[i] + ".pdb", "-o", file_names[i] + "_renum.pdb"])

<TET 44 particles, 46 bonds, non-periodic, id: 139769782695296>
<TET 44 particles, 46 bonds, non-periodic, id: 139769782692800>
<TET 44 particles, 46 bonds, non-periodic, id: 139769782937312>
<TET 44 particles, 46 bonds, non-periodic, id: 139769783040656>
<CAP 5 particles, 4 bonds, non-periodic, id: 139769099234912>
<CAP 16 particles, 15 bonds, non-periodic, id: 139769782685504>
Note that major changes are planned in future for editconf, to improve usability and utility.
Read 197 atoms
Volume: 27.7809 nm^3, corresponds to roughly 12500 electrons
No velocities found


  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(


*** Open Babel Error  in ReadMolecule
  ERROR: not a valid PDB file

1 molecule converted


<HEX 44 particles, 46 bonds, non-periodic, id: 139769781740992>
<HEX 44 particles, 46 bonds, non-periodic, id: 139769783728688>
<HEX 44 particles, 46 bonds, non-periodic, id: 139769786090064>
<HEX 44 particles, 46 bonds, non-periodic, id: 139769786008096>
<HEX 44 particles, 46 bonds, non-periodic, id: 139769787590560>
<HEX 44 particles, 46 bonds, non-periodic, id: 139769063855904>
<CAP 5 particles, 4 bonds, non-periodic, id: 139769781561920>
<CAP 16 particles, 15 bonds, non-periodic, id: 139769781554576>
Note that major changes are planned in future for editconf, to improve usability and utility.
Read 285 atoms
Volume: 60.1881 nm^3, corresponds to roughly 27000 electrons
No velocities found


  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(


*** Open Babel Error  in ReadMolecule
  ERROR: not a valid PDB file

1 molecule converted


<OCT 44 particles, 46 bonds, non-periodic, id: 139769781841264>
<OCT 44 particles, 46 bonds, non-periodic, id: 139769781843136>
<OCT 44 particles, 46 bonds, non-periodic, id: 139769785925584>
<OCT 44 particles, 46 bonds, non-periodic, id: 139769785269024>
<OCT 44 particles, 46 bonds, non-periodic, id: 139769785482928>
<OCT 44 particles, 46 bonds, non-periodic, id: 139769785496048>
<OCT 44 particles, 46 bonds, non-periodic, id: 139769784155392>
<OCT 44 particles, 46 bonds, non-periodic, id: 139769784401152>
<CAP 5 particles, 4 bonds, non-periodic, id: 139769783321792>
<CAP 16 particles, 15 bonds, non-periodic, id: 139769783331776>
Note that major changes are planned in future for editconf, to improve usability and utility.
Read 373 atoms
Volume: 69.5382 nm^3, corresponds to roughly 31200 electrons
No velocities found


  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(


*** Open Babel Error  in ReadMolecule
  ERROR: not a valid PDB file

1 molecule converted


<DEC 44 particles, 46 bonds, non-periodic, id: 139769780508304>
<DEC 44 particles, 46 bonds, non-periodic, id: 139769780507440>
<DEC 44 particles, 46 bonds, non-periodic, id: 139769780599728>
<DEC 44 particles, 46 bonds, non-periodic, id: 139769780740992>
<DEC 44 particles, 46 bonds, non-periodic, id: 139769780878976>
<DEC 44 particles, 46 bonds, non-periodic, id: 139769781228576>
<DEC 44 particles, 46 bonds, non-periodic, id: 139769779397648>
<DEC 44 particles, 46 bonds, non-periodic, id: 139769779404608>
<DEC 44 particles, 46 bonds, non-periodic, id: 139769779873024>
<DEC 44 particles, 46 bonds, non-periodic, id: 139769779496288>
<CAP 5 particles, 4 bonds, non-periodic, id: 139769782377376>
<CAP 16 particles, 15 bonds, non-periodic, id: 139769782384240>


  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(
  warn(


Note that major changes are planned in future for editconf, to improve usability and utility.
Read 461 atoms
Volume: 82.5012 nm^3, corresponds to roughly 37100 electrons
No velocities found


*** Open Babel Error  in ReadMolecule
  ERROR: not a valid PDB file

1 molecule converted
