Permalink
Cannot retrieve contributors at this time
Fetching contributors…
| <?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD v1.1d1 20130915//EN" "JATS-archivearticle1.dtd"><article article-type="research-article" dtd-version="1.1d1" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink"><front><journal-meta><journal-id journal-id-type="nlm-ta">elife</journal-id><journal-id journal-id-type="hwp">eLife</journal-id><journal-id journal-id-type="publisher-id">eLife</journal-id><journal-title-group><journal-title>eLife</journal-title></journal-title-group><issn publication-format="electronic">2050-084X</issn><publisher><publisher-name>eLife Sciences Publications, Ltd</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">01370</article-id><article-id pub-id-type="doi">10.7554/eLife.01370</article-id><article-categories><subj-group subj-group-type="display-channel"><subject>Research article</subject></subj-group><subj-group subj-group-type="heading"><subject>Biophysics and structural biology</subject></subj-group></article-categories><title-group><article-title>Encounter complexes and dimensionality reduction in protein–protein association</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes" id="author-7092"><name><surname>Kozakov</surname><given-names>Dima</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="corresp" rid="cor1">*</xref><xref ref-type="other" rid="par-1"/><xref ref-type="other" rid="par-4"/><xref ref-type="other" rid="par-5"/><xref ref-type="other" rid="par-6"/><xref ref-type="fn" rid="con1"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" equal-contrib="yes" id="author-8128"><name><surname>Li</surname><given-names>Keyong</given-names></name><xref ref-type="aff" rid="aff2"/><xref ref-type="aff" rid="aff3"/><xref ref-type="fn" rid="equal-contrib">†</xref><xref ref-type="fn" rid="con2"/><xref ref-type="fn" rid="conf5"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" equal-contrib="yes" id="author-8121"><name><surname>Hall</surname><given-names>David R</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="fn" rid="equal-contrib">†</xref><xref ref-type="fn" rid="con3"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" id="author-8122"><name><surname>Beglov</surname><given-names>Dmitri</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="fn" rid="con4"/><xref ref-type="fn" rid="conf3"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" id="author-8123"><name><surname>Zheng</surname><given-names>Jiefu</given-names></name><xref ref-type="aff" rid="aff2"/><xref ref-type="fn" rid="con9"/><xref ref-type="fn" rid="conf5"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" id="author-8124"><name><surname>Vakili</surname><given-names>Pirooz</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="aff" rid="aff4"/><xref ref-type="fn" rid="con5"/><xref ref-type="fn" rid="conf5"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" id="author-8125"><name><surname>Schueler-Furman</surname><given-names>Ora</given-names></name><xref ref-type="aff" rid="aff5"/><xref ref-type="other" rid="par-5"/><xref ref-type="fn" rid="con6"/><xref ref-type="fn" rid="conf5"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" corresp="yes" id="author-8117"><name><surname>Paschalidis</surname><given-names>Ioannis Ch</given-names></name><xref ref-type="aff" rid="aff2"/><xref ref-type="aff" rid="aff3"/><xref ref-type="corresp" rid="cor3">*</xref><xref ref-type="other" rid="par-1"/><xref ref-type="fn" rid="con7"/><xref ref-type="fn" rid="conf5"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" corresp="yes" id="author-8118"><name><surname>Clore</surname><given-names>G Marius</given-names></name><xref ref-type="aff" rid="aff6"/><xref ref-type="corresp" rid="cor4">*</xref><xref ref-type="other" rid="par-3"/><xref ref-type="fn" rid="con8"/><xref ref-type="fn" rid="conf5"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" corresp="yes" id="author-8119"><name><surname>Vajda</surname><given-names>Sandor</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff7"/><xref ref-type="corresp" rid="cor2">*</xref><xref ref-type="other" rid="par-2"/><xref ref-type="other" rid="par-4"/><xref ref-type="fn" rid="con10"/><xref ref-type="fn" rid="conf4"/><xref ref-type="other" rid="dataro1"/></contrib><aff id="aff1"><institution content-type="dept">Department of Biomedical Engineering</institution>, <institution>Boston University</institution>, <addr-line><named-content content-type="city">Boston</named-content></addr-line>, <country>United States</country></aff><aff id="aff2"><institution content-type="dept">Department of Electrical and Computer Engineering</institution>, <institution>Boston University</institution>, <addr-line><named-content content-type="city">Boston</named-content></addr-line>, <country>United States</country></aff><aff id="aff3"><institution content-type="dept">Division of Systems Engineering</institution>, <institution>Boston University</institution>, <addr-line><named-content content-type="city">Boston</named-content></addr-line>, <country>United States</country></aff><aff id="aff4"><institution content-type="dept">Department of Mechanical Engineering</institution>, <institution>Boston University</institution>, <addr-line><named-content content-type="city">Boston</named-content></addr-line>, <country>United States</country></aff><aff id="aff5"><institution content-type="dept">Department of Microbiology and Molecular Genetics</institution>, <institution>Hadassah Medical School, The Hebrew University of Jerusalem</institution>, <addr-line><named-content content-type="city">Jerusalem</named-content></addr-line>, <country>Israel</country></aff><aff id="aff6"><institution content-type="dept">Laboratory of Chemical Physics</institution>, <institution>National Institute of Diabetes and Digestive and Kidney Diseases, National Institutes of Health</institution>, <addr-line><named-content content-type="city">Bethesda</named-content></addr-line>, <country>United States</country></aff><aff id="aff7"><institution content-type="dept">Department of Chemistry</institution>, <institution>Boston University</institution>, <addr-line><named-content content-type="city">Boston</named-content></addr-line>, <country>United States</country></aff></contrib-group><contrib-group content-type="section"><contrib contrib-type="editor"><name><surname>Roux</surname><given-names>Benoit</given-names></name><role>Reviewing editor</role><aff><institution>University of Chicago</institution>, <country>United States</country></aff></contrib></contrib-group><author-notes><corresp id="cor1"><label>*</label>For correspondence: <email>midas@bu.edu</email> (DK);</corresp><corresp id="cor2"><label>*</label>For correspondence: <email>vajda@bu.edu</email> (SV);</corresp><corresp id="cor3"><label>*</label>For correspondence: <email>yannisp@bu.edu</email> (ICP);</corresp><corresp id="cor4"><label>*</label>For correspondence: <email>mariusc@intra.niddk.nih.gov</email> (GMC)</corresp><fn fn-type="con" id="equal-contrib"><label>†</label><p>These authors contributed equally to this work</p></fn></author-notes><pub-date date-type="pub" publication-format="electronic"><day>08</day><month>04</month><year>2014</year></pub-date><pub-date pub-type="collection"><year>2014</year></pub-date><volume>3</volume><elocation-id>e01370</elocation-id><history><date date-type="received"><day>14</day><month>08</month><year>2013</year></date><date date-type="accepted"><day>22</day><month>02</month><year>2014</year></date></history><permissions><license xlink:href="http://creativecommons.org/publicdomain/zero/1.0/"><license-p>This is an open-access article, free of all copyright, and may be freely reproduced, distributed, transmitted, modified, built upon, or otherwise used by anyone for any lawful purpose. The work is made available under the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/publicdomain/zero/1.0/">Creative Commons CC0 public domain dedication</ext-link>.</license-p></license></permissions><self-uri content-type="pdf" xlink:href="elife01370.pdf"/><abstract><object-id pub-id-type="doi">10.7554/eLife.01370.001</object-id><p>An outstanding challenge has been to understand the mechanism whereby proteins associate. We report here the results of exhaustively sampling the conformational space in protein–protein association using a physics-based energy function. The agreement between experimental intermolecular paramagnetic relaxation enhancement (PRE) data and the PRE profiles calculated from the docked structures shows that the method captures both specific and non-specific encounter complexes. To explore the energy landscape in the vicinity of the native structure, the nonlinear manifold describing the relative orientation of two solid bodies is projected onto a Euclidean space in which the shape of low energy regions is studied by principal component analysis. Results show that the energy surface is canyon-like, with a smooth funnel within a two dimensional subspace capturing over 75% of the total motion. Thus, proteins tend to associate along preferred pathways, similar to sliding of a protein along DNA in the process of protein-DNA recognition.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.001">http://dx.doi.org/10.7554/eLife.01370.001</ext-link></p></abstract><abstract abstract-type="executive-summary"><object-id pub-id-type="doi">10.7554/eLife.01370.002</object-id><title>eLife digest</title><p>Proteins rarely act alone. Instead, they tend to bind to other proteins to form structures known as complexes. When two proteins come together to form a complex, they twist and turn through a series of intermediate states before they form the actual complex. These intermediate states are difficult to study because they don’t last for very long, which means that our knowledge of how complexes are formed remains incomplete.</p><p>One promising approach for studying the formation of complexes is called paramagnetic relaxation enhancement. In this technique certain areas in one of the proteins are labelled with magnetic particles, which produce signals when the two proteins are close to each other. Repeating the measurement several times with the magnetic particles in different positions provides information about the overall structure of the complex. Computational modelling can then be used to work out the fine details of the structure, including the shapes of the intermediate structures made by the proteins as they interact.</p><p>A computer method called docking can be used to predict the most favourable positions that the proteins can take, relative to one another, in a complex. This involves calculating the energy contained in the system, with the correct structure having the lowest energy. Docking methods also predict protein models with slightly higher energies, but with structures that are radically different. Modellers usually ignore these structures, but comparing the docking results to paramagnetic relaxation enhancement data, Kozakov et al. found that these structures actually represent the intermediate states.</p><p>Analysing the structure of the intermediate states revealed that the movement of the two proteins relative to one another is severely restricted as they form the final complex. Kozakov et al. found that proteins associate along preferred pathways, similar to the way a protein slides along DNA in the process of protein-DNA recognition. Knowing that the movement of the proteins is restricted in this way will enable researchers to improve the efficiency of docking calculations.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.002">http://dx.doi.org/10.7554/eLife.01370.002</ext-link></p></abstract><kwd-group kwd-group-type="author-keywords"><title>Author keywords</title><kwd>encounter landscapes</kwd><kwd>FFT sampling</kwd><kwd>protein–protein interactions</kwd></kwd-group><kwd-group kwd-group-type="research-organism"><title>Research organism</title><kwd>none</kwd></kwd-group><funding-group><award-group id="par-1"><funding-source><institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/100000002</institution-id><institution>National Institutes of Health</institution></institution-wrap></funding-source><award-id>GM93147</award-id><principal-award-recipient><name><surname>Kozakov</surname><given-names>Dima</given-names></name><name><surname>Paschalidis</surname><given-names>Ioannis Ch</given-names></name></principal-award-recipient></award-group><award-group id="par-2"><funding-source><institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/100000002</institution-id><institution>National Institutes of Health</institution></institution-wrap></funding-source><award-id>GM61867</award-id><principal-award-recipient><name><surname>Vajda</surname><given-names>Sandor</given-names></name></principal-award-recipient></award-group><award-group id="par-3"><funding-source><institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/100000002</institution-id><institution>National Institutes of Health</institution></institution-wrap></funding-source><award-id>Intramural program of NIDDK</award-id><principal-award-recipient><name><surname>Clore</surname><given-names>G Marius</given-names></name></principal-award-recipient></award-group><award-group id="par-4"><funding-source><institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/100000001</institution-id><institution>National Science Foundation</institution></institution-wrap></funding-source><award-id>DBI1147082</award-id><principal-award-recipient><name><surname>Kozakov</surname><given-names>Dima</given-names></name><name><surname>Vajda</surname><given-names>Sandor</given-names></name></principal-award-recipient></award-group><award-group id="par-5"><funding-source><institution-wrap><institution>US Israel Binational Science Foundation</institution></institution-wrap></funding-source><award-id>2009418</award-id><principal-award-recipient><name><surname>Kozakov</surname><given-names>Dima</given-names></name><name><surname>Schueler-Furman</surname><given-names>Ora</given-names></name></principal-award-recipient></award-group><award-group id="par-6"><funding-source><institution-wrap><institution>Russian Ministry of Education and Science</institution></institution-wrap></funding-source><award-id>14.A18.21.1973</award-id><principal-award-recipient><name><surname>Kozakov</surname><given-names>Dima</given-names></name></principal-award-recipient></award-group><funding-statement>The funders had no role in study design, data collection and interpretation, or the decision to submit the work for publication.</funding-statement></funding-group><custom-meta-group><custom-meta><meta-name>elife-xml-version</meta-name><meta-value>2</meta-value></custom-meta><custom-meta specific-use="meta-only"><meta-name>Author impact statement</meta-name><meta-value>Analysis of protein–protein encounter complexes shows that proteins associate along preferred pathways, similar to the sliding of a protein along DNA.</meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Interactions between proteins play a central role in various aspects of the structural and functional organization of the cell. To recognize its partner, a protein must align its binding interface, usually a small fraction of the total surface, with a similarly small binding interface on the other protein (<xref ref-type="bibr" rid="bib3">Berg and von Hippel, 1985</xref>; <xref ref-type="bibr" rid="bib46">Ubbink, 2009</xref>). Since all interactions are of relatively short range, the process must start with a diffusive search governed by Brownian motion, which brings the proteins to a ‘macrocollision’ to yield a transition state also known as the encounter complex (<xref ref-type="bibr" rid="bib3">Berg and von Hippel, 1985</xref>; <xref ref-type="bibr" rid="bib48">von Hippel and Berg, 1989</xref>). The encounter complex can be thought of as an ensemble of conformations in which the two molecules can rotationally diffuse along each other, or participate in a series of ‘microcollisions’ that properly align the reactive groups. The second step of association consists of conformational rearrangements to the native complex. While it has been generally recognized that association proceeds through a transition state, little was known of the encounter complex structures and configurations as their populations are low, their lifetimes are short, and they are difficult to trap, rendering them essentially invisible to conventional structural and biophysical methods (<xref ref-type="bibr" rid="bib19">Iwahara and Clore, 2006</xref>).</p><p>Novel experimental and improved computational methods, developed during the last decade, have the potential to provide information leading to better understanding of the nature of encounter complexes. On the experimental side, the major progress is due to the application of NMR paramagnetic relaxation enhancement (PRE), a technique that is exquisitely sensitive to the presence of lowly populated states in the fast exchange regime (<xref ref-type="bibr" rid="bib9">Clore, 2008</xref>; <xref ref-type="bibr" rid="bib10">Clore and Iwahara, 2009</xref>; <xref ref-type="bibr" rid="bib13">Fawzi et al., 2010</xref>). The detection of such intermediates requires introducing paramagnetic labels, one at a time, at a few sites on one of the interacting proteins, and measuring the transverse paramagnetic relaxation enhancement (PRE) rates, <italic>Γ</italic><sub>2</sub>, of the backbone amide protons (<sup>1</sup>H<sub>N</sub>) of the partner protein (<xref ref-type="bibr" rid="bib44">Tang et al., 2006</xref>). In a fast exchanging system, the observed value of <italic>Γ</italic><sub><italic>2</italic></sub> is the weighted average of the values for the various states present in solution (<xref ref-type="bibr" rid="bib20">Iwahara et al., 2004</xref>; <xref ref-type="bibr" rid="bib19">Iwahara and Clore, 2006</xref>). Because <italic>Γ</italic><sub>2</sub> is dependent on the inverse sixth power of the distance (<<italic>r</italic><sup>−6</sup>>) between the unpaired electron on the paramagnetic center and the observed proton, and because the <italic>Γ</italic><sub>2</sub> rates at short distances are very large owing to the large magnetic moment of the unpaired electrons, low-population intermediates can be detected. In particular, the observed intermolecular <sup>1</sup>H<sub>N</sub>−<italic>Γ</italic><sub>2</sub> rates and those back-calculated from the structure of the native complex generally differ for a number of residues, revealing regions that participate in transitional interactions (<xref ref-type="bibr" rid="bib44">Tang et al., 2006</xref>).</p><p>Paramagnetic relaxation enhancement (PRE) techniques can provide distributions of distances between a paramagnetic ion and protons, indicating the presence and relative ratio of conformational sub-ensembles (<xref ref-type="bibr" rid="bib44">Tang et al., 2006</xref>; <xref ref-type="bibr" rid="bib42">Suh et al., 2007</xref>; <xref ref-type="bibr" rid="bib10">Clore and Iwahara, 2009</xref>; <xref ref-type="bibr" rid="bib13">Fawzi et al., 2010</xref>), but determining the detailed structure of encounter complexes requires computational approaches. A semi-quantitative depiction of the minor species can be obtained by using restrained rigid-body simulated annealing refinement to minimize the difference between observed and calculated <sup>1</sup>H<sub>N</sub>−<italic>Γ</italic><sub>2</sub> rates (<xref ref-type="bibr" rid="bib44">Tang et al., 2006</xref>; <xref ref-type="bibr" rid="bib22">Kim et al., 2008</xref>). However, with the development of docking methods it is possible to globally sample the entire conformational space of two interacting proteins, generating all low energy states. Although in some cases binding is inherently coupled with folding (<xref ref-type="bibr" rid="bib38">Shoemaker et al., 2000</xref>; <xref ref-type="bibr" rid="bib51">Zheng et al., 2012</xref>), a large class of protein complexes can be adequately described by a model that assumes essentially rigid association, possibly followed by refinement that allows for local changes in side chains and interacting loops (<xref ref-type="bibr" rid="bib39">Smith and Sternberg, 2002</xref>; <xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>; <xref ref-type="bibr" rid="bib47">Vajda and Kozakov, 2009</xref>). As demonstrated by the results of CAPRI (Critical Assessment of Prediction of Interactions) communitywide protein docking experiment, for such cases modern computational docking methods, including automated servers, are capable of generating docked conformations that agree well with the X-ray structure of the complex (<xref ref-type="bibr" rid="bib28">Lensink and Wodak, 2013</xref>). In particular, our program PIPER, based on the Fast Fourier transform (FFT) correlation approach, globally and systematically samples the conformational space of two interacting proteins on a dense grid using a physics based energy function (<xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>). The program is implemented in the heavily used server ClusPro (<xref ref-type="bibr" rid="bib11">Comeau et al., 2007</xref>), which yields good results when docking X-ray structures of two proteins with at most moderate backbone conformational changes upon binding (<xref ref-type="bibr" rid="bib25">Kozakov et al., 2010</xref>). Based on the results of CAPRI, Cluspro has been the best protein–protein docking server for the last 5 years (<xref ref-type="bibr" rid="bib23">Kozakov et al., 2013</xref>; <xref ref-type="bibr" rid="bib28">Lensink and Wodak, 2013</xref>).</p><p>It is well known that, in addition to near-native structures, docking generally yields a large number of models that are similar to near-native ones in terms of energy, but may substantially differ in terms of geometry (<xref ref-type="bibr" rid="bib47">Vajda and Kozakov, 2009</xref>). Since such ‘false positive’ models do not predict the final bound complex, they are usually regarded as artifacts. However, using molecular mechanics energy functions without ‘built-in’ information on the native state it is reasonable to assume that the alternative low energy models represent encounter complexes that, in view of their favorable interactions, may occur along association pathways. Accordingly, we show here that using the large ensemble of low energy structures generated by docking provides better approximation of experimental PRE profiles than the one calculated only from the coordinates of the final complex. Since in docking calculations we start from unbound protein structures and systematically sample the entire conformational space, based on this result we can easily generate ensembles of encounter complexes for any pair of associating proteins.</p><p>Once it is established that the energy function used for sampling the conformational space enables us to accurately predict both the native state and the ensemble of encounter complexes, and thus the energy function is valid beyond selecting the native structure of the complex, we proceed to characterizing the energy landscape in the 6D translational/rotational space near the native state (<xref ref-type="bibr" rid="bib29">McCammon, 1998</xref>; <xref ref-type="bibr" rid="bib5">Camacho et al., 1999</xref>; <xref ref-type="bibr" rid="bib50">Zhang et al., 1999</xref>; <xref ref-type="bibr" rid="bib45">Tovchigrechko and Vakser, 2001</xref>). We focus on the main binding funnel in a neighborhood of the native state, which is the most important region of the conformational space, containing over 90% of complex structures observed in the PRE experiments (<xref ref-type="bibr" rid="bib19">Iwahara and Clore, 2006</xref>; <xref ref-type="bibr" rid="bib44">Tang et al., 2006</xref>; <xref ref-type="bibr" rid="bib10">Clore and Iwahara, 2009</xref>; <xref ref-type="bibr" rid="bib13">Fawzi et al., 2010</xref>). Since rigid body association occurs in a low dimensional space, the shape of the binding energy landscape can be studied in detail, in contrast to protein folding, which occurs in a very high dimensional space (<xref ref-type="bibr" rid="bib12a">Dill and Chan, 1997</xref>). In spite of the low dimensionality, the analysis is far from simple in this highly curved space due to the interdependence of the coordinates (<xref ref-type="bibr" rid="bib32">Park, 1995</xref>; <xref ref-type="bibr" rid="bib33">Park and Ravani, 1997</xref>; <xref ref-type="bibr" rid="bib37">Shen et al., 2008</xref>; <xref ref-type="bibr" rid="bib30">Mirzaei et al., 2012</xref>). However, one can transform the rotational space into a product of axis-angle representations using complex exponentials (<xref ref-type="bibr" rid="bib33">Park and Ravani, 1997</xref>). These so-called exponential parameters create a local one-to-one mapping between the nonlinear manifold of potential conformations and an Euclidean space (<xref ref-type="bibr" rid="bib30">Mirzaei et al., 2012</xref>), and thus the shape of low energy regions in the conformational space can be studied by classical principal component analysis (PCA) in the Euclidean space. Using PCA we will be able to determine whether any subspace can accommodate a large fraction of the structures, and whether there are energy barriers that restrict the distribution of encounter complexes in the vicinity of the native state.</p><p>The most important result of our analysis is that the region of the space in a neighborhood of the native state invariably includes high energy barriers preventing the ligand from moving into a one- or two-dimensional restrictive subspace. Orthogonal to the restrictive subspace is a permissive subspace, in which the energy is relatively flat. Based on these results one can visualize the energy landscape as resembling a canyon-like terrain where the low energy areas (at the bottom of the canyon) lie in a lower dimensional subspace. Thus, within the range of physical interactions, two proteins sample only relatively small fractions of the conformational space, and converge toward the native state along preferred pathways. This result represents information that, in principle, could have been obtained by running molecular dynamics or Brownian dynamics simulations. However, a sufficiently dense sampling of conformational space by molecular dynamics is computationally very demanding, even when restricting considerations to a neighborhood of the native state (<xref ref-type="bibr" rid="bib49">Wang and Wade, 2003</xref>), whereas Brownian dynamics simulations usually rely on highly simplified protein models (<xref ref-type="bibr" rid="bib4">Camacho et al., 2000</xref>; <xref ref-type="bibr" rid="bib40">Spaar and Helms, 2005</xref>). In contrast, we use detailed all-atom models and map the energy surface using two different physics-based energy functions. As will be shown, these differences do not significantly affect the results of the principal component analysis, suggesting that the reduction of dimensionality is an inherent property of the free energy landscape in protein–protein association.</p></sec><sec id="s2" sec-type="results"><title>Results</title><sec id="s2-1"><title>Prediction of encounter complex ensembles</title><p>We focused on the modeling of the association between the N-terminal domain of Enzyme I (EIN) and the histidine-containing phosphocarrier protein (HPr) (<xref ref-type="fig" rid="fig1">Figure 1A</xref>), because the complex has been studied in a series of PRE titration experiments (<xref ref-type="bibr" rid="bib13">Fawzi et al., 2010</xref>). Specific association between the two proteins occurs in the first step of the bacterial phosphotransfer system, resulting in phosphoryl transfer between EIN and HPr upon proper alignment of active site histidines of the two sides of the interface (<xref ref-type="bibr" rid="bib15">Garrett et al., 1999</xref>). The binding has an equilibrium dissociation constant of 4.3 μM (<xref ref-type="bibr" rid="bib41">Suh et al., 2008</xref>). For the computational study of encounter complexes we have placed the center of EIN at the origin of a coordinate system, and systematically sampled the entire rotational/translational space of HPr. Unbound structures were used both for the receptor, EIN (chain A from PDB entry 1ZYM) and for the ligand, HPr (chain P from PDB entry 2JEL). Sampling was performed using the docking program PIPER, which performs exhaustive evaluation of a physics-based energy function in discretized 6D space of mutual orientations of two proteins using the Fast Fourier transform (FFT) correlation approach (<xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>). We sample 70,000 rotations, which approximately correspond to sampling at every 5° in the space of Euler angles. In the translational space, the sampling is defined by the 1.0 Å grid cell size. PIPER is used with a ‘smooth’ energy function that includes terms describing attractive and repulsive van der Waals interactions, electrostatic interactions calculated by a simplified generalized Born-type expression, and a desolvation terms, the latter represented by a pairwise interaction potential (<xref ref-type="bibr" rid="bib8">Chuang et al., 2008</xref>). We call the energy function ‘smooth’ because the repulsive contributions to the van der Waals interaction are selected to allow for a certain amount of overlaps.<fig-group><fig id="fig1" position="float"><object-id pub-id-type="doi">10.7554/eLife.01370.003</object-id><label>Figure 1.</label><caption><title>Docking results for the EIN–HPr complex.</title><p>Unbound structures were used both for the receptor, EIN (chain A from PDB entry 1ZYM) and for the ligand, HPr (chain P from PDB entry 2JEL). Encounter complexes were generated using Fast Fourier transform (FFT) based sampling. (<bold>A</bold>) Cartoon of the specific complex formed by EIN and HPr, shown in grey and yellow, respectively. The locations of the paramagnetic tags E5C-EDTA-Mn<sup>+</sup> and E32C-EDTA-Mn<sup>2+</sup> on HPr are encircled and are shown in red and blue, respectively. (<bold>B</bold>) Centers of HPr structures in the encounter complex ensemble. Colors indicate classification as follows (<italic>8</italic>): blue, Class I (i.e., overlapping with the specific complex); magenta, patch 1 of Class II (i.e., non-overlapping) positions; red, patch 2 of Class II positions; and pink, additional Class II position outside the main patches. (<bold>C</bold>) Ligand IRMSD vs PIPER energy score. (<bold>D</bold>) Two representative HPr poses, colored light blue and dark blue, from Class I. (<bold>E</bold>) Two representative HPr poses (in different shades of magenta) from Patch 1 of Class II. (<bold>F</bold>) View of the EIN–HPr complex and the centers of HPr poses after rotating 180° around the vertical axis (the bound HPr is now on the left side, almost completely hidden by EIN). (<bold>G</bold>) Representative HPr poses (in different shades of red) from Patch 2 of Class II, shown in the rotated view.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.003">http://dx.doi.org/10.7554/eLife.01370.003</ext-link></p></caption><graphic xlink:href="elife01370f001"/></fig><fig id="fig1s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.01370.004</object-id><label>Figure 1—figure supplement 1.</label><caption><title>Rotamers of the paramagnetic labels E5C-EDTA-Mn<sup>2+</sup> and E32C-EDTA-Mn<sup>2+</sup> on HPr.</title><p>The C-EDTA moiety is shown as sticks, with carbon atoms colored cyan. The rest of the HPr structure is shown as yellow cartoon. The Mn<sup>2+</sup> ions are shown as magenta spheres. (<bold>A</bold>) Three rotamers of HPr-E5C-EDTA-Mn<sup>2+</sup>. (<bold>B</bold>) Three rotamers of HPr-E32C-EDTA-Mn<sup>2+</sup>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.004">http://dx.doi.org/10.7554/eLife.01370.004</ext-link></p></caption><graphic xlink:href="elife01370fs001"/></fig></fig-group></p><p>Since the generated structures will be used for calculating PRE profiles to compare them to experimental PRE data (<xref ref-type="bibr" rid="bib13">Fawzi et al., 2010</xref>), two sets of docking calculations were performed using HPr structures that included the paramagnetic label EDTA-Mn<sup>2+</sup>, placed either at E5C, which is distal to the EIN/HPr interface in the native state, or at E32C, which is close to the edge of the interface (<xref ref-type="fig" rid="fig1">Figure 1A</xref>). Each C-EDTA-Mn<sup>2+</sup> label has three potential rotameric states, and hence Mn<sup>2+</sup> can occupy three different positions (<xref ref-type="fig" rid="fig1s1">Figure 1—figure supplement 1</xref>). A separate docking was performed for each rotameric state of each EDTA-Mn<sup>2+</sup> probe. We retained the 10,000 lowest energy structures from each docking simulation, thus a total of 30,000 low energy structures for each of the two probes. These structures were then used for the analysis of encounter complexes and for the calculation of intermolecular PRE rates.</p><p><xref ref-type="fig" rid="fig1">Figure 1B</xref> shows the center of each low energy HPr structure, generated by the docking, as a small sphere, and indicates that these structures form three major clusters. <xref ref-type="fig" rid="fig1">Figure 1C</xref> shows the Interface Root Mean Square Deviation (IRMSD) from the native complex vs the PIPER energy score of the docked structures. For the calculation of IRMD we first select the interface residues of HPr that are within 10 Å of any EIN atom in the native complex. For each docked structure we than superimpose EIN onto EIN in the X-ray structure of the complex, and calculate the RMSD between the Cα atoms of the HPr interface residues in docked and native structures. The structures in the largest cluster (shown in blue in <xref ref-type="fig" rid="fig1">Figure 1B</xref>) overlap with the native state, with the lowest energy conformations being within 5 Å IRMSD from the native (<xref ref-type="fig" rid="fig1">Figure 1C</xref>). The structures in this cluster, termed Class I, are the results of rigid body rotations and small translations around the native binding mode. Two representative Class I structures are shown in <xref ref-type="fig" rid="fig1">Figure 1D</xref>. Some Class I structures have less than 1 Å IRMSD, but the cluster extends as far as 15 Å IRMSD from the native. The two other clusters, termed Class II patch 1 and Class II patch 2, consist of structures that can coexist with the native complex. We note that while the three clusters clearly separate in the 3D representation shown in <xref ref-type="fig" rid="fig1">Figure 1B</xref>, they substantially overlap when projected into one dimension as a function of their IRMSD values. Nevertheless, <xref ref-type="fig" rid="fig1">Figure 1C</xref> shows at least three distinguishable energy minima. Class II patch 1 (magenta in <xref ref-type="fig" rid="fig1">Figure 1B</xref>) centers around a local energy minimum at around 17 Å IRMSD (<xref ref-type="fig" rid="fig1">Figure 1C</xref>). <xref ref-type="fig" rid="fig1">Figure 1E</xref> shows two representative conformations for this patch. The third large cluster, Class II patch 2 (red in <xref ref-type="fig" rid="fig1">Figure 1B</xref>), is located on the opposite side of the Class I cluster, and is better seen after rotating the complex by 180° around its vertical axis (<xref ref-type="fig" rid="fig1">Figure 1F</xref>). The local energy minimum in this cluster is located at about 30 Å IRMSD from the native state. <xref ref-type="fig" rid="fig1">Figure 1G</xref> shows two representative conformations for the Class II patch 2. In addition to the complexes that belong to Class I and the two patches of Class II, there are a number of smaller patches, shown in pink in <xref ref-type="fig" rid="fig1">Figure 1B</xref>.</p></sec><sec id="s2-2"><title>PRE experiments and theoretical PRE profiles based on structure</title><p>To detect encounter complexes in the EIN/HPr system by PRE titration experiments, HPr was labeled with a paramagnetic EDTA-Mn<sup>2+</sup> moiety conjugated via a disulfide bond to surface cysteine mutations at specific sites (<xref ref-type="bibr" rid="bib13">Fawzi et al., 2010</xref>). We consider the mutations E5C and E32C that are both located outside the specific interaction surface with EIN (<xref ref-type="fig" rid="fig1">Figure 1A</xref>) and thus the labels do not interfere with the formation of the native complex. Intermolecular <sup>1</sup>H<sub>N</sub>−Γ<sub>2</sub> rates for the backbone amide protons of U-[<sup>2</sup>H,<sup>15</sup>N]-labeled EIN were measured in the presence of 150 mM NaCl to eliminate potential spurious nonspecific interactions not relevant at physiological ionic strength. PRE measurements were carried out at six different concentrations of the paramagnetically labeled HPr (ranging from 60 to 450 μM), corresponding to HPr:EIN molar ratios of 0.2–1.5. At each point in the titration, the intermolecular PREs were summed over their respective residues and normalized to the highest value of each titration curve. The data points in <xref ref-type="fig" rid="fig2">Figure 2</xref> show the normalized intermolecular PRE values and their standard errors observed in these titration experiments (<xref ref-type="bibr" rid="bib13">Fawzi et al., 2010</xref>).<fig-group><fig id="fig2" position="float"><object-id pub-id-type="doi">10.7554/eLife.01370.005</object-id><label>Figure 2.</label><caption><title>Normalized intermolecular PRE profiles for the EIN–HPr complex.</title><p>PRE measurements were carried out at 300 μM EIN, 300 μM HPr, and 150 mM NaCl (<xref ref-type="bibr" rid="bib13">Fawzi et al., 2010</xref>). Theoretical intermolecular PREs, calculated only from the coordinates of the specific EIN/HPr complex, are shown as black lines. Calculated PRE values, based on all generated encounter complexes, are shown as blue lines, and reveal substantial contributions by the non-specific structures. The experimental PRE rates (<italic>Γ</italic><sub>2</sub>) are displayed as filled-in magenta circles. Points representing <italic>Γ</italic><sub>2</sub> values that were too large (>60 s<sup>−1</sup>) to be determined accurately are placed at the saturation level <italic>Γ</italic><sub>2</sub>/<italic>Γ</italic><sub>2max</sub> = 1. Interface residues are indicated by red ticks on the x-axis. (<bold>A</bold>) Results for EIN/HPr-E5C-EDTA-Mn<sup>2+</sup> complexes. (<bold>B</bold>) Results for EIN/HPr-E32C-EDTA-Mn<sup>2+</sup> complexes.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.005">http://dx.doi.org/10.7554/eLife.01370.005</ext-link></p></caption><graphic xlink:href="elife01370f002"/></fig><fig id="fig2s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.01370.006</object-id><label>Figure 2—figure supplement 1.</label><caption><title>Controls emphasizing the need for accurate energy function in docking: theoretical PRE profiles for the EIN/HPr complex, based on complexes generated by using only the van der Waals energy (blue line).</title><p>Theoretical intermolecular PREs, calculated from the coordinates of the specific EIN/HPr complex, are also shown as reference (black line). The experimental PRE rates (<italic>Γ</italic><sub>2</sub>) are displayed as filled-in magenta circles. (<bold>A</bold>) Results for EIN/HPr-E5C-EDTA-Mn<sup>2+</sup> compexes. (<bold>B</bold>) Results for EIN/HPr-E32C-EDTA-Mn<sup>2+</sup> complexes.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.006">http://dx.doi.org/10.7554/eLife.01370.006</ext-link></p></caption><graphic xlink:href="elife01370fs002"/></fig><fig id="fig2s2" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.01370.007</object-id><label>Figure 2—figure supplement 2.</label><caption><title>Normalized intermolecular PRE profiles and encounter compexes for the IIA<sup>Mannitol</sup>/HPr interactions.</title><p>(<bold>A</bold>) Native structure of the complex formed by IIA<sup>Mannitol</sup> (grey) and HPr (yellow). The location of the paramagnetic tag, HPr-E5C-EDTA-Mn<sup>2+</sup>, is colored red and is indicated by a circle. The PDB ID of the complex is 1 J6T. (<bold>B</bold>) Centers of HPr structures, shown as blue spheres, in the encounter complex ensemble generated by the PIPER docking program. IIA<sup>Mannitol</sup>, shown as grey solid, is considered the receptor. The native binding pose of HPr is shown as yellow cartoon. (<bold>C</bold>) Theoretical intermolecular PRE profiles calculated from the coordinates of the native structure only (black line), and based on all encounter complexes generated by the docking (blue line). The experimental PRE rates (<italic>Γ</italic><sub>2</sub>) are displayed as filled-in magenta circles (<xref ref-type="bibr" rid="bib44">Tang et al., 2006</xref>). Points representing <italic>Γ</italic><sub>2</sub> values that were too large (>60 s<sup>−</sup>1) to be determined accurately are placed at the saturation level Γ<sub>2</sub>/Γ<sub>2max</sub> = 1. The interface residues of IIA<sup>Mannitol</sup> are indicated by red ticks on the x-axis.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.007">http://dx.doi.org/10.7554/eLife.01370.007</ext-link></p></caption><graphic xlink:href="elife01370fs003"/></fig><fig id="fig2s3" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.01370.008</object-id><label>Figure 2—figure supplement 3.</label><caption><title>Normalized intermolecular PRE profiles and encounter compexes for the HPr/HPr interactions.</title><p>(<bold>A</bold>) Normalized intermolecular PRE profiles for the HPr/HPr complex. The theoretical intermolecular PREs profile, calculated from low energy encounter complexes, is shown as a green line. The experimental PRE rates (<italic>Γ</italic><sub><italic>2</italic></sub>) are displayed as filled-in magenta circles (<xref ref-type="bibr" rid="bib43">Tang et al., 2008</xref>). Points representing Γ<sub>2</sub> values that were too large (>60 s<sup>−</sup>1) to be determined accurately are placed at the saturation level Γ<sub>2</sub>/Γ<sub>2max</sub> = 1. Interface residues are indicated by red ticks on the x-axis. (<bold>B</bold>) Ensemble of low energy conformations of HPr/HPr interactions (<xref ref-type="bibr" rid="bib43">Tang et al., 2008</xref>). One of the two HPr molecules, considered he receptor, is shown as grey cartoon. The centers of the other HPr positions generated by the docking are shown as small blue spheres. These structures were used for back-calculating the theoretical PRE profile (green curve) shown in <bold>A</bold>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.008">http://dx.doi.org/10.7554/eLife.01370.008</ext-link></p></caption><graphic xlink:href="elife01370fs004"/></fig><fig id="fig2s4" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.01370.009</object-id><label>Figure 2—figure supplement 4.</label><caption><title>Encounter complexes in the Cytochrome c–Cytochrome c peroxidase interactions as reported on the basis of PRE experiments (<xref ref-type="bibr" rid="bib1">Bashir et al., 2010</xref>), shown as pink spheres, and the ones generated by the PIPER docking program, shown as blue spheres.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.009">http://dx.doi.org/10.7554/eLife.01370.009</ext-link></p></caption><graphic xlink:href="elife01370fs005"/></fig></fig-group></p><p>Given the coordinates of a complex, one can back-calculate theoretical PRE profiles (‘Materials and methods’). As shown in <xref ref-type="fig" rid="fig2">Figure 2</xref>, the theoretical profile calculated from the coordinates in the X-ray structure of the native complex (black curve) substantially deviates from the experimental values for a number of residues. For HPr-E5C the largest differences occur at positions 59–97 and 160–167 of EIN, with smaller deviations at 23–37 and 183–189 (<xref ref-type="fig" rid="fig2">Figure 2A</xref>). For HPr-E32C the large differences are at positions 22–51, 56–74, 96–106, and 160–167 of EIN, with smaller differences at 184–189 (<xref ref-type="fig" rid="fig2">Figure 2B</xref>). These deviations show that the observed PRE rates cannot be explained well on the basis of the native binding mode of HPr alone, and provide at least qualitative evidence for the existence of lowly populated encounter states in rapid exchange with the final native complex (<xref ref-type="bibr" rid="bib43">Tang et al., 2008</xref>).</p><p>Our hypothesis is that the non-native structures generated by the docking represent encounter complexes, and hence accounting for these structures predicts the experimental PRE values better than the profile calculated only from the coordinates of the native complex. Therefore we calculate the theoretical PRE profiles based on all 30,000 low energy structures obtained by the docking for each position of the paramagnetic label (blue lines in <xref ref-type="fig" rid="fig2">Figure 2</xref>). The details of the calculation are given in the ‘Materials and methods’. We emphasize that these curves are based only on the docked structures, and the native binding mode in the X-ray structure of the complex is not used. The results show that the hypothesis is certainly true for EIN/HPr-E5C, because the full encounter ensemble provides much better approximation than the native complex, particularly for residues 59–97 and 160–167 (<xref ref-type="fig" rid="fig2">Figure 2A</xref>). The correlation coefficient between the experimental PRE rates and the ones based on the encounter complexes is 0.705. In contrast, the correlation coefficients between the experimental PRE rates and the ones back-calculated from the native structure (black line in <xref ref-type="fig" rid="fig2">Figure 2A</xref>) is only 0.47. We note that the agreement improves even for the interface residues in the 67–85 region of EIN (indicated by red ticks in <xref ref-type="fig" rid="fig2">Figure 2</xref>). The explanation is that the E5C-EDTA-Mn<sup>2+</sup> label is on the far side of HPr from the interface, and in some encounter complexes this label is much closer to interface residues than in the native complex. For HPr with the E32C-EDTA-Mn<sup>2+</sup> label, accounting for the encounter complexes generated by docking (blue curve in <xref ref-type="fig" rid="fig2">Figure 2B</xref>) improves the correlation coefficient more moderately, from 0.709 to 0.77. This is due to the fact that E32C is close to the edge of the interface in the native complex, already providing a strong PRE signal for residues 67–85, resulting in a high correlation coefficient with the experimental PRE values. As will be discussed, since the PRE data are sensitive to small conformational changes and thus are inherently noisy, it is difficult to further improve an already high correlation coefficient. However, even for HPr-E32C, the PRE profile back-calculated from the low energy models still yields better prediction than considering only the native binding mode. Since it is well known that the PRE profiles heavily depend on the location of the paramagnetic tag relative to the native interface (<xref ref-type="bibr" rid="bib13">Fawzi et al., 2010</xref>), this result does not contradict to our hypothesis that accounting for all structures generated by the docking improves the prediction of PRE rates.</p><p>To provide a control and to demonstrate that the use of an accurate energy function is very important for generating a meaningful ensemble of encounter complexes we have also performed docking calculations using a scoring function without long-range energy terms, that is, considering only the attractive and repulsive components of the van der Waals energy. This simplified energy function yields docked structures that have good shape complementarity, but have no favorable electrostatic or chemical interactions. The 30,000 structures with the lowest van der Waals energy from this ‘shape-complementarity only’ docking were then used for back-calculating theoretical PRE profiles. The results of these calculations, shown in <xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1</xref>, make it absolutely clear that the back-calculated PRE profiles based on the ensemble of structures generated without a proper energy function do not show any resemblance to the observed PRE data. In fact, both correlation coefficients between theoretical and experimental PRE rates are negative, −0.36 and −0.58, respectively, for the probes at positions E5C and E32C.</p><p>Considering encounter complexes generated by PIPER using its physics based energy function we also obtained good agreement with experimental PRE data for other pairs of proteins. The first is the IIA<sup>Mannitol</sup>/HPr complex (<xref ref-type="bibr" rid="bib12">Cornilescu et al., 2002</xref>; <xref ref-type="bibr" rid="bib44">Tang et al., 2006</xref>). <xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2,B</xref> show the native structure of the complex and the ensemble of docked structures generated by PIPER. The paramagnetic label is placed at E5C of HPr, colored red and indicated by a small circle in <xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2A</xref>. It is important that, similarly to the EIN/HPr system, the E5C-EDTA-Mn<sup>2+</sup> label is on the far side of HPr from the interface in the native structure of the complex<bold>.</bold> <xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2C</xref> shows the experimental PRE data, the theoretical PRE profile based on the native complex (black line), and the theoretical profile obtained by considering the 30,000 low energy structures generated by the docking (blue line). The correlation coefficient between the experimental PRE rates and the ones back-calculated from the native structure is 0.58, whereas using the docked structures for the PRE calculation increases the correlation coefficient to 0.78, demonstrating substantially improved prediction. Although some of the improvements occur at the interface residues, it is clearly helpful that the HPr-E5C-EDTA-Mn<sup>2+</sup> label is far from the interface. The distance between the label and a number of IIA<sup>Mannitol</sup> residues is substantially reduced in some of the encounter complexes, which makes the presence of minor species more pronounced. We also show observed PRE data and theoretical profiles calculated from the ensemble of structures generated by docking for the complexes HPr/HPr (<xref ref-type="bibr" rid="bib43">Tang et al., 2008</xref>; <xref ref-type="fig" rid="fig2s3">Figure 2—figure supplement 3</xref>), and cytochrome c/cytochrome c peroxidase (<xref ref-type="bibr" rid="bib1">Bashir et al., 2010</xref>) (<xref ref-type="fig" rid="fig2s4">Figure 2—figure supplement 4</xref>), demonstrating good qualitative agreement in both cases.</p></sec><sec id="s2-3"><title>Energy landscapes of encounter complexes</title><p>Having established that the sampling algorithm and energy function are accurate enough for predicting ensembles of encounter complexes, we proceeded to the characterization of the energy landscape in a neighborhood of the native complex conformation. As in the previous section, we focused on the rigid-body motions of the ligand protein in the space fixed on the receptor protein, although local structural adjustments of the proteins were allowed for more accurate energy calculation. Geometrically the 6D translational/rotational space is the so-called Special Euclidean Group <italic>SE(3)</italic>, which is the semidirect product of <italic>R</italic><sup>3</sup> of the translations and <italic>SO(3)</italic> of the rotations (<xref ref-type="bibr" rid="bib32">Park, 1995</xref>; <xref ref-type="bibr" rid="bib33">Park and Ravani, 1997</xref>; <xref ref-type="bibr" rid="bib37">Shen et al., 2008</xref>; <xref ref-type="bibr" rid="bib30">Mirzaei et al., 2012</xref>). Restricting considerations to encounter complexes in which the surfaces of the two proteins touch each other removes the distance of the two proteins as a variable, and the space can be parameterized in terms of 5 angular coordinates. Two angles are needed to define the direction from the center of the receptor to the center of the ligand interface, and the other three angles specify the rotation of the ligand. Although the resulting space is nonlinear and thus the 5 angular coordinates are interdependent, a 5D Euclidean space can be mapped onto this nonlinear space using exponential maps (<xref ref-type="bibr" rid="bib37">Shen et al., 2008</xref>), and hence we will be able to use analysis tools such as PCA, developed for application in Euclidean space. Further details justifying the need for the use of exponential maps will be given in ‘Materials and methods’. Once an appropriate coordinate system was defined, we selected and densely sampled a region in the neighborhood of the native state to obtain information on the shape of the binding funnel (<xref ref-type="bibr" rid="bib5">Camacho et al., 1999</xref>; <xref ref-type="bibr" rid="bib36">Selzer and Schreiber, 2001</xref>; <xref ref-type="bibr" rid="bib49">Wang and Wade, 2003</xref>; <xref ref-type="bibr" rid="bib31">Miyashita et al., 2004</xref>). Since the apparent properties of the landscape depend both on the energy evaluation model and the method of sampling, to assess the generality of the results we used both PIPER (<xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>) and the very different docking program RosettaDock (<xref ref-type="bibr" rid="bib18">Gray et al., 2003</xref>), which is based on Monte Carlo minimization and rebuilds side chain conformations during the search. From each sampling calculation, performed either by PIPER or by RosettaDock, we selected the conformations below a certain energy threshold to delineate the floor of the energy funnel.</p><p>Encounter complexes were generated from unbound protein structures (<xref ref-type="bibr" rid="bib7">Chen et al., 2003</xref>) for a diverse set of 42 interacting protein pairs (<xref ref-type="table" rid="tbl1">Table 1</xref>). For each of these complexes, selected from the protein docking benchmark (<xref ref-type="bibr" rid="bib7">Chen et al., 2003</xref>), both PIPER and RosettaDock found an energy funnel near the native state. Since this is generally not the case for complexes involving multiple subunits or large conformational changes upon binding, such complexes in the benchmark set were not considered. Structures were retained within 10 Å IRMSD from the native state. After sampling, the exponential coordinates were normalized to ensure that the variances in the sample set are the same along each coordinate axis, and the shape of the energy landscape over the selected region was studied by applying principal component analysis (PCA) to 5% of conformations with the lowest energy values. As will be emphasized in ‘Materials and methods’, the use of exponential maps, resulting in independent coordinates, is crucial for the success of our study, as only in this case can PCA separate the essential hyperspaces that bound the low energy ensemble.<table-wrap id="tbl1" position="float"><object-id pub-id-type="doi">10.7554/eLife.01370.010</object-id><label>Table 1.</label><caption><p>Eigenvalues (in %) obtained by PCA, and the angle between restrictive subspaces</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.010">http://dx.doi.org/10.7554/eLife.01370.010</ext-link></p></caption><table frame="hsides" rules="groups"><thead><tr><th rowspan="2">PDB ID</th><th colspan="5">PIPER</th><th colspan="5">RosettaDock</th><th rowspan="2">Discrepancy (degrees)</th></tr><tr><th>λ<sub>1</sub></th><th>λ<sub>2</sub></th><th>λ<sub>3</sub></th><th>λ<sub>4</sub></th><th>λ<sub>5</sub></th><th>λ<sub>1</sub></th><th>λ<sub>2</sub></th><th>λ<sub>3</sub></th><th>λ<sub>4</sub></th><th>λ<sub>5</sub></th></tr></thead><tbody><tr><td>1AVX</td><td>59.4</td><td>32.8</td><td>6.2</td><td>1.2</td><td>0.3</td><td>67.4</td><td>15.5</td><td>13.4</td><td>3.4</td><td>0.3</td><td>5</td></tr><tr><td>1B6C</td><td>72.1</td><td>19.1</td><td>6.9</td><td>1.3</td><td>0.5</td><td>84.2</td><td>10.2</td><td>3.3</td><td>1.9</td><td>0.4</td><td>4</td></tr><tr><td>1 E6E</td><td>59.1</td><td>18.1</td><td>11.3</td><td>10.0</td><td>1.5</td><td>57.6</td><td>16.3</td><td>10.9</td><td>8.8</td><td>6.4</td><td>29</td></tr><tr><td>1EAW</td><td>44.3</td><td>31.7</td><td>22.2</td><td>1.0</td><td>0.9</td><td>57.9</td><td>33.0</td><td>4.6</td><td>4.0</td><td>0.4</td><td>25</td></tr><tr><td>1 E6J</td><td>78.7</td><td>13.5</td><td>7.1</td><td>0.3</td><td>0.3</td><td>47.6</td><td>31.5</td><td>18.7</td><td>1.2</td><td>1.0</td><td>16</td></tr><tr><td>1GLA</td><td>58.9</td><td>26.9</td><td>9.3</td><td>3.7</td><td>1.2</td><td>41.5</td><td>33.1</td><td>15.1</td><td>8.0</td><td>2.3</td><td>2</td></tr><tr><td>1IQD</td><td>74.7</td><td>13.5</td><td>7.8</td><td>3.6</td><td>0.4</td><td>58.0</td><td>26.7</td><td>12.7</td><td>1.9</td><td>0.7</td><td>13</td></tr><tr><td>1K74</td><td>47.8</td><td>28.0</td><td>19.0</td><td>3.6</td><td>1.5</td><td>61.0</td><td>22.0</td><td>10.5</td><td>5.2</td><td>1.2</td><td>19</td></tr><tr><td>1MAH</td><td>60.3</td><td>22.4</td><td>11.7</td><td>4.4</td><td>1.2</td><td>52.8</td><td>22.0</td><td>13.5</td><td>7.7</td><td>4.0</td><td>14</td></tr><tr><td>1N8O</td><td>56.1</td><td>23.4</td><td>13.3</td><td>6.4</td><td>0.9</td><td>66.9</td><td>22.3</td><td>10.3</td><td>0.3</td><td>0.2</td><td>20</td></tr><tr><td>1PPE</td><td>56.4</td><td>26.4</td><td>14.9</td><td>1.7</td><td>0.6</td><td>47.1</td><td>44.4</td><td>7.9</td><td>0.4</td><td>0.1</td><td>3</td></tr><tr><td>1PXV</td><td>68.3</td><td>17.0</td><td>9.6</td><td>4.3</td><td>0.8</td><td>32.1</td><td>27.2</td><td>23.6</td><td>14.5</td><td>2.7</td><td>8</td></tr><tr><td>1 R0R</td><td>55.0</td><td>26.8</td><td>15.3</td><td>2.7</td><td>0.2</td><td>69.3</td><td>20.2</td><td>6.7</td><td>3.0</td><td>0.9</td><td>13</td></tr><tr><td>2SNI</td><td>49.3</td><td>31.6</td><td>17.0</td><td>1.5</td><td>0.6</td><td>79.6</td><td>15.5</td><td>3.5</td><td>1.2</td><td>0.2</td><td>16</td></tr><tr><td>1KXQ</td><td>47.7</td><td>30.0</td><td>16.8</td><td>4.1</td><td>1.3</td><td>66.3</td><td>30.0</td><td>4.4</td><td>0.2</td><td>0.1</td><td>29</td></tr><tr><td>7CEI</td><td>44.7</td><td>28.5</td><td>20.9</td><td>4.6</td><td>1.3</td><td>47.7</td><td>27.9</td><td>18.9</td><td>3.6</td><td>1.9</td><td>19</td></tr><tr><td>2SIC</td><td>58.6</td><td>23.4</td><td>9.4</td><td>7.2</td><td>1.4</td><td>84.2</td><td>8.8</td><td>4.1</td><td>2.4</td><td>0.5</td><td>3</td></tr><tr><td>1AY7</td><td>56.9</td><td>20.3</td><td>15.0</td><td>5.4</td><td>2.4</td><td>42.1</td><td>32.5</td><td>12.6</td><td>9.2</td><td>3.7</td><td>27</td></tr><tr><td>1OPH</td><td>72.6</td><td>15.5</td><td>9.2</td><td>2.2</td><td>0.5</td><td>84.2</td><td>9.3</td><td>5.9</td><td>0.4</td><td>0.2</td><td>21</td></tr><tr><td>1UDI</td><td>64.6</td><td>18.6</td><td>12.6</td><td>2.4</td><td>1.8</td><td>51.2</td><td>27.1</td><td>14.2</td><td>6.4</td><td>1.1</td><td>33</td></tr><tr><td>1BUH</td><td>44.8</td><td>27.7</td><td>17.6</td><td>9.2</td><td>0.6</td><td>40.3</td><td>32.9</td><td>16.6</td><td>8.2</td><td>1.9</td><td>21</td></tr><tr><td>1FSK</td><td>45.0</td><td>28.0</td><td>22.1</td><td>3.5</td><td>1.4</td><td>42.6</td><td>29.7</td><td>19.9</td><td>5.8</td><td>1.9</td><td>21</td></tr><tr><td>1JPS</td><td>57.1</td><td>25.7</td><td>12.4</td><td>4.0</td><td>0.8</td><td>56.3</td><td>28.8</td><td>13.7</td><td>0.7</td><td>0.6</td><td>30</td></tr><tr><td>1DQJ</td><td>51.4</td><td>31.3</td><td>15.0</td><td>1.4</td><td>0.9</td><td>46.5</td><td>19.8</td><td>17.4</td><td>12.3</td><td>4.0</td><td>17</td></tr><tr><td>2B42</td><td>55.6</td><td>27.7</td><td>12.8</td><td>3.4</td><td>0.5</td><td>45.4</td><td>23.1</td><td>15.7</td><td>11.5</td><td>4.4</td><td>24</td></tr><tr><td>2FD6</td><td>65.1</td><td>18.1</td><td>9.9</td><td>4.6</td><td>2.2</td><td>36.4</td><td>23.9</td><td>21.0</td><td>13.7</td><td>5.0</td><td>20</td></tr><tr><td>2HQS</td><td>80.1</td><td>11.3</td><td>7.2</td><td>1.0</td><td>0.4</td><td>54.1</td><td>36.2</td><td>7.8</td><td>1.6</td><td>0.4</td><td>9</td></tr><tr><td>2I25</td><td>70.3</td><td>18.5</td><td>9.9</td><td>0.8</td><td>0.5</td><td>56.0</td><td>15.3</td><td>12.8</td><td>10.5</td><td>5.3</td><td>12</td></tr><tr><td>2MTA</td><td>45.8</td><td>26.1</td><td>20.5</td><td>5.2</td><td>2.5</td><td>45.5</td><td>32.2</td><td>12.2</td><td>7.4</td><td>2.7</td><td>30</td></tr><tr><td>1MLC</td><td>59.3</td><td>31.5</td><td>6.8</td><td>1.2</td><td>1.1</td><td>42.7</td><td>30.1</td><td>17.3</td><td>7.0</td><td>2.8</td><td>17</td></tr><tr><td>2HRK</td><td>57.7</td><td>31.0</td><td>9.7</td><td>0.9</td><td>0.7</td><td>61.2</td><td>16.4</td><td>10.5</td><td>8.6</td><td>3.3</td><td>30</td></tr><tr><td>1AHW</td><td>74.4</td><td>16.3</td><td>7.7</td><td>1.1</td><td>0.5</td><td>46.7</td><td>31.5</td><td>17.2</td><td>3.1</td><td>1.5</td><td>24</td></tr><tr><td>1Z5Y</td><td>66.1</td><td>18.0</td><td>8.9</td><td>5.4</td><td>1.5</td><td>57.1</td><td>32.3</td><td>9.7</td><td>0.6</td><td>0.4</td><td>29</td></tr><tr><td>2HLE</td><td>54.0</td><td>28.1</td><td>13.0</td><td>3.4</td><td>1.4</td><td>67.0</td><td>12.9</td><td>12.1</td><td>5.9</td><td>2.1</td><td>2</td></tr><tr><td>2NZ8</td><td>69.4</td><td>14.1</td><td>8.4</td><td>5.2</td><td>2.9</td><td>44.8</td><td>28.3</td><td>15.1</td><td>7.3</td><td>4.5</td><td>34</td></tr><tr><td>1BVN</td><td>61.4</td><td>20.3</td><td>14.3</td><td>3.6</td><td>0.4</td><td>37.2</td><td>28.5</td><td>17.8</td><td>10.0</td><td>6.5</td><td>32</td></tr><tr><td>1CGI</td><td>66.9</td><td>15.4</td><td>10.9</td><td>5.4</td><td>1.9</td><td>57.9</td><td>27.9</td><td>10.7</td><td>3.0</td><td>0.5</td><td>48</td></tr><tr><td>1GPW</td><td>53.8</td><td>20.9</td><td>14.2</td><td>6.4</td><td>4.7</td><td>46.5</td><td>26.5</td><td>17.9</td><td>5.0</td><td>4.0</td><td>27</td></tr><tr><td>2JEL</td><td>72.4</td><td>16.3</td><td>8.1</td><td>2.2</td><td>0.9</td><td>47.8</td><td>31.6</td><td>12.9</td><td>6.8</td><td>0.8</td><td>31</td></tr><tr><td>1NCA</td><td>76.7</td><td>18.8</td><td>3.0</td><td>1.2</td><td>0.4</td><td>55.9</td><td>24.3</td><td>15.6</td><td>3.2</td><td>1.0</td><td>27</td></tr><tr><td>2UUY</td><td>69.4</td><td>15.4</td><td>12.7</td><td>1.6</td><td>0.9</td><td>73.6</td><td>16.2</td><td>9.0</td><td>1.0</td><td>0.2</td><td>11</td></tr><tr><td>1KAC</td><td>48.9</td><td>34.6</td><td>13.3</td><td>2.0</td><td>1.2</td><td>53.8</td><td>19.5</td><td>15.6</td><td>6.8</td><td>4.2</td><td>30</td></tr></tbody></table></table-wrap></p><p>The eigenvalues obtained by PCA are normalized to add to 100%. Each eigenvalue <italic>λ</italic> <sub>i</sub> can be then interpreted as the percentage of the total variance that is accounted for by the variance along the corresponding eigenvector <bold><italic>v</italic></bold><sub>i</sub>. The smallest eigenvalue, <italic>λ</italic><sub>5</sub>, is less than 5% for almost all complexes (<xref ref-type="table" rid="tbl1">Table 1</xref>). In many cases both <italic>λ</italic><sub>5</sub> and <italic>λ</italic><sub>4</sub> are small (their sum is less than 10%), indicating that the eigenvectors <bold><italic>v</italic></bold><sub>4</sub> and <bold><italic>v</italic></bold><sub>5</sub> span a ‘restrictive’ subspace where the low energy structures barely deviate from the native complex. In contrast, <italic>λ</italic><sub>1</sub> and <italic>λ</italic><sub>2</sub> typically sum up to more than 75% of variance. Thus, it is expected that in the ‘permissive’ subspace spanned by <bold><italic>v</italic></bold><sub>1</sub> and <bold><italic>v</italic></bold><sub>2</sub> the low energy structures may substantially differ from the native conformation.</p><p>As an example, <xref ref-type="fig" rid="fig3">Figure 3A</xref> shows IRMSD and energy distributions along the five eigenvectors, calculated from the low energy structures generated by PIPER, for the complex between the retinoid X-receptor α (RXRα) and the peroxisome proliferator-activated receptor γ (PPARγ), considered here as the receptor and the ligand, respectively. The PDB entry of the complex is 1K74, but we docked the unbound (separately crystallized) RXRα and PPARγ structures rather than the components from the complex. <xref ref-type="fig" rid="fig3">Figure 3B</xref> shows the distributions of the same quantities, but based on the low energy structures generated by RosettaDock. The largest eigenvalue, <italic>λ</italic><sub>1</sub>, is close to 50% for both energy functions. The corresponding movements along <bold><italic>v</italic></bold><sub>1</sub> are rotations of helix H12 of PPARγ around a hydrophobic patch, formed by the side chains of F432, A433, and L436, which binds to a large hydrophobic pocket of RXRα and remains almost at the same position in all low energy encounter complexes (<xref ref-type="fig" rid="fig3">Figure 3C</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>; <xref ref-type="other" rid="video1">Video 1</xref>). As helix H12 rotates, the entire PPARγ moves with it until a loop formed by PPARγ residues 394 to 403 reaches a favorable position on the surface of RXRα. We note that hydrophobic patch on helix H12 and the residues connecting it to the rest of the protein (residues 413–433) are known to be essential for forming the heterodimer (<xref ref-type="bibr" rid="bib6">Chan and Wells, 2009</xref>). Along the eigenvector <bold><italic>v</italic></bold><sub>2</sub> that correspond to the second largest eigenvalue <italic>λ</italic><sub>2</sub> we can observe how the amino end of helix H12 with the hydrophobic patch on it moves into its binding pocket (<xref ref-type="other" rid="video2">Video 2</xref>). Based on the eigenvalues <italic>λ</italic><sub>1</sub> and <italic>λ</italic><sub>2</sub> (<xref ref-type="table" rid="tbl1">Table 1</xref>), over 75% of all movement of PPARγ approaching RXRα occurs in the subspace spanned by the eigenvectors <bold><italic>v</italic></bold><sub>1</sub> and <bold><italic>v</italic></bold><sub>2</sub>. Thus, this subspace can be regarded as the essential consensus of a very large number of association trajectories. In contrast to the permissive subspace, changes are very small along <bold><italic>v</italic></bold><sub>5</sub> (<xref ref-type="fig" rid="fig3">Figure 3D</xref>). Since the higher energy structures (not included in the data considered for PCA) can be substantially further from the native state than the ones with low energy, we conclude that the valley based on energy is much narrower than the valley based on geometry.<fig-group><fig id="fig3" position="float"><object-id pub-id-type="doi">10.7554/eLife.01370.011</object-id><label>Figure 3.</label><caption><title>Shape of the energy landscape along the five PCA eigenvectors for the complex of PPAR-γ and RXR-α (PDB code 1K74).</title><p>(<bold>A</bold>) Distributions of IRMSD (green) and energy (cyan) values based on structures generated by PIPER as functions of the ‘balanced’ coordinates shown on the x-axis. Dark blue diamonds indicate low energy data points used for the PCA. The IRMSD (y-axis in the left column) is given in Å. The energy values (on the y-axis in the right column) are given by the PIPER scoring function. (<bold>B</bold>) Same as <xref ref-type="fig" rid="fig3">Figure 3A</xref>, but based on structures generated by RosettaDock. The energy values (on the y-axis in the right column) are given by the RosettaDock scoring function. (<bold>C</bold>) Encounter complexes along the most permissive direction <bold><italic>v</italic></bold><sub>1</sub>. The ensemble includes mostly translations from the native state. (<bold>D</bold>) Encounter complexes along the most restrictive direction <bold><italic>v</italic></bold><sub>5</sub>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.011">http://dx.doi.org/10.7554/eLife.01370.011</ext-link></p></caption><graphic xlink:href="elife01370f003"/></fig><fig id="fig3s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.01370.012</object-id><label>Figure 3—figure supplement 1.</label><caption><title>Helix H12 of PPARγ with residues of the hydrophobic patch indicated.</title><p>The receptor, RXRα, is shown in surface representation. Color code: oxygen red, nitrogen blue, and carbon white.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.012">http://dx.doi.org/10.7554/eLife.01370.012</ext-link></p></caption><graphic xlink:href="elife01370fs006"/></fig></fig-group><media content-type="glencoe play-in-place height-250 width-310" id="video1" mime-subtype="mp4" mimetype="video" xlink:href="elife01370v001.mp4"><object-id pub-id-type="doi">10.7554/eLife.01370.013</object-id><label>Video 1.</label><caption><title>Movement of PPARγ, shown as green cartoon, along the most permissive eigenvector v<sub>1</sub>.</title><p>The receptor, RXRα, is shown as grey surface.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.013">http://dx.doi.org/10.7554/eLife.01370.013</ext-link></p></caption></media><media content-type="glencoe play-in-place height-250 width-310" id="video2" mime-subtype="mp4" mimetype="video" xlink:href="elife01370v002.mp4"><object-id pub-id-type="doi">10.7554/eLife.01370.014</object-id><label>Video 2.</label><caption><title>Movement of PPARγ, shown as green cartoon, along the second most permissive eigenvector v<sub>2</sub>.</title><p>The receptor, RXRα, is shown as grey surface.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.014">http://dx.doi.org/10.7554/eLife.01370.014</ext-link></p></caption></media></p><p>As a second example, we show IRMSD and energy distributions and PCA results for an enzyme–inhibitor complex, subtilisin Carlsberg and its protein inhibitor, OMTKY3 (<xref ref-type="fig" rid="fig4">Figure 4</xref>). The PDB entry of the complex is 1R0R. For this pair of proteins, the low energy encounter complexes along the eigenvectors <bold><italic>v</italic></bold><sub>4</sub> and <bold><italic>v</italic></bold><sub>5</sub> show even narrower distributions than in the previous example, both for PIPER and RosettaDock (<xref ref-type="fig" rid="fig4">Figure 4A,B</xref>). Since the essentially planar inhibitor loop (residues 13 to 19 of OMTKY3) is locked into the crevice at the enzyme’s active site, we expected that the motion along the most permissive direction would be the rigid body rotation of the entire inhibitor, possibly with slight readjustments of the loop. However, we have found that the motion along <bold><italic>v</italic></bold><sub>1</sub> is the move of the loop, and particularly the primary specificity residue L18, deeper into the binding pocket of the enzyme (<xref ref-type="fig" rid="fig4">Figure 4C</xref>, <xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1</xref>; <xref ref-type="other" rid="video3">Video 3</xref>). The rotation along the loop is also present, but along the eigenvector <bold><italic>v</italic></bold><sub>2</sub> rather than <bold><italic>v</italic></bold><sub>1</sub> (<xref ref-type="other" rid="video4">Video 4</xref>). Based on the eigenvectors <italic>λ</italic><sub>1</sub> and <italic>λ</italic><sub>2</sub> (<xref ref-type="table" rid="tbl1">Table 1</xref>), 81.8% of the movements of OMTKY3 upon binding occurs in the subspace spanned by eigenvectors <bold><italic>v</italic></bold><sub>1</sub> and <bold><italic>v</italic></bold><sub>2</sub> for this complex. In contrast, the motion along the most restrictive direction <bold><italic>v</italic></bold><sub>5</sub> is a very small translation along the bottom of the active site (<xref ref-type="fig" rid="fig4">Figure 4D</xref>). It is important to note that, in principle, small eigenvalues identified by PCA could have also occur by chance due to undersampling a subspace. We performed simple Monte Carlo analyses to exclude this possibility (‘Materials and methods’).<fig-group><fig id="fig4" position="float"><object-id pub-id-type="doi">10.7554/eLife.01370.015</object-id><label>Figure 4.</label><caption><title>Shape of the energy landscape along the five PCA eigenvectors for the complex of subtilisin Carlsberg and its protein inhibitor, OMTKY3.</title><p>All notations are as in <xref ref-type="fig" rid="fig3">Figure 3</xref>. (<bold>A</bold>) Distributions of interface IRMSD and energy values based on the structures generated by PIPER. (<bold>B</bold>) Same as <xref ref-type="fig" rid="fig4">Figure 4A</xref>, but based on the RosettaDock dataset. (<bold>C</bold>) Encounter complexes along the most permissive direction <bold><italic>v</italic></bold><sub>1</sub>. The ensemble consists of small rotations that leave the inhibitory loop position largely invariant. (<bold>D</bold>) Encounter complexes along the most restrictive direction <bold><italic>v</italic></bold><sub>5</sub>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.015">http://dx.doi.org/10.7554/eLife.01370.015</ext-link></p></caption><graphic xlink:href="elife01370f004"/></fig><fig id="fig4s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.01370.016</object-id><label>Figure 4—figure supplement 1.</label><caption><title>Movement of the OMTKY3 inhibitory loop into the active site of subtilisin Carlsberg.</title><p>Two snapshot of the motion are shown (in green and cyan) for residues 16 to 19 (CTLE), with L18 indicating the primary specificity residue.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.016">http://dx.doi.org/10.7554/eLife.01370.016</ext-link></p></caption><graphic xlink:href="elife01370fs007"/></fig></fig-group><media content-type="glencoe play-in-place height-250 width-310" id="video3" mime-subtype="mp4" mimetype="video" xlink:href="elife01370v003.mp4"><object-id pub-id-type="doi">10.7554/eLife.01370.017</object-id><label>Video 3.</label><caption><title>Movement of the protein inhibitor, OMTKY3, shown as green cartoon, along the most permissive eigenvector v<sub>1</sub>.</title><p>The receptor, subtilisin Carlsberg, is shown as grey surface.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.017">http://dx.doi.org/10.7554/eLife.01370.017</ext-link></p></caption></media><media content-type="glencoe play-in-place height-250 width-310" id="video4" mime-subtype="mp4" mimetype="video" xlink:href="elife01370v004.mp4"><object-id pub-id-type="doi">10.7554/eLife.01370.018</object-id><label>Video 4.</label><caption><title>Movement of the protein inhibitor, OMTKY3, shown as green cartoon, along the second most permissive eigenvector v<sub>2</sub>.</title><p>The receptor, subtilisin Carlsberg, is shown as grey surface.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.018">http://dx.doi.org/10.7554/eLife.01370.018</ext-link></p></caption></media></p><p>As shown by the eigenvalues in <xref ref-type="table" rid="tbl1">Table 1</xref> and by <xref ref-type="fig" rid="fig3 fig4">Figures 3 and 4</xref>, the energy funnels derived from the PCA of the energy landscapes generated by PIPER and RosettaDock slightly differ. This is not surprising, because we specifically selected two docking programs that are very different both in terms of their sampling algorithms and scoring functions (‘Materials and methods’). PIPER performs systematic rigid body sampling on a dense grid using a ‘smooth’ potential that allows for some overlaps (<xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>). In contrast, RosettaDock samples the region of interest using a Monte Carlo minimization algorithm, which biases the search toward low energy regions, and thus the sampling is less exhaustive than the systematic sampling by PIPER. The method periodically rebuilds the complete set of interface side chains, followed by the optimization of the rigid body displacement. The energy is locally minimized in every iteration cycle of a Monte Carlo search algorithm (<xref ref-type="bibr" rid="bib18">Gray et al., 2003</xref>), and since the clashes are continuously removed, RosettaDock can use an energy function that is more sensitive to small changes in the coordinates than the energy function used in PIPER. Accordingly, Panels A and B of <xref ref-type="fig" rid="fig3 fig4">Figures 3 and 4</xref> display somewhat different shapes of the energy distributions around the native state placed at the center of the coordinate system. Using rigid structures without local minimization, the minimum of the PIPER energy may be somewhat shifted from the native state, resulting in a more skewed energy landscape than the one obtained with RosettaDock, which generally places the energy minimum closer to the native structure and hence has a more symmetric energy landscape. In view of the differences between the two energy functions we consider it important that the PCA analyses of low energy structures generated by either PIPER or RosettaDock yield similar distributions of the eigenvalues for all 42 complexes. For each complex, both programs result in two small eigenvalues <italic>λ</italic><sub>5</sub> and <italic>λ</italic><sub>4</sub>. Although these eigenvalues are generally somewhat smaller for PIPER, because the rigid body approximation leads to a steeper increase in energy as we move away from the minimum along the most restrictive direction, both programs clearly indicate the existence of a restrictive subspace. In addition, Monte Carlo studies, described in the ‘Materials and methods’, show that the restrictive subspaces predicted PIPER and RosettaDock are fairly similar. The similarity of these subspaces obtained by two very different energy functions for all 42 complexes indicates that the reduction of dimensionality is an inherent property of protein–protein association. Both programs predict that, on the other end of the spectrum, the two largest eigenvalues, <italic>λ</italic><sub>1</sub> and <italic>λ</italic><sub>2</sub>, together exceed 75% of the total variance for most complexes. Thus, in a neighborhood of the native state the encounter complexes are essentially restricted to a two dimensional permissive subspace in the rotational/translational space, and this conclusion is independent of the docking program used.</p></sec></sec><sec id="s3" sec-type="discussion"><title>Discussion</title><sec id="s3-1"><title>Generation of encounter complexes by docking</title><p>Assuming moderate conformational changes and using grid approximation, the FFT based global and systematic sampling of the configurational space of two interacting proteins using a physics based energy function converts the docking problem into an exactly solvable problem of statistical mechanics (<xref ref-type="bibr" rid="bib23">Kozakov et al., 2013</xref>). According to the CAPRI community-wide protein–protein docking experiment, this type of approximation gives good results for a large fraction of complexes (<xref ref-type="bibr" rid="bib28">Lensink and Wodak, 2013</xref>). However, it has been well known that, for most protein pairs, such global search yields low energy structures in several regions of the conformational space, some of which are far from the structure of the native complex. Physics-based energy functions are expected to be globally valid for modeling interactions between proteins, including the non-native states. Thus, one can assume the energy values that are low relative to the average energy but still exceed the energy at the global minimum may lead to the formation of relatively short-lived encounter complexes along the association pathways. As shown in this paper, the agreement between experimental PRE data and theoretical PRE profiles calculated from the ensemble of structures generated by docking confirms this hypothesis, and thus structures of encounter complexes can be obtained simply as byproducts of docking without any further computational expense. While this result is not unexpected, in view of the limited structural information available on encounter complexes it is potentially significant.</p></sec><sec id="s3-2"><title>Identification of encounter complexes using PRE</title><p>To detect intermediate structures in the association of proteins EIN and HPr, paramagnetic labels were introduced at two sites on HPr, one at a time, and the transverse paramagnetic relaxation enhancement (PRE) rates, <italic>Γ</italic><sub>2</sub>, of the backbone amide protons (<sup>1</sup>H<sub>N</sub>) of EIN were measured. Since the population of the intermediate structures is generally much lower than the population of the native complex, it is important to discuss why PRE can detect the presence of encounter complexes. The major factor is that the magnitude of the PREs is proportional to < r<sup>−6</sup>>, where r is the distance between the nucleus of interest and the paramagnetic center, and <> denotes averaging over the ensemble of structures. Due to the large magnetic moment of an unpaired electron, the effect is detectable for sizeable separations (up to ∼34 Å for Mn<sup>2+</sup>). A hypothetical example can be used to explain why the method can detect states with very low populations. We consider an ensemble that includes a major species A with the population, <italic>p</italic><sub><italic>A</italic></sub>, of 99%, and with a paramagnetic center to proton distance of 30 Å, and a minor species B with the population, p<sub>B</sub>, of 1%, and with a paramagnetic center to proton distance of 8 Å. We calculate <italic>Γ</italic><sub>2</sub> for this proton in a two-site exchange system between A and B, where <italic>Γ</italic><sub>2</sub> is defined as the difference in the transverse relaxation rates of the paramagnetic and diamagnetic states (<xref ref-type="bibr" rid="bib19">Iwahara and Clore, 2006</xref>). For a ∼30-kDa complex, for species A the <sup>1</sup>H-<italic>Γ</italic><sub>2</sub> arising from Mn<sup>2+</sup> is ∼2 s<sup>−1</sup> (<italic>Γ</italic><sub>2,A</sub>), and for species B it is ∼5.6 × 10<sup>3</sup> s<sup>−1</sup> (<italic>Γ</italic><sub>2,B</sub>). Considering B as a short-lived encounter complex and A as the native state, and assuming that the system is in the fast exchange regime, the apparent PRE rate, <italic>Γ</italic><sub>2</sub>, is the population weighted average of the <italic>Γ</italic><sub>2</sub> rates of the two species, that is, <italic>Γ</italic><sub>2</sub> = <italic>p</italic><sub><italic>A</italic></sub> <italic>Γ</italic><sub>2,A</sub> + <italic>p</italic><sub><italic>B</italic></sub> <italic>Γ</italic><sub>2,B</sub> (<xref ref-type="bibr" rid="bib19">Iwahara and Clore, 2006</xref>). Based on this expression <italic>Γ</italic><sub>2</sub> is ∼30-fold larger than <italic>Γ</italic><sub>2,A</sub>, thereby permitting one to both infer the presence of, and obtain some structural information on, the minor species, because the PRE is a highly distance-dependent quantity. Thus, according to this simple explanation, the PREs can clearly capture the footprint of minor species that exchange rapidly with the native complex, in spite of their much lower concentration.</p><p>In a realistic protein–protein association the PRE rate, <italic>Γ</italic><sub>2</sub>, is the population weighted average of the <italic>Γ</italic><sub>2</sub> rates over the native state and the entire ensemble of encounter complexes. The strong distance dependence of <italic>Γ</italic><sub>2</sub> implies that the observed values are sensitive even to small conformational changes that may occur, for example, due to changes in the rotameric state of the EDTA-Mn<sup>2+</sup> paramagnetic probe. Thus, as shown in <xref ref-type="fig" rid="fig2">Figure 2</xref>, the PRE data, while sensitive to the presence of minor species, are also fairly noisy (‘Materials and methods’). In spite of their substantial variance, the data are informative, since PREs generally also occur at residues that are far from the paramagnetic label in the native complex but are getting closer to it in some members of the encounter ensemble, clearly indicating the presence of non-native transition states. As the examples studied in this paper show, the minor species can be better detected if the label is far from the interface. In fact, a label placed close to interface generates a strong PRE signal, and thus the PRE profile back-calculated from the native structure already correlates well with the data. However, accounting for the encounter complex ensemble most likely improves the prediction even in such cases, but the improvement is generally smaller than the one with the paramagnetic label placed far from the interface.</p></sec><sec id="s3-3"><title>Reduction of dimensionality in protein–protein association</title><p>The reduction of dimensionality in molecular association was originally proposed to explain high binding rates (<xref ref-type="bibr" rid="bib48">von Hippel and Berg, 1989</xref>), particularly the ability of proteins to locate their target sites along DNA (<xref ref-type="bibr" rid="bib34">Riggs et al., 1970</xref>). Dimensionality reduction is caused by interaction forces that are non-specific and thus do not lead to binding at a specific site, but keep the macromolecules in proximity for a prolonged time, allowing an extensive search of the surface along certain directions while restraining the search along others (<xref ref-type="bibr" rid="bib46">Ubbink, 2009</xref>). This is clearly the case for DNA, whose negative charge attracts positively charged proteins without providing a specific interaction site (<xref ref-type="bibr" rid="bib21">Iwahara et al., 2006</xref>; <xref ref-type="bibr" rid="bib16">Gorman and Greene, 2008</xref>). It is well known that long-range electrostatic interactions can also increase the rates of association of two proteins with net opposite charges or with strong charge dipoles, as the search for the reactive patches is facilitated by dipolar pre-orientation of the proteins upon their approach (<xref ref-type="bibr" rid="bib35">Schreiber et al., 2009</xref>). Such charge interactions prolong the lifetime of the transition state and increase the fraction of productive complexes, and thus can reduce dimensionality. However, it is frequently assumed that, due to specific charge–charge interactions and their irregular surface, proteins do not have ensembles of orientations having similar energies and thus allowing for search along the surface. We have shown here that this is definitely not the case because the energy landscape of interacting proteins, at least within the 10 Å IRMSD neighborhood of the native state, always includes a permissive subspace along which the conformation of the complex can substantially change without crossing significant energy barriers. Thus, there is no reason to assume that the interactions are nonspecific in protein-DNA association but are specific when two proteins associate. In fact, for all 42 protein pairs, some of which have strong electrostatic interactions, the energy landscape is smooth funnel in a two dimensional permissive subspace. In all cases this subspace captures at least 75% of the total motion as the two molecules approach the native state. For each of the 42 complexes we also detect a high energy subspace, which reduces the dimensionality of the space available to encounter complexes along the association pathways. Thus, there is much less difference between protein-DNA and protein–protein association than it was previously believed.</p><p>Finally we note that the reduced dimensionality of the search space can potentially simplify docking calculations, and thus the results of PCA provide several opportunities for improving the efficiency of docking methods. First, it is well known that any type of optimization is more efficient along the principal components, as large steps can be taken along the permissive directions. This is particularly the case for second-order methods such as the Newton–Raphson optimization that uses a local quadratic approximation of the energy function to find the next minimum in each iteration (<xref ref-type="bibr" rid="bib14">Fletcher, 1981</xref>). It is also important that such methods require the inversion of the Hessian matrix of the energy function, and in the case of reduced dimensionality the matrix is nearly singular, leading to numerical difficulties and loss of accuracy. Once such directions are known, the problem can be avoided by regularization methods (<xref ref-type="bibr" rid="bib14">Fletcher, 1981</xref>). In fact, after developing and testing a medium-range optimization method SDU, which employs quadratic semi-definite underestimation in the 5D angular space with the exponential parameters also used in this work (<xref ref-type="bibr" rid="bib37">Shen et al., 2008</xref>), we understood that the approach can be made more efficient by accounting for the reduced dimensionality of the search space and adding regularization based on PCA. Another potential use is optimally selecting perturbation vectors using the relative magnitudes of the eigenvalues in biased Monte Carlo methods (<xref ref-type="bibr" rid="bib27">Lee et al., 1996</xref>).</p></sec></sec><sec id="s4" sec-type="materials|methods"><title>Materials and methods</title><sec id="s4-1"><title>Global sampling by the Fast Fourier transform (FFT) correlation approach</title><p>In order to fully explore the conformational space in protein–protein association we perform exhaustive evaluation of an energy function in the discretized space of mutual orientations of the two proteins using the docking program PIPER, which is based on the Fast Fourier transform (FFT) correlation approach (<xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>). The center of mass of the first protein, defined here as the receptor, is fixed at the origin of the coordinate system, whereas the second protein (usually the smaller of the two), defined as the ligand, is rotated and translated. The translational space is represented as a grid of 1.0 Å displacements of the ligand center of mass, and the rotational space is sampled using 70,000 rotations based on a deterministic layered Sukharev grid sequence, which quasi-uniformly covers the space. The energy expression used for the FFT based sampling includes simplified van der Waals energy E<sub>vdw</sub> with attractive (E<sub>attr</sub>) and repulsive (E<sub>rep</sub>) contributions, the electrostatic interaction energy E<sub>elec</sub>, and a statistical pairwise potential Epair, representing other solvation effects (<xref ref-type="bibr" rid="bib8">Chuang et al., 2008</xref>):<disp-formula id="equ1"><mml:math id="m1"><mml:mrow><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>v</mml:mi><mml:mi>d</mml:mi><mml:mi>w</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>w</mml:mi><mml:mn>2</mml:mn></mml:msub><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>e</mml:mi><mml:mi>l</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>w</mml:mi><mml:mn>3</mml:mn></mml:msub><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>p</mml:mi><mml:mi>a</mml:mi><mml:mi>i</mml:mi><mml:mi>r</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></disp-formula></p><p>The individual energy terms are calculated by the <inline-formula><mml:math id="inf1"><mml:mrow><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>v</mml:mi><mml:mi>d</mml:mi><mml:mi>w</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>t</mml:mi><mml:mi>r</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>w</mml:mi><mml:mn>1</mml:mn></mml:msub><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>p</mml:mi></mml:mrow></mml:msub><mml:mtext>, </mml:mtext><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>e</mml:mi><mml:mi>l</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:msub><mml:mo>∑</mml:mo><mml:mi mathvariant="normal">i</mml:mi></mml:msub><mml:mrow><mml:mstyle displaystyle="true"><mml:msub><mml:mo>∑</mml:mo><mml:mi mathvariant="normal">j</mml:mi></mml:msub><mml:mrow><mml:mrow><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:mrow><mml:mrow><mml:msub><mml:mi>q</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:msub><mml:mi>q</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mo>/</mml:mo><mml:mrow><mml:msup><mml:mrow><mml:mrow><mml:mrow><mml:mo>{</mml:mo><mml:mrow><mml:msup><mml:mi>r</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msup><mml:mi>D</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mtext> </mml:mtext><mml:mi>exp</mml:mi><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mrow><mml:mrow><mml:mo>−</mml:mo><mml:msup><mml:mi>r</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mo>/</mml:mo><mml:mrow><mml:mn>4</mml:mn><mml:msup><mml:mi>D</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mrow><mml:mo>}</mml:mo></mml:mrow></mml:mrow></mml:mrow><mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>/</mml:mo><mml:mn>2</mml:mn></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mrow></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mrow></mml:mrow></mml:mstyle></mml:mrow></mml:mstyle></mml:mrow></mml:math></inline-formula>, and <italic>E</italic><sub><italic>pair</italic></sub> <italic>=</italic> Σ<sub>i</sub> Σ<sub>j</sub> ε<sub>ij</sub>, where <italic>r</italic> is the distance between atoms <italic>i</italic> and <italic>j</italic>, <italic>D</italic> is an atom-type independent approximation of the generalized Born radius, and <italic>ε</italic><sub><italic>ij</italic></sub> is a pairwise interaction potential between atoms <italic>i</italic> and <italic>j</italic>. All energy expressions are defined on the grid. The coefficients <italic>w</italic><sub><italic>1</italic></sub> = 4, <italic>w</italic><sub><italic>2</italic></sub> = 600, <italic>w</italic><sub><italic>3</italic></sub> = 5, weight the different contributions to the scoring function, and are based on calorimetric considerations. In order to evaluate the energy function <italic>E</italic> by FFT, it must be written as a sum of correlation functions. The first two terms, <italic>E</italic><sub><italic>vdw</italic></sub> and <italic>E</italic><sub><italic>elec</italic></sub>, satisfy this condition, whereas <italic>E</italic><sub><italic>pair</italic></sub> is written as a sum of a few correlation functions, using an eigenvalue-eigenvector decomposition (<xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>). For each rotation, this expression can be efficiently calculated using <italic>P</italic> forward and one inverse Fast Fourier transforms. The calculations are performed for each of the 70,000 rotations, and one or several lowest energy translations for each rotation are retained. The results are clustered with a 10 Å IRMSD radius around the native coordinate.</p></sec><sec id="s4-2"><title>Generating encounter complexes</title><p>Unbound structures were used both for the receptor, EIN (chain A from PDB (<xref ref-type="bibr" rid="bib2">Berman et al., 2000</xref>) entry 1ZYM) and for the ligand, HPr (chain P from PDB entry 2JEL). Encounter complexes were generated using the global systematic Fast Fourier Transform based docking program PIPER (<xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>). The docking was performed with each of the three conformers of EDTA-Mn<sup>2+</sup> group, both at positions E5C and E32C of HPr (<xref ref-type="bibr" rid="bib13">Fawzi et al., 2010</xref>). For each conformer, the 10,000 lowest energy complex structures were retained for the calculation of PRE rates.</p></sec><sec id="s4-3"><title>Transverse paramagnetic relaxation enhancement (PRE) rate calculation</title><p>To calculate the transverse PRE rates (<italic>Γ</italic><sub>2</sub>) from the ensemble of encounter complexes generated by the FFT based sampling we use the <italic>N</italic><sub>st</sub> = 30,000 (10,000 for each of the three conformers of EDTA-Mn<sup>2+</sup>) lowest energy structures. The observed PRE values are the PRE rates averaged over a population (<xref ref-type="bibr" rid="bib20">Iwahara et al., 2004</xref>; <xref ref-type="bibr" rid="bib44">Tang et al., 2006</xref>), and hence<disp-formula id="equ2"><mml:math id="m2"><mml:mrow><mml:mo><</mml:mo><mml:msub><mml:mi>Γ</mml:mi><mml:mn>2</mml:mn></mml:msub><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mi mathvariant="normal">i</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>></mml:mo><mml:mo>=</mml:mo><mml:mrow><mml:mrow><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mstyle displaystyle="true"><mml:msub><mml:mo>∑</mml:mo><mml:mi mathvariant="normal">j</mml:mi></mml:msub><mml:mrow><mml:msub><mml:mi>Γ</mml:mi><mml:mrow><mml:mi mathvariant="normal">ji</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mstyle></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mrow><mml:mo>/</mml:mo><mml:mrow><mml:msub><mml:mi mathvariant="normal">N</mml:mi><mml:mrow><mml:mi mathvariant="normal">st</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mrow></mml:mrow></mml:math></disp-formula>where <italic>Γ</italic><sub>ji</sub> is the PRE rate for residue <italic>i</italic> of the <italic>j</italic>th structure in the ensemble. Each individual <italic>Γ</italic><sub>ji</sub> value is proportional to the inverse sixth power of distance <italic>r</italic><sub>ij</sub> between the backbone amide proton (directly bonded to <sup>15</sup>N) of the <italic>i</italic>th residue and the paramagnetic ion Mn<sup>2+</sup>. To account for magnetic trap flexibility, we use the three state EDTA-Mn<sup>2+</sup> Solomon-Bloembergen approximation (<xref ref-type="bibr" rid="bib20">Iwahara et al., 2004</xref>; <xref ref-type="bibr" rid="bib44">Tang et al., 2006</xref>). With these assumptions the PRE rates are given by <italic>Γ</italic><sub>ji</sub> = <italic>C</italic> × <italic>Σ</italic><sub>k</sub> (<italic>r</italic><sub>ikj</sub>)<sup>−6</sup>, where <italic>C</italic> = 1.2 × 10<sup>10</sup> Å<sup>6</sup>/<italic>s</italic> and <italic>r</italic><sub>ikj</sub> is the distance between residue <italic>i</italic> and the <italic>k</italic>th state of EDTA-Mn<sup>2+</sup> in the <italic>j</italic>th structure in the low energy ensemble of docked configurations. The <italic>Γ</italic><sub>ji</sub> values are limited to 90s<sup>−1</sup>,that is, <italic>Γ</italic><sub>ji</sub> = 90 if <italic>Γ</italic><sub>ji</sub> ≥ 90. Introducing this threshold is based on the observation that both theoretical and experimental <italic>Γ</italic><sub>ji</sub> values become very uncertain over this threshold because small distance variations strongly affect the result (<xref ref-type="bibr" rid="bib22">Kim et al., 2008</xref>; <xref ref-type="bibr" rid="bib13">Fawzi et al., 2010</xref>).</p></sec><sec id="s4-4"><title>Sampling by Monte Carlo minimization</title><p>The free energy landscape near the native complex was explored using both PIPER, based on the Fast Fourier transform (FFT) correlation approach (<xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>) and RosettaDock, a docking program based on the Monte Carlo minimization (MCM) algorithm (<xref ref-type="bibr" rid="bib18">Gray et al., 2003</xref>). In each MCM cycle, RosettaDock perturbs the position of the ligand by random translations and rotations, followed by adjusting the distance between the ligand and receptor to create a contact. Next, a fast MCM at low resolution optimizes the complex orientation with respect to features that do not depend on the explicit conformations of the side chains. Finally, the side chains are added, and an all-atom optimization locates the local minimum energy conformation. The complete set of interface side chains is repacked every eight cycles, followed by the optimization the rigid body displacement. After each move, side chain packing, and minimization, an energy score is calculated. The new position is kept or rejected according to the standard Metropolis acceptance criterion (<xref ref-type="bibr" rid="bib18">Gray et al., 2003</xref>). RosettaDock uses a detailed energy function which includes van der Waals interactions with a linear term serving as the repulsive part, a solvation term based on a pairwise Gaussian solvent exclusion model, hydrogen bonding energies using an orientation-dependent empirical function, a rotamer probability term, residue–residue atom pair interactions for charged residues, and a simple electrostatic term across the protein–protein interface.</p></sec><sec id="s4-5"><title>Parameterizing the conformational space</title><p>The origin of the reference frame is placed at the center of the receptor, and the <italic>z</italic>-axis is directed toward the center of the interface of the native conformation. The translation of the ligand is described by the vector from the center of the receptor to the center of the ligand interface (as opposed to the center of the ligand), and the rotation of the ligand is also defined around the center of its interface. This choice is made to decouple, as much as possible, the effects of translation on the locations of the interface atoms from those of the rotation. A translation vector <bold><italic>y</italic></bold> ∈ <italic>R</italic><sup>3</sup> can be represented by a triplet (<italic>r,θ,φ</italic>), where <italic>r</italic> = <italic>||</italic><bold><italic>y</italic></bold><italic>||</italic> is the distance, <italic>θ</italic> is the azimuth angle between the projection of <bold><italic>y</italic></bold> on the <italic>xy</italic>-plane and the <italic>x</italic>-axis (longitude, 0 ≤ <italic>θ</italic> < 2π), and <italic>φ</italic> is the zenith angle between the <italic>z</italic>-axis and the vector <bold><italic>y</italic></bold> (colatitude, 0 ≤ <italic>φ</italic> < π). As will be discussed, we consider <italic>r</italic> separately, and focus on selecting appropriate parameterizations for <italic>(θ,φ</italic>) compounded with the rotational space <italic>SO(3).</italic></p><p>Parameterizing rotations is problematic because rotations are non-Euclidean in nature (i.e., travelling infinitely far in any direction will bring you back to your starting point an infinite number of times). Any attempt to parameterize the entire set of three degrees-of-freedom (DOF) rotations by an open subset of Euclidean space (as do Euler angles) will suffer from gimbal lock, the loss of rotational degrees of freedom, due to singularities in the parameter space (<xref ref-type="bibr" rid="bib17">Grassia, 1998</xref>). Parameterizations that are themselves defined over non-Euclidean spaces (such as the set of unit quaternions embedded in R<sup>4</sup>) may remain singularity-free, and thus avoid gimbal lock. Employing such parameterizations is complicated, however, since the numerical tools such as optimization and PCA assume Euclidean parameterizations; therefore we must either develop new tools whose domains are non-Euclidean, or complicate our systems by imposing explicit constraints, for example, to assure that the quaternions stay on the unit sphere (<xref ref-type="bibr" rid="bib17">Grassia, 1998</xref>). In this paper we use <italic>exponential maps</italic> (<xref ref-type="bibr" rid="bib32">Park, 1995</xref>; <xref ref-type="bibr" rid="bib33">Park and Ravani, 1997</xref>; <xref ref-type="bibr" rid="bib37">Shen et al., 2008</xref>) to project an Euclidean space onto the nonlinear rotational space. As an example, the simplest exponential map defines a local one-to-one correspondence between the unit circle, which is a nonlinear space (called the circle group), centered at 0 in the complex plane, and the tangent space at 1, which can be identified with the imaginary line in the complex plane. The exponential map for the circle group is given by <italic>it → e</italic><sup><italic>it</italic></sup>, where <italic>i</italic> = √(−1)<italic>, it</italic> specifies a point on the tangent line, and the exponential function projects it into the corresponding point of the circle (<xref ref-type="fig" rid="fig5">Figure 5A</xref>). Extending the map to three dimensions, the exponential map projecting the tangent plain of a 3D sphere onto the surface of the sphere is shown in <xref ref-type="fig" rid="fig5">Figure 5B</xref>.<fig id="fig5" position="float"><object-id pub-id-type="doi">10.7554/eLife.01370.019</object-id><label>Figure 5.</label><caption><title>Examples of simple exponential maps.</title><p>(<bold>A</bold>) Parameterization of the unit circle using an exponential map. The function <italic>e</italic><sup><italic>it</italic></sup> is a local one-to-one mapping of the tangent line around p = 1 onto the unit circle. (<bold>B</bold>) Prameterization of the 3D unit sphere using exponential parameters.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.01370.019">http://dx.doi.org/10.7554/eLife.01370.019</ext-link></p></caption><graphic xlink:href="elife01370f005"/></fig></p><p>For <italic>(θ,φ</italic>) the exponential coordinates are (<italic>σ</italic><sub>1</sub>,<italic>σ</italic><sub>2</sub>) = (-<italic>φ</italic> sin<italic>θ, φ</italic> cos<italic>θ</italic>). For <italic>SO(3),</italic> the exponential coordinates are <bold><italic>ω</italic></bold> = (<italic>ω</italic><sub><italic>1</italic></sub><italic>, ω</italic><sub><italic>2</italic></sub><italic>, ω</italic><sub><italic>3</italic></sub>) ∈ <italic>R</italic><sup>3</sup>, where <italic>ω</italic><sub><italic>1</italic></sub><italic>, ω</italic><sub><italic>2</italic></sub>, and <italic>ω</italic><sub><italic>3</italic></sub> are elements of a skew-symmetric matrix (<xref ref-type="bibr" rid="bib32">Park, 1995</xref>; <xref ref-type="bibr" rid="bib37">Shen et al., 2008</xref>; <xref ref-type="bibr" rid="bib30">Mirzaei et al., 2012</xref>)<italic>.</italic> The vector (<italic>σ</italic><sub><italic>1</italic></sub><italic>, σ</italic><sub><italic>2</italic></sub><italic>, ω</italic><sub><italic>1</italic></sub><italic>, ω</italic><sub><italic>2</italic></sub><italic>, ω</italic><sub><italic>3</italic></sub>) defines the relative orientation of the two rigid proteins. Once this relative orientation is given, the binding distance <italic>r</italic> along the translation vector <bold><italic>y</italic></bold> (which connects the centers of the receptor with the center of the ligand’s interface) is determined by the assumptions that the two proteins are in contact but do not overlap (<xref ref-type="bibr" rid="bib37">Shen et al., 2008</xref>). Complexes generated by the docking methods used in this work always have this property. In particular, given a complex structure generated by the FFT sampling approach PIPER (<xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>), we can uniquely determine the corresponding (<italic>σ</italic><sub><italic>1</italic></sub><italic>, σ</italic><sub><italic>2</italic></sub><italic>, ω</italic><sub><italic>1</italic></sub><italic>, ω</italic><sub><italic>2</italic></sub><italic>, ω</italic><sub><italic>3</italic></sub>) coordinates and the value of <italic>r.</italic> Since RosettaDock (<xref ref-type="bibr" rid="bib18">Gray et al., 2003</xref>) generally changes the conformations of the component proteins, to isolate the rigid body motion we have to fit the initial protein structures to the complex and determine the closest rigid body transformation, projecting the higher dimensional motion into the rotational-translational space.</p><sec id="s4-5-1"><title>Sampling the near-native region and principal component analysis</title><p>We sample energy values in a sphere in the 5D parameter space around the point (0, 0, 0, 0, 0), which corresponds to the native conformation. Since we all five coordinates are angles, the radius of the sphere is also defined as an angle, and we used 22.5° as the radius, which roughly translates into a radius of 10 Å IRMSD neighborhood for relatively small proteins. After the FFT based sampling using the PIPER program (<xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>) we selected 5000 structures, uniformly distributed within this sphere. Conformations with more than 10 Å IRMSD from the native structure were discarded, resulting in about 4000 structures. RosettaDock (<xref ref-type="bibr" rid="bib18">Gray et al., 2003</xref>) was used to generate 2000 structures within the 10 Å IRMSD radius. After sampling we normalized the 5D coordinates to ensure that the variances in the sample set are the same along each coordinate axis, replacing each vector (<italic>σ</italic><sub><italic>1</italic></sub><italic>, σ</italic><sub><italic>2</italic></sub><italic>, ω</italic><sub><italic>1</italic></sub><italic>, ω</italic><sub><italic>2</italic></sub><italic>, ω</italic><sub><italic>3</italic></sub>) with its normalized version (<italic>x</italic><sub><italic>1</italic></sub><italic>, x</italic><sub><italic>2</italic></sub><italic>, x</italic><sub><italic>3</italic></sub><italic>, x</italic><sub><italic>4</italic></sub><italic>, x</italic><sub><italic>5</italic></sub>). The use of such normalized coordinates removed the potential differences in the scaling of the initial angular parameters, and also rendered the results less dependent on the relative sizes of the two component proteins. For each of the two scoring functions, principal component analysis (PCA) was applied to the so-called ‘most favorable’ conformations whose energy values were below a certain threshold, for example, in the lowest 5% for the FFT-based sampling data. Let N denote the number of such favorable structures. The normalized coordinates (<italic>x</italic><sub><italic>1</italic></sub><italic>, x</italic><sub><italic>2</italic></sub><italic>, x</italic><sub><italic>3</italic></sub><italic>, x</italic><sub><italic>4</italic></sub><italic>, x</italic><sub><italic>5</italic></sub>) of the <italic>N</italic> structures were arranged into a <italic>N</italic>-by-5 matrix <bold>X</bold>, where each row represented a conformation. The PCA analysis computed the eigenvalues and eigenvectors of the covariance matrix</p><p><bold><italic>(X</italic></bold><italic>–μ</italic><sub><italic>X</italic></sub><bold><italic>)</italic></bold><italic>’</italic><bold><italic>(X</italic></bold><italic>–μ</italic><sub><italic>X</italic></sub><bold><italic>)</italic></bold>, where <italic>μ</italic><sub><italic>X</italic></sub> is the sample mean and prime denotes transpose. We sorted the eigenvalues in descending order and normalized them such that their sum equaled 1.0 (100%). The results were denoted by <italic>λ</italic><sub><italic>1</italic></sub><italic>,…, λ</italic><sub><italic>5</italic></sub>, and <bold><italic>v</italic></bold><sub><italic>1</italic></sub><italic>,…,</italic> <bold><italic>v</italic></bold><sub><italic>5</italic></sub> denote the corresponding eigenvectors, which are mutually orthogonal.</p></sec></sec><sec id="s4-6"><title>Further validation of the energy landscape</title><p>Since small eigenvalues identified by PCA might also occur by chance due to undersampling a subspace, we performed a simple Monte Carlo analysis to show that this is not the case. PCA was based on at least 100 low energy structures for each of the 42 complexes, and thence we generated 100 random vectors in the 5D space, applied PCA to derive the eigenvalues, and performed this experiment 1000 times. Results confirmed that the probability of λ<sub>5</sub> < 10% is less than 0.01. Thus, in view of the large number of sample points we used, it is very unlikely that the small eigenvalues shown in <xref ref-type="table" rid="tbl1">Table 1</xref> occur due to undersampling.</p><p>The PCA analyses of the 5D exponential coordinates of the low energy complex conformations show clear distinctions between permissive and restrictive directions in all 42 cases. The rigid FFT-based method (<xref ref-type="bibr" rid="bib24">Kozakov et al., 2006</xref>) and the Monte Carlo approach in RosettaDock (<xref ref-type="bibr" rid="bib18">Gray et al., 2003</xref>) yield similar results, in spite of the fact that two methods implement fundamentally different sampling and scoring schemes. To perform a rigorous comparison of the results from the two methods we introduce the notations <italic>λ</italic><sub>1P</sub>, . . . , <italic>λ</italic><sub>5P</sub> and <italic>λ</italic><sub>1R</sub>, . . . , <italic>λ</italic><sub>5R</sub> for the eigenvalues based on the low energy structures generated by, respectively, PIPER and RosettaDock. Both sets of eigenvalues are ordered in descending magnitude, and <bold><italic>v</italic></bold><sub>1P</sub>,...,<bold><italic>v</italic></bold><sub>5P</sub> and <bold><italic>v</italic></bold><sub>1R</sub>,...,<bold><italic>v</italic></bold><sub>5R</sub> denote the corresponding eigenvectors. Since our main goal is to show that the restrictive subspace is largely independent of the method used, as a measure of discrepancy we will determine the angle between the restrictive subspace spanned by eigenvectors <bold><italic>v</italic></bold><sub>4P</sub> and <bold><italic>v</italic></bold><sub>5P</sub> based on PIPER, and the subspace spanned by <bold><italic>v</italic></bold><sub>4R</sub> and <bold><italic>v</italic></bold><sub>5R</sub> based on RosettaDock. As shown in the last column of <xref ref-type="table" rid="tbl1">Table 1</xref>, this angle is less than or equals to 30° for all but 5 of the complexes. Accepting that the restrictive subspaces match if they differ by less than 30° seems to be a somewhat relaxed condition. However, it is easy to show by Monte Carlo simulations that the probability of such agreement by chance for 37 of the 42 structures is negligibly small. We applied PCA to two sets of 100 random vectors in 5D, calculated the covariance matrix and its eigenvalues, for each set we selected the subspace spanned by eigenvectors corresponding to the two smallest eigenvalues, and finally determined the angle between these two ‘restrictive’ subspaces. By repeating this calculation 1000 times we could show that the probability of obtaining an angle below 30° is p=0.131. Although this is not a very small number, the probability that this occurs for 37 of the 42 complexes is less than 10<sup>−22</sup>. Thus, the results overwhelmingly support the claim that the restrictive directions found by two very different methods are similar, and thus the reduction in dimensionality is an inherent property of protein–protein association. Due to the orthogonality of eigenvectors, the same similarity between PIPER and RosettaDock results also applies to the permissive subspaces spanned by the first 3 eigenvectors.</p><p>Additionally we provide Figures and Videos analogous to <xref ref-type="fig" rid="fig3 fig4">Figures 3,4</xref> and <xref ref-type="other" rid="video1 video2 video3 video4">Videos 1–4</xref> for all 42 complexes studied in this paper (<xref ref-type="bibr" rid="bib26">Kozakov et al., 2014</xref>).</p></sec></sec></body><back><sec sec-type="additional-information"><title>Additional information</title><fn-group content-type="competing-interest"><title>Competing interests</title><fn fn-type="conflict" id="conf1"><p>DK: Owns stock in Acpharis Inc which licensed FFT based sampling program PIPER for commerical use.</p></fn><fn fn-type="conflict" id="conf2"><p>DRH: Owns stock in Acpharis Inc which licensed FFT based sampling program PIPER for commerical use.</p></fn><fn fn-type="conflict" id="conf3"><p>DB: Owns stock in Acpharis Inc which licensed FFT based sampling program PIPER for commerical use.</p></fn><fn fn-type="conflict" id="conf4"><p>SV: Owns stock in Acpharis Inc which licensed FFT based sampling program PIPER for commerical use. However PIPER is free for academic and govermental research.</p></fn><fn fn-type="conflict" id="conf5"><p>The other authors declare that no competing interests exist.</p></fn></fn-group><fn-group content-type="author-contribution"><title>Author contributions</title><fn fn-type="con" id="con1"><p>DK, Conception and design, Acquisition of data, Analysis and interpretation of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con2"><p>KL, Conception and design, Acquisition of data, Analysis and interpretation of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con3"><p>DRH, Conception and design, Acquisition of data, Analysis and interpretation of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con4"><p>DB, Conception and design, Drafting or revising the article</p></fn><fn fn-type="con" id="con5"><p>PV, Conception and design, Drafting or revising the article</p></fn><fn fn-type="con" id="con6"><p>OS-F, Conception and design, Drafting or revising the article</p></fn><fn fn-type="con" id="con7"><p>ICP, Conception and design, Drafting or revising the article</p></fn><fn fn-type="con" id="con8"><p>GMC, Conception and design, Drafting or revising the article</p></fn><fn fn-type="con" id="con9"><p>JZ, Acquisition of data, Analysis and interpretation of data</p></fn><fn fn-type="con" id="con10"><p>SV, Conception and design, Analysis and interpretation of data, Drafting or revising the article</p></fn></fn-group></sec><sec sec-type="supplementary-material"><title>Additional files</title><sec sec-type="datasets"><title>Major datasets</title><p>The following dataset was generated:</p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro1"><name><surname>Kozakov</surname><given-names>D</given-names></name>, <name><surname>Li</surname><given-names>K</given-names></name>, <name><surname>Hall</surname><given-names>D</given-names></name>, <name><surname>Beglov</surname><given-names>D</given-names></name>, <name><surname>Zheng</surname><given-names>J</given-names></name>, <name><surname>Vakili</surname><given-names>P</given-names></name>, <name><surname>Schueler-Furman</surname><given-names>O</given-names></name>, <name><surname>Paschalidis</surname><given-names>I</given-names></name>, <name><surname>Clore</surname><given-names>G</given-names></name>, <name><surname>Vajda</surname><given-names>S</given-names></name>, <year>2014</year><x>, </x><source>Data from: Encounter complexes and dimensionality reduction in protein–protein association</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.5061/dryad.98n8c">10.5061/dryad.98n8c</ext-link><x>, </x><comment>Publicly available at Dryad (<ext-link ext-link-type="uri" xlink:href="http://datadryad.org/">http://datadryad.org/</ext-link>).</comment></related-object></p><p>The following previously published dataset was used:</p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro2"><name><surname>Hwang</surname><given-names>H</given-names></name>, <name><surname>Vreven</surname><given-names>T</given-names></name>, <name><surname>Chen</surname><given-names>R</given-names></name>, <name><surname>Mintseris</surname><given-names>J</given-names></name>, <name><surname>Janin</surname><given-names>J</given-names></name>, <name><surname>Weng</surname><given-names>Z</given-names></name>, <year>2012</year><x>, </x><source>Protein Docking Benchmark</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://zlab.umassmed.edu/zdock/benchmark.shtml">http://zlab.umassmed.edu/zdock/benchmark.shtml</ext-link><x>, </x><comment>Openly available at <ext-link ext-link-type="uri" xlink:href="http://zlab.umassmed.edu/zdock/benchmark.shtml">http://zlab.umassmed.edu/zdock/benchmark.shtml</ext-link>.</comment></related-object></p></sec></sec><ref-list><title>References</title><ref id="bib1"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bashir</surname><given-names>Q</given-names></name><name><surname>Volkov</surname><given-names>AN</given-names></name><name><surname>Ullmann</surname><given-names>GM</given-names></name><name><surname>Ubbink</surname><given-names>M</given-names></name></person-group><year>2010</year><article-title>Visualization of the encounter ensemble of the transient electron transfer complex of cytochrome c and cytochrome c peroxidase</article-title><source>Journal of the American Chemical Society</source><volume>132</volume><fpage>241</fpage><lpage>247</lpage><pub-id pub-id-type="doi">10.1021/Ja9064574</pub-id></element-citation></ref><ref id="bib2"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Berman</surname><given-names>HM</given-names></name><name><surname>Westbrook</surname><given-names>J</given-names></name><name><surname>Feng</surname><given-names>Z</given-names></name><name><surname>Gilliland</surname><given-names>G</given-names></name><name><surname>Bhat</surname><given-names>TN</given-names></name><name><surname>Weissig</surname><given-names>H</given-names></name><name><surname>Shindyalov</surname><given-names>IN</given-names></name><name><surname>Bourne</surname><given-names>PE</given-names></name></person-group><year>2000</year><article-title>The protein data bank</article-title><source>Nucleic Acids Research</source><volume>28</volume><fpage>235</fpage><lpage>242</lpage><pub-id pub-id-type="doi">10.1093/nar/28.1.235</pub-id></element-citation></ref><ref id="bib3"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Berg</surname><given-names>OG</given-names></name><name><surname>von Hippel</surname><given-names>PH</given-names></name></person-group><year>1985</year><article-title>Diffusion-controlled macromolecular interactions</article-title><source>Annual Review of Biophysics and Biophysical Chemistry</source><volume>14</volume><fpage>131</fpage><lpage>160</lpage><pub-id pub-id-type="doi">10.1146/annurev.bb.14.060185.001023</pub-id></element-citation></ref><ref id="bib4"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Camacho</surname><given-names>CJ</given-names></name><name><surname>Kimura</surname><given-names>SR</given-names></name><name><surname>DeLisi</surname><given-names>C</given-names></name><name><surname>Vajda</surname><given-names>S</given-names></name></person-group><year>2000</year><article-title>Kinetics of desolvation-mediated protein-protein binding</article-title><source>Biophysical Journal</source><volume>78</volume><fpage>1094</fpage><lpage>1105</lpage><pub-id pub-id-type="doi">10.1016/S0006-3495(00)76668-9</pub-id></element-citation></ref><ref id="bib5"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Camacho</surname><given-names>CJ</given-names></name><name><surname>Weng</surname><given-names>Z</given-names></name><name><surname>Vajda</surname><given-names>S</given-names></name><name><surname>DeLisi</surname><given-names>C</given-names></name></person-group><year>1999</year><article-title>Free energy landscapes of encounter complexes in protein-protein association</article-title><source>Biophysical Journal</source><volume>76</volume><fpage>1166</fpage><lpage>1178</lpage><pub-id pub-id-type="doi">10.1016/S0006-3495(99)77281-4</pub-id></element-citation></ref><ref id="bib6"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chan</surname><given-names>LSA</given-names></name><name><surname>Wells</surname><given-names>RA</given-names></name></person-group><year>2009</year><article-title>Cross-talk between PPARs and the partners of RXR: a molecular perspective</article-title><source>PPAR Research</source><volume>2009</volume><fpage>925309</fpage><pub-id pub-id-type="doi">10.1155/2009/925309</pub-id></element-citation></ref><ref id="bib7"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>R</given-names></name><name><surname>Mintseris</surname><given-names>J</given-names></name><name><surname>Janin</surname><given-names>J</given-names></name><name><surname>Weng</surname><given-names>Z</given-names></name></person-group><year>2003</year><article-title>A protein-protein docking benchmark</article-title><source>Proteins</source><volume>52</volume><fpage>88</fpage><lpage>91</lpage><pub-id pub-id-type="doi">10.1002/prot.10390</pub-id></element-citation></ref><ref id="bib8"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chuang</surname><given-names>GY</given-names></name><name><surname>Kozakov</surname><given-names>D</given-names></name><name><surname>Brenke</surname><given-names>R</given-names></name><name><surname>Comeau</surname><given-names>SR</given-names></name><name><surname>Vajda</surname><given-names>S</given-names></name></person-group><year>2008</year><article-title>DARS (Decoys as the reference state) potentials for protein-protein docking</article-title><source>Biophysical Journal</source><volume>95</volume><fpage>4217</fpage><lpage>4227</lpage><pub-id pub-id-type="doi">10.1529/biophysj.108.135814</pub-id></element-citation></ref><ref id="bib9"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Clore</surname><given-names>GM</given-names></name></person-group><year>2008</year><article-title>Visualizing lowly-populated regions of the free energy landscape of macromolecular complexes by paramagnetic relaxation enhancement</article-title><source>Molecular Biosystems</source><volume>4</volume><fpage>1058</fpage><lpage>1069</lpage><pub-id pub-id-type="doi">10.1039/B810232e</pub-id></element-citation></ref><ref id="bib10"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Clore</surname><given-names>GM</given-names></name><name><surname>Iwahara</surname><given-names>J</given-names></name></person-group><year>2009</year><article-title>Theory, practice, and applications of paramagnetic relaxation enhancement for the characterization of transient low-population states of biological macromolecules and their complexes</article-title><source>Chemical Reviews</source><volume>109</volume><fpage>4108</fpage><lpage>4139</lpage><pub-id pub-id-type="doi">10.1021/cr900033p</pub-id></element-citation></ref><ref id="bib11"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Comeau</surname><given-names>SR</given-names></name><name><surname>Kozakov</surname><given-names>D</given-names></name><name><surname>Brenke</surname><given-names>R</given-names></name><name><surname>Shen</surname><given-names>Y</given-names></name><name><surname>Beglov</surname><given-names>D</given-names></name><name><surname>Vajda</surname><given-names>S</given-names></name></person-group><year>2007</year><article-title>ClusPro: performance in CAPRI rounds 6-11 and the new server</article-title><source>Proteins</source><volume>69</volume><fpage>781</fpage><lpage>785</lpage><pub-id pub-id-type="doi">10.1002/prot.21795</pub-id></element-citation></ref><ref id="bib12"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cornilescu</surname><given-names>G</given-names></name><name><surname>Lee</surname><given-names>BR</given-names></name><name><surname>Cornilescu</surname><given-names>CC</given-names></name><name><surname>Wang</surname><given-names>GS</given-names></name><name><surname>Peterkofsky</surname><given-names>A</given-names></name><name><surname>Clore</surname><given-names>GM</given-names></name></person-group><year>2002</year><article-title>Solution structure of the phosphoryl transfer complex between the cytoplasmic A domain of the mannitol transporter IIMannitol and HPr of the <italic>Escherichia coli</italic> phoshotransferase system</article-title><source>The Journal Biological Chemistry</source><volume>277</volume><fpage>42289</fpage><lpage>42298</lpage><pub-id pub-id-type="doi">10.1074/Jbc.M207314200</pub-id></element-citation></ref><ref id="bib12a"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dill</surname><given-names>KA</given-names></name><name><surname>Chan</surname><given-names>HS</given-names></name></person-group><year>1997</year><article-title>From Levinthal to pathways to funnels</article-title><source>Nat Struct Biol</source><volume>4</volume><fpage>10</fpage><lpage>19</lpage><pub-id pub-id-type="doi">10.1038/nsb0197-10</pub-id></element-citation></ref><ref id="bib13"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fawzi</surname><given-names>NL</given-names></name><name><surname>Doucleff</surname><given-names>M</given-names></name><name><surname>Suh</surname><given-names>JY</given-names></name><name><surname>Clore</surname><given-names>GM</given-names></name></person-group><year>2010</year><article-title>Mechanistic details of a protein-protein association pathway revealed by paramagnetic relaxation enhancement titration measurements</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>107</volume><fpage>1379</fpage><lpage>1384</lpage><pub-id pub-id-type="doi">10.1073/pnas.0909370107</pub-id></element-citation></ref><ref id="bib14"><element-citation publication-type="book"><person-group person-group-type="author"><name><surname>Fletcher</surname><given-names>R</given-names></name></person-group><year>1981</year><article-title>Practical methods of optimization</article-title><publisher-loc>Chichester, England, NY</publisher-loc><publisher-name>J Wiley</publisher-name></element-citation></ref><ref id="bib15"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Garrett</surname><given-names>DS</given-names></name><name><surname>Seok</surname><given-names>YJ</given-names></name><name><surname>Peterkofsky</surname><given-names>A</given-names></name><name><surname>Gronenborn</surname><given-names>AM</given-names></name><name><surname>Clore</surname><given-names>GM</given-names></name></person-group><year>1999</year><article-title>Solution structure of the 40,000 Mr phosphoryl transfer complex between the N-terminal domain of enzyme I and HPr</article-title><source>Nature Structural Biology</source><volume>6</volume><fpage>166</fpage><lpage>173</lpage><pub-id pub-id-type="doi">10.1038/5854</pub-id></element-citation></ref><ref id="bib16"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gorman</surname><given-names>J</given-names></name><name><surname>Greene</surname><given-names>EC</given-names></name></person-group><year>2008</year><article-title>Visualizing one-dimensional diffusion of proteins along DNA</article-title><source>Nature Structural & Molecular Biology</source><volume>15</volume><fpage>768</fpage><lpage>774</lpage><pub-id pub-id-type="doi">10.1038/Nsmb.1441</pub-id></element-citation></ref><ref id="bib17"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Grassia</surname><given-names>SF</given-names></name></person-group><year>1998</year><article-title>Practical parameterization of rotations using the exponential map</article-title><source>Journal of Graphics Tools</source><volume>3</volume><fpage>29</fpage><lpage>48</lpage><pub-id pub-id-type="doi">10.1080/10867651.1998.10487493</pub-id></element-citation></ref><ref id="bib18"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gray</surname><given-names>JJ</given-names></name><name><surname>Moughon</surname><given-names>S</given-names></name><name><surname>Wang</surname><given-names>C</given-names></name><name><surname>Schueler-Furman</surname><given-names>O</given-names></name><name><surname>Kuhlman</surname><given-names>B</given-names></name><name><surname>Rohl</surname><given-names>CA</given-names></name><name><surname>Baker</surname><given-names>D</given-names></name></person-group><year>2003</year><article-title>Protein-protein docking with simultaneous optimization of rigid-body displacement and side-chain conformations</article-title><source>Journal of Molecular Biology</source><volume>331</volume><fpage>281</fpage><lpage>299</lpage><pub-id pub-id-type="doi">10.1016/S0022-2836(03)00670-3</pub-id></element-citation></ref><ref id="bib19"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Iwahara</surname><given-names>J</given-names></name><name><surname>Clore</surname><given-names>GM</given-names></name></person-group><year>2006</year><article-title>Detecting transient intermediates in macromolecular binding by paramagnetic NMR</article-title><source>Nature</source><volume>440</volume><fpage>1227</fpage><lpage>1230</lpage><pub-id pub-id-type="doi">10.1038/nature04673</pub-id></element-citation></ref><ref id="bib20"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Iwahara</surname><given-names>J</given-names></name><name><surname>Schwieters</surname><given-names>CD</given-names></name><name><surname>Clore</surname><given-names>GM</given-names></name></person-group><year>2004</year><article-title>Characterization of nonspecific protein-DNA interactions by H-1 paramagnetic relaxation enhancement</article-title><source>Journal of the American Chemical Society</source><volume>126</volume><fpage>12800</fpage><lpage>12808</lpage><pub-id pub-id-type="doi">10.1021/Ja046246b</pub-id></element-citation></ref><ref id="bib21"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Iwahara</surname><given-names>J</given-names></name><name><surname>Zweckstetter</surname><given-names>M</given-names></name><name><surname>Clore</surname><given-names>GM</given-names></name></person-group><year>2006</year><article-title>NMR structural and kinetic characterization of a homeodomain diffusing and hopping on nonspecific DNA</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>103</volume><fpage>15062</fpage><lpage>15067</lpage><pub-id pub-id-type="doi">10.1073/Pnas.0605868103</pub-id></element-citation></ref><ref id="bib22"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname><given-names>YC</given-names></name><name><surname>Tang</surname><given-names>C</given-names></name><name><surname>Clore</surname><given-names>GM</given-names></name><name><surname>Hummer</surname><given-names>G</given-names></name></person-group><year>2008</year><article-title>Replica exchange simulations of transient encounter complexes in protein-protein association</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>105</volume><fpage>12855</fpage><lpage>12860</lpage><pub-id pub-id-type="doi">10.1073/pnas.0802460105</pub-id></element-citation></ref><ref id="bib23"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kozakov</surname><given-names>D</given-names></name><name><surname>Beglov</surname><given-names>D</given-names></name><name><surname>Bohnuud</surname><given-names>T</given-names></name><name><surname>Mottarella</surname><given-names>SE</given-names></name><name><surname>Xia</surname><given-names>B</given-names></name><name><surname>Hall</surname><given-names>DR</given-names></name><name><surname>Vajda</surname><given-names>S</given-names></name></person-group><year>2013</year><article-title>How good is automated protein docking?</article-title><source>Proteins</source><volume>81</volume><fpage>2159</fpage><lpage>2166</lpage><pub-id pub-id-type="doi">10.1002/Prot.24403</pub-id></element-citation></ref><ref id="bib24"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kozakov</surname><given-names>D</given-names></name><name><surname>Brenke</surname><given-names>R</given-names></name><name><surname>Comeau</surname><given-names>SR</given-names></name><name><surname>Vajda</surname><given-names>S</given-names></name></person-group><year>2006</year><article-title>PIPER: an FFT-based protein docking program with pairwise potentials</article-title><source>Proteins</source><volume>65</volume><fpage>392</fpage><lpage>406</lpage><pub-id pub-id-type="doi">10.1002/prot.21117</pub-id></element-citation></ref><ref id="bib25"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kozakov</surname><given-names>D</given-names></name><name><surname>Hall</surname><given-names>DR</given-names></name><name><surname>Beglov</surname><given-names>D</given-names></name><name><surname>Brenke</surname><given-names>R</given-names></name><name><surname>Comeau</surname><given-names>SR</given-names></name><name><surname>Shen</surname><given-names>Y</given-names></name><name><surname>Li</surname><given-names>K</given-names></name><name><surname>Zheng</surname><given-names>J</given-names></name><name><surname>Vakili</surname><given-names>P</given-names></name><name><surname>Paschalidis</surname><given-names>ICH</given-names></name><name><surname>Vajda</surname><given-names>S</given-names></name></person-group><year>2010</year><article-title>Achieving reliability and high accuracy in automated protein docking: clusPro, PIPER, SDU, and stability analysis in CAPRI rounds 13-19</article-title><source>Proteins</source><volume>78</volume><fpage>3124</fpage><lpage>3130</lpage><pub-id pub-id-type="doi">10.1002/prot.22835</pub-id></element-citation></ref><ref id="bib26"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kozakov</surname><given-names>D</given-names></name><name><surname>Li</surname><given-names>K</given-names></name><name><surname>Hall</surname><given-names>D</given-names></name><name><surname>Beglov</surname><given-names>D</given-names></name><name><surname>Zheng</surname><given-names>J</given-names></name><name><surname>Vakili</surname><given-names>P</given-names></name><name><surname>Schueler-Furman</surname><given-names>O</given-names></name><name><surname>Paschalidis</surname><given-names>I</given-names></name><name><surname>Clore</surname><given-names>G</given-names></name><name><surname>Vajda</surname><given-names>S</given-names></name></person-group><year>2014</year><article-title>Data from: Encounter complexes and dimensionality reduction in protein-protein association</article-title><source>Dryad</source><pub-id pub-id-type="doi">10.5061/dryad.98n8c</pub-id></element-citation></ref><ref id="bib27"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname><given-names>B</given-names></name><name><surname>Kurochkina</surname><given-names>N</given-names></name><name><surname>Kang</surname><given-names>HS</given-names></name></person-group><year>1996</year><article-title>Protein folding by a biased Monte Carlo procedure in the dihedral angle space</article-title><source>FASEB Journal: Official Publication of the Federation of American Societies for Experimental Biology</source><volume>10</volume><fpage>119</fpage><lpage>125</lpage></element-citation></ref><ref id="bib28"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lensink</surname><given-names>MF</given-names></name><name><surname>Wodak</surname><given-names>SJ</given-names></name></person-group><year>2013</year><article-title>Docking, scoring, and affinity prediction in CAPRI</article-title><source>Proteins</source><volume>81</volume><fpage>2082</fpage><lpage>2095</lpage><pub-id pub-id-type="doi">10.1002/prot.24428</pub-id></element-citation></ref><ref id="bib29"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>McCammon</surname><given-names>JA</given-names></name></person-group><year>1998</year><article-title>Theory of biomolecular recognition</article-title><source>Current Opinion In Structural Biology</source><volume>8</volume><fpage>245</fpage><lpage>249</lpage><pub-id pub-id-type="doi">10.1016/S0959-440X(98)80046-8</pub-id></element-citation></ref><ref id="bib30"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mirzaei</surname><given-names>H</given-names></name><name><surname>Beglov</surname><given-names>D</given-names></name><name><surname>Paschalidis</surname><given-names>IC</given-names></name><name><surname>Vajda</surname><given-names>S</given-names></name><name><surname>Vakili</surname><given-names>P</given-names></name><name><surname>Kozakov</surname><given-names>D</given-names></name></person-group><year>2012</year><article-title>Rigid body energy minimization on manifolds for molecular docking</article-title><source>Journal of Chemical Theory and Computation</source><volume>8</volume><fpage>4374</fpage><lpage>4380</lpage><pub-id pub-id-type="doi">10.1021/ct300272j</pub-id></element-citation></ref><ref id="bib31"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Miyashita</surname><given-names>O</given-names></name><name><surname>Onuchic</surname><given-names>JN</given-names></name><name><surname>Okamura</surname><given-names>MY</given-names></name></person-group><year>2004</year><article-title>Transition state and encounter complex for fast association of cytochrome c2 with bacterial reaction center</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>101</volume><fpage>16174</fpage><lpage>16179</lpage><pub-id pub-id-type="doi">10.1073/pnas.0405745101</pub-id></element-citation></ref><ref id="bib32"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Park</surname><given-names>FC</given-names></name></person-group><year>1995</year><article-title>Distance metrics on the rigid-body motions with applications to mechanism design</article-title><source>Journal of Mechanical Design</source><volume>117</volume><fpage>48</fpage><lpage>54</lpage><pub-id pub-id-type="doi">10.1115/1.2826116</pub-id></element-citation></ref><ref id="bib33"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Park</surname><given-names>FC</given-names></name><name><surname>Ravani</surname><given-names>B</given-names></name></person-group><year>1997</year><article-title>Smooth invariant interpolation of rotations</article-title><source>ACM Transactions on Graphic</source><volume>16</volume><fpage>277</fpage><lpage>295</lpage><pub-id pub-id-type="doi">10.1145/256157.256160</pub-id></element-citation></ref><ref id="bib34"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Riggs</surname><given-names>AD</given-names></name><name><surname>Bourgeoi</surname><given-names>S</given-names></name><name><surname>Cohn</surname><given-names>M</given-names></name></person-group><year>1970</year><article-title>Lac repressor-operator interaction. 3. Kinetic studies</article-title><source>Journal of Molecular Biology</source><volume>53</volume><fpage>401</fpage><lpage>417</lpage><pub-id pub-id-type="doi">10.1016/0022-2836(70)90074-4</pub-id></element-citation></ref><ref id="bib35"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schreiber</surname><given-names>G</given-names></name><name><surname>Haran</surname><given-names>G</given-names></name><name><surname>Zhou</surname><given-names>HX</given-names></name></person-group><year>2009</year><article-title>Fundamental aspects of protein-protein association kinetics</article-title><source>Chemical Reviews</source><volume>109</volume><fpage>839</fpage><lpage>860</lpage><pub-id pub-id-type="doi">10.1021/Cr800373w</pub-id></element-citation></ref><ref id="bib36"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Selzer</surname><given-names>T</given-names></name><name><surname>Schreiber</surname><given-names>G</given-names></name></person-group><year>2001</year><article-title>New insights into the mechanism of protein-protein association</article-title><source>Proteins Structure Function and Genetics</source><volume>45</volume><fpage>190</fpage><lpage>198</lpage><pub-id pub-id-type="doi">10.1002/Prot.1139</pub-id></element-citation></ref><ref id="bib37"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shen</surname><given-names>Y</given-names></name><name><surname>Paschalidis</surname><given-names>I</given-names></name><name><surname>Vakili</surname><given-names>P</given-names></name><name><surname>Vajda</surname><given-names>S</given-names></name></person-group><year>2008</year><article-title>Protein docking by the underestimation of free energy funnels in the space of encounter complexes</article-title><source>PLOS Computational Biology</source><volume>4</volume><fpage>e1000191</fpage><pub-id pub-id-type="doi">10.1371/journal.pcbi.1000191</pub-id></element-citation></ref><ref id="bib38"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shoemaker</surname><given-names>BA</given-names></name><name><surname>Portman</surname><given-names>JJ</given-names></name><name><surname>Wolynes</surname><given-names>PG</given-names></name></person-group><year>2000</year><article-title>Speeding molecular recognition by using the folding funnel: the fly-casting mechanism</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>97</volume><fpage>8868</fpage><lpage>8874</lpage><pub-id pub-id-type="doi">10.1073/Pnas.160259697</pub-id></element-citation></ref><ref id="bib39"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Smith</surname><given-names>GR</given-names></name><name><surname>Sternberg</surname><given-names>MJ</given-names></name></person-group><year>2002</year><article-title>Prediction of protein-protein interactions by docking methods</article-title><source>Current Opinion In Structural Biology</source><volume>12</volume><fpage>28</fpage><lpage>35</lpage><pub-id pub-id-type="doi">10.1016/S0959-440X(02)00285-3</pub-id></element-citation></ref><ref id="bib40"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Spaar</surname><given-names>A</given-names></name><name><surname>Helms</surname><given-names>V</given-names></name></person-group><year>2005</year><article-title>Free energy landscape of protein-protein encounter resulting from Brownian dynamics simulations of Barnase: Barstar</article-title><source>Journal of Chemical Theory and Computation</source><volume>1</volume><fpage>723</fpage><lpage>736</lpage><pub-id pub-id-type="doi">10.1021/Ct050036n</pub-id></element-citation></ref><ref id="bib41"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Suh</surname><given-names>JY</given-names></name><name><surname>Cai</surname><given-names>ML</given-names></name><name><surname>Clore</surname><given-names>GM</given-names></name></person-group><year>2008</year><article-title>Impact of phosphorylation on structure and thermodynamics of the interaction between the N-terminal domain of enzyme I and the histidine phosphocarrier protein of the bacterial phosphotransferase system</article-title><source>The Journal of Biological Chemistry</source><volume>283</volume><fpage>18980</fpage><lpage>18989</lpage><pub-id pub-id-type="doi">10.1074/Jbc.M802211200</pub-id></element-citation></ref><ref id="bib42"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Suh</surname><given-names>JY</given-names></name><name><surname>Tang</surname><given-names>C</given-names></name><name><surname>Clore</surname><given-names>GM</given-names></name></person-group><year>2007</year><article-title>Role of electrostatic interactions in transient encounter complexes in protein-protein association investigated by paramagnetic relaxation enhancement</article-title><source>Journal of the American Chemical Society</source><volume>129</volume><fpage>12954</fpage><lpage>12960</lpage><pub-id pub-id-type="doi">10.1021/Ja0760978</pub-id></element-citation></ref><ref id="bib43"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname><given-names>C</given-names></name><name><surname>Ghirlando</surname><given-names>R</given-names></name><name><surname>Clore</surname><given-names>GM</given-names></name></person-group><year>2008</year><article-title>Visualization of transient ultra-weak protein self-association in solution using paramagnetic relaxation enhancement</article-title><source>Journal of the American Chemical Society</source><volume>130</volume><fpage>4048</fpage><lpage>4056</lpage><pub-id pub-id-type="doi">10.1021/Ja710493m</pub-id></element-citation></ref><ref id="bib44"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname><given-names>C</given-names></name><name><surname>Iwahara</surname><given-names>J</given-names></name><name><surname>Clore</surname><given-names>GM</given-names></name></person-group><year>2006</year><article-title>Visualization of transient encounter complexes in protein-protein association</article-title><source>Nature</source><volume>444</volume><fpage>383</fpage><lpage>386</lpage><pub-id pub-id-type="doi">10.1038/Nature05201</pub-id></element-citation></ref><ref id="bib45"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tovchigrechko</surname><given-names>A</given-names></name><name><surname>Vakser</surname><given-names>IA</given-names></name></person-group><year>2001</year><article-title>How common is the funnel-like energy landscape in protein-protein interactions?</article-title><source>Protein Science</source><volume>10</volume><fpage>1572</fpage><lpage>1583</lpage><pub-id pub-id-type="doi">10.1110/Ps.8701</pub-id></element-citation></ref><ref id="bib46"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ubbink</surname><given-names>M</given-names></name></person-group><year>2009</year><article-title>The courtship of proteins: understanding the encounter complex</article-title><source>FEBS Letters</source><volume>583</volume><fpage>1060</fpage><lpage>1066</lpage><pub-id pub-id-type="doi">10.1016/j.febslet.2009.02.046</pub-id></element-citation></ref><ref id="bib47"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vajda</surname><given-names>S</given-names></name><name><surname>Kozakov</surname><given-names>D</given-names></name></person-group><year>2009</year><article-title>Convergence and combination of methods in protein-protein docking</article-title><source>Current Opinion In Structural Biology</source><volume>19</volume><fpage>164</fpage><lpage>170</lpage><pub-id pub-id-type="doi">10.1016/j.sbi.2009.02.008</pub-id></element-citation></ref><ref id="bib48"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>von Hippel</surname><given-names>PH</given-names></name><name><surname>Berg</surname><given-names>OG</given-names></name></person-group><year>1989</year><article-title>Facilitated target location in biological systems</article-title><source>The Journal of Biological Chemistry</source><volume>264</volume><fpage>675</fpage><lpage>678</lpage></element-citation></ref><ref id="bib49"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>T</given-names></name><name><surname>Wade</surname><given-names>RC</given-names></name></person-group><year>2003</year><article-title>Implicit solvent models for flexible protein-protein docking by molecular dynamics simulation</article-title><source>Proteins</source><volume>50</volume><fpage>158</fpage><lpage>169</lpage><pub-id pub-id-type="doi">10.1002/prot.10248</pub-id></element-citation></ref><ref id="bib50"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>C</given-names></name><name><surname>Chen</surname><given-names>J</given-names></name><name><surname>DeLisi</surname><given-names>C</given-names></name></person-group><year>1999</year><article-title>Protein-protein recognition: exploring the energy funnels near the binding sites</article-title><source>Proteins</source><volume>34</volume><fpage>255</fpage><lpage>267</lpage><pub-id pub-id-type="doi">10.1002/(SICI)1097-0134(19990201)34:2<255::AID-PROT10>3.0.CO;2-O</pub-id></element-citation></ref><ref id="bib51"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zheng</surname><given-names>WH</given-names></name><name><surname>Schafer</surname><given-names>NP</given-names></name><name><surname>Davtyan</surname><given-names>A</given-names></name><name><surname>Papoian</surname><given-names>GA</given-names></name><name><surname>Wolynes</surname><given-names>PG</given-names></name></person-group><year>2012</year><article-title>Predictive energy landscapes for protein-protein association</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>109</volume><fpage>19244</fpage><lpage>19249</lpage><pub-id pub-id-type="doi">10.1073/Pnas.1216215109</pub-id></element-citation></ref></ref-list></back><sub-article article-type="article-commentary" id="SA1"><front-stub><article-id pub-id-type="doi">10.7554/eLife.01370.020</article-id><title-group><article-title>Decision letter</article-title></title-group><contrib-group content-type="section"><contrib contrib-type="editor"><name><surname>Roux</surname><given-names>Benoit</given-names></name><role>Reviewing editor</role><aff><institution>University of Chicago</institution>, <country>United States</country></aff></contrib></contrib-group></front-stub><body><boxed-text><p>eLife posts the editorial decision letter and author response on a selection of the published articles (subject to the approval of the authors). An edited version of the letter sent to the authors after peer review is shown, indicating the substantive concerns or comments; minor concerns are not usually shown. Reviewers have the opportunity to discuss the decision before the letter is sent (see <ext-link ext-link-type="uri" xlink:href="http://elifesciences.org/review-process">review process</ext-link>). Similarly, the author response typically shows only responses to the major concerns raised by the reviewers.</p></boxed-text><p>Thank you for sending your work entitled “Encounter Complexes and Dimensionality Reduction in Protein-Protein Association” for consideration at <italic>eLife</italic>. Your article has been evaluated by a Senior editor (John Kuriyan), a member of our Board of Reviewing Editors, and 2 reviewers. The comments were then further discussed and a consensus was determined. Prior reaching a final decision about the manuscript, we need to consider your response to address the following substantial issue that emerged from those discussions:</p><p>Docking calculations were used to thoroughly sample association modes between two proteins and identify ensembles of low energy poses. These ensembles were then used to back calculate paramagnetic relaxation enhancement (PRE) profiles, which were then compared to those derived from experimental PRE measures by NMR. The results presented show that sampling by docking is consistent with the encounters measured experimentally by PRE. The novelty of this study lies with comparing the docking ensembles with ensembles derived from PRE experiments, and using the agreement with experimentally measured PRE as a means to establish the legitimacy of the docking ensembles as representing encounter complexes. Yet little attention is devoted to the PRE data themselves and how they can be related to docking poses and their energetics. How noisy are these data? How much slack is there in associating a given binding mode with a PRE signal. While this study may be the first time the funnel-like shape for the docking reaction coordinate has (some) experimental support, one should be cautious as the funnel shape is deduced from the docking calculations only. Until we understand the limitations of the PRE data it is hard to tell if they support the funnel shape. If indeed the main conclusion of the paper is that the funnel shape is supported by PRE experiments, then more must be provided about the experimental method, the uncertainty in the experimental data, and the sensitivity of the comparison between the docking results and the experiments.</p><p>Specific points to be addressed are:</p><p>1) A serious omission is the failure to include an important control where PRE back calculations are performed from docking poses with randomized energies. Would computed PRE profiles from these randomized ensembles look very different from those derived from the docking ensembles and/or experiment?</p><p>2) The Mn<sup>2+</sup> probe appears to be located in only a few sites on each protein. It would be useful to show schematically where these sites actually are in <xref ref-type="fig" rid="fig2 fig3 fig4">Figures 2, 3, and 4</xref>. The authors should confirm that the Mn<sup>2+</sup> probes really were located at E5 and E32 (it is implied but not stated), and exactly which nitrogens were labelled with <sup>15</sup>N (was it all amide nitrogens)?] In this regard it would have been extremely informative to provide a more detailed description of how PRE profiles are back calculated from association modes and their energy levels, and to discuss the inherent error rate in the experimental PRE signal itself: How does the fact that PRE is 'a technique extremely sensitive to the presence of lowly populated states...' translate in practical terms? Some of these issues are succinctly mentioned in the Introduction but not fully addressed.</p></body></sub-article><sub-article article-type="reply" id="SA2"><front-stub><article-id pub-id-type="doi">10.7554/eLife.01370.021</article-id><title-group><article-title>Author response</article-title></title-group></front-stub><body><p><italic>The novelty of this study lies with comparing the docking ensembles with ensembles derived from PRE experiments, and using the agreement with experimentally measured PRE as a means to establish the legitimacy of the docking ensembles as representing encounter complexes. Yet little attention is devoted to the PRE data themselves and how they can be related to docking poses and their energetics. How noisy are these data? How much slack is there in associating a given binding mode with a PRE signal. While this study may be the first time the funnel-like shape for the docking reaction coordinate has (some) experimental support, one should be cautious as the funnel shape is deduced from the docking calculations only. Until we understand the limitations of the PRE data it is hard to tell if they support the funnel shape. If indeed the main conclusion of the paper is that the funnel shape is supported by PRE experiments, then more must be provided about the experimental method, the uncertainty in the experimental data, and the sensitivity of the comparison between the docking results and the experiments</italic>.</p><p>We have made three main changes to address the above general criticism as follows: 1) In the Results section we added a new subsection entitled “PRE experiments and theoretical PRE profiles based on structure”. In this subsection we provide more information on the paramagnetic relaxation enhancement (PRE) experiment and its implications (see our response to the specific comments below).</p><p>2) <xref ref-type="fig" rid="fig2">Figure 2</xref> now includes the error bars of the experimental PRE data points.</p><p>3) We added a new section to the Discussion, “Identification of encounter complexes using PRE”. In this section we first provide an example explaining why PRE data are capable of indicating the presence of transition states, in spite of their low population. Second, we show that although the PRE data are inherently noisy due to the strong distance dependence, they still can unambiguously reveal if minor species are present.</p><p><italic>Specific points to be addressed</italic> <italic>are</italic>:</p><p><italic>1) A serious omission is the failure to include an important control where PRE back calculations are performed from docking poses with randomized energies. Would computed PRE profiles from these randomized ensembles look very different from those derived from the</italic> <italic>docking ensembles and/or experiment</italic>?</p><p>We thank the reviewers for suggesting this control experiment. We have followed the advice, and to demonstrate the importance of the energy function when generating the encounter complexes performed docking calculations using a scoring function without long-range energy terms, i.e., considering only the attractive and repulsive components of the van der Waals energy. This simplified energy function yields docked structures that have good shape complementarity, but have no favorable electrostatic or chemical interactions (fourth paragraph of the Results section entitled “PRE experiments and theoretical PRE profiles based on structure”). The 30,000 structures with the lowest van der Waals energy from this “shape-complementarity only” docking were then used for back-calculating theoretical PRE profiles. The results of these calculations, shown in the new <xref ref-type="fig" rid="fig2s1">Figure 2–figure supplement 1</xref>, make absolutely clear the PRE rates based on the ensemble of structures generated without a proper energy function do not show any resemblance to the observed PRE data. We also show that the correlation coefficients between the experimental PRE rates and the theoretical PRE profiles based on these docked structures are negative. We think that these control calculations convincingly show the need for using a meaningful physics based energy function in order to predict the observed PRE data.</p><p><italic>2) The Mn</italic><sup><italic>2+</italic></sup> <italic>probe appears to be located in only a few sites on each protein. It would be useful to show schematically where these sites actually are in</italic> <xref ref-type="fig" rid="fig2 fig3 fig4">Figures 2, 3, and 4</xref><italic>. The authors should confirm that the Mn</italic><sup><italic>2+</italic></sup> <italic>probes really were located at E5 and E32 (it is implied but not stated), and exactly which nitrogens were labelled with</italic> <sup>15</sup><italic>N (was it all amide nitrogens)?] In this regard it would have been extremely informative to provide a more detailed description of how PRE profiles are back calculated from association modes and their energy levels, and to discuss the inherent error rate in the experimental PRE signal itself: How does the fact that PRE is 'a technique extremely sensitive to the presence of lowly populated states...' translate in practical terms? Some of these issues are succinctly mentioned in the Introduction but not fully addressed</italic>.</p><p>In two new subsections added to the revised manuscript we address the above points as follows:</p><p>A) The subsection “PRE experiments and theoretical PRE profiles based on structure” in the Results provides a more detailed description of the PRE titration experiment than in the original submission, and hopefully clarifies the issues raised by the reviewers.</p><p>B) In the subsection “Identification of encounter complexes using PRE” (Discussion) we (1) discuss the sources of errors in the PRE data; (2) show that due to its strong distance dependence, PRE is extremely sensitive to the presence of lowly populated states; and (3) explain that although the method is inherently noisy due to the strong distance dependence, it unambiguously reveals if minor species are present.</p></body></sub-article></article> |