<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article
  PUBLIC "-//NLM//DTD Journal Publishing DTD v3.0 20080202//EN" "http://dtd.nlm.nih.gov/publishing/3.0/journalpublishing3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="3.0" xml:lang="en">
  <front>
    <journal-meta>
      <journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id>
      <journal-id journal-id-type="publisher-id">plos</journal-id>
      <journal-id journal-id-type="pmc">plosone</journal-id>
      <journal-title-group>
        <journal-title>PLoS ONE</journal-title>
      </journal-title-group>
      <issn pub-type="epub">1932-6203</issn>
      <publisher>
        <publisher-name>Public Library of Science</publisher-name>
        <publisher-loc>San Francisco, USA</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">PONE-D-12-22198</article-id>
      <article-id pub-id-type="doi">10.1371/journal.pone.0052505</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Research Article</subject>
        </subj-group>
        <subj-group subj-group-type="Discipline-v2">
          <subject>Biology</subject>
          <subj-group>
            <subject>Biochemistry</subject>
            <subj-group>
              <subject>Biomacromolecule-ligand interactions</subject>
              <subject>Enzymes</subject>
              <subject>Proteins</subject>
            </subj-group>
          </subj-group>
          <subj-group>
            <subject>Biophysics</subject>
            <subj-group>
              <subject>Biomacromolecule-ligand interactions</subject>
              <subject>Biophysics simulations</subject>
            </subj-group>
          </subj-group>
          <subj-group>
            <subject>Computational biology</subject>
            <subj-group>
              <subject>Macromolecular structure analysis</subject>
              <subj-group>
                <subject>Protein structure</subject>
              </subj-group>
            </subj-group>
          </subj-group>
        </subj-group>
        <subj-group subj-group-type="Discipline-v2">
          <subject>Chemistry</subject>
          <subj-group>
            <subject>Computational chemistry</subject>
            <subj-group>
              <subject>Molecular mechanics</subject>
            </subj-group>
          </subj-group>
        </subj-group>
        <subj-group subj-group-type="Discipline">
          <subject>Chemistry</subject>
          <subject>Computational Biology</subject>
          <subject>Biophysics</subject>
          <subject>Biochemistry</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Binding Pocket Optimization by Computational Protein Design</article-title>
        <alt-title alt-title-type="running-head">Computational Design of Binding Pockets</alt-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>Malisi</surname>
            <given-names>Christoph</given-names>
          </name>
          <xref ref-type="aff" rid="aff1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>Schumann</surname>
            <given-names>Marcel</given-names>
          </name>
          <xref ref-type="aff" rid="aff2">
            <sup>2</sup>
          </xref>
          <xref ref-type="fn" rid="fn2">
            <sup>¤b</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>Toussaint</surname>
            <given-names>Nora C.</given-names>
          </name>
          <xref ref-type="aff" rid="aff2">
            <sup>2</sup>
          </xref>
          <xref ref-type="fn" rid="fn1">
            <sup>¤a</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>Kageyama</surname>
            <given-names>Jorge</given-names>
          </name>
          <xref ref-type="aff" rid="aff1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>Kohlbacher</surname>
            <given-names>Oliver</given-names>
          </name>
          <xref ref-type="aff" rid="aff2">
            <sup>2</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>Höcker</surname>
            <given-names>Birte</given-names>
          </name>
          <xref ref-type="aff" rid="aff1">
            <sup>1</sup>
          </xref>
          <xref ref-type="corresp" rid="cor1">
            <sup>*</sup>
          </xref>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <addr-line>Max Planck Institute for Developmental Biology, Tübingen, Germany</addr-line>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <addr-line>Center for Bioinformatics, Quantitative Biology Center, and Department of Computer Science, University of Tübingen, Tübingen, Germany</addr-line>
      </aff>
      <contrib-group>
        <contrib contrib-type="editor" xlink:type="simple">
          <name name-style="western">
            <surname>Levy</surname>
            <given-names>Yaakov Koby</given-names>
          </name>
          <role>Editor</role>
          <xref ref-type="aff" rid="edit1"/>
        </contrib>
      </contrib-group>
      <aff id="edit1">
        <addr-line>Weizmann Institute of Science, Israel</addr-line>
      </aff>
      <author-notes>
        <corresp id="cor1">* E-mail: <email xlink:type="simple">birte.hoecker@tuebingen.mpg.de</email></corresp>
        <fn fn-type="conflict">
          <p>The authors have declared that no competing interests exist.</p>
        </fn>
        <fn fn-type="con">
          <p>Conceived and designed the experiments: CM OK BH. Performed the experiments: CM JK. Analyzed the data: CM OK BH. Contributed reagents/materials/analysis tools: MS NT. Wrote the paper: CM BH.</p>
        </fn>
        <fn id="fn1" fn-type="current-aff">
          <label>¤a</label>
          <p>Current address: Department of Pharmaceutical Sciences, School of Pharmacy, Thomas Jefferson University, Philadelphia, Pennsylvania, United States of America</p>
        </fn>
        <fn id="fn2" fn-type="current-aff">
          <label>¤b</label>
          <p>Current address: Immunology Program &amp; Computational Biology Program, Lucille Castori Center for Microbes, Inflammation &amp; Cancer, Memorial Sloan-Kettering Cancer Center, New York, New York, United States of America</p>
        </fn>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2012</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>27</day>
        <month>12</month>
        <year>2012</year>
      </pub-date>
      <volume>7</volume>
      <issue>12</issue>
      <elocation-id>e52505</elocation-id>
      <history>
        <date date-type="received">
          <day>25</day>
          <month>7</month>
          <year>2012</year>
        </date>
        <date date-type="accepted">
          <day>14</day>
          <month>11</month>
          <year>2012</year>
        </date>
      </history>
      <permissions>
        <copyright-year>2012</copyright-year>
        <copyright-holder>Malisi et al</copyright-holder>
        <license xlink:type="simple">
          <license-p>This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
        </license>
      </permissions>
      <abstract>
        <p>Engineering specific interactions between proteins and small molecules is extremely useful for biological studies, as these interactions are essential for molecular recognition. Furthermore, many biotechnological applications are made possible by such an engineering approach, ranging from biosensors to the design of custom enzyme catalysts. Here, we present a novel method for the computational design of protein-small ligand binding named P<sc>ocket</sc>O<sc>ptimizer</sc>. The program can be used to modify protein binding pocket residues to improve or establish binding of a small molecule. It is a modular pipeline based on a number of customizable molecular modeling tools to predict mutations that alter the affinity of a target protein to its ligand. At its heart it uses a receptor-ligand scoring function to estimate the binding free energy between protein and ligand. We compiled a benchmark set that we used to systematically assess the performance of our method. It consists of proteins for which mutational variants with different binding affinities for their ligands and experimentally determined structures exist. Within this test set P<sc>ocket</sc>O<sc>ptimizer</sc> correctly predicts the mutant with the higher affinity in about 69% of the cases. A detailed analysis of the results reveals that the strengths of P<sc>ocket</sc>O<sc>ptimizer</sc> lie in the correct introduction of stabilizing hydrogen bonds to the ligand, as well as in the improved geometric complementarity between ligand and binding pocket. Apart from the novel method for binding pocket design we also introduce a much needed benchmark data set for the comparison of affinities of mutant binding pockets, which we use to assess programs for <italic>in silico</italic> design of ligand binding.</p>
      </abstract>
      <funding-group>
        <funding-statement>This work was supported by Deutsche Forschungsgemeinschaft Grant HO 4022/2-1. The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement>
      </funding-group>
      <counts>
        <page-count count="9"/>
      </counts>
    </article-meta>
  </front>
  <body>
    <sec id="s1">
      <title>Introduction</title>
      <p>Computational protein design has advanced rapidly in recent years. A particularly exciting and dynamic area is the design of interactions between proteins and small molecule ligands. This includes the design of receptors that bind ligands of choice, which for example can be used as biosensors <xref ref-type="bibr" rid="pone.0052505-ValleBlisle1">[1]</xref>, as well as the design of enzymes that do not only bind a substrate, but also contain the catalytic machinery to process it <xref ref-type="bibr" rid="pone.0052505-Benson1">[2]</xref>–<xref ref-type="bibr" rid="pone.0052505-Bolon1">[3]</xref>. In all these designs, an existing protein is used as a scaffold, and its binding pocket is altered or a new one is introduced that should interact with the target ligand.</p>
      <p>With this approach, enzymes have been designed that catalyze chemical reactions for which no natural catalysts exist, such as a kemp eliminase <xref ref-type="bibr" rid="pone.0052505-Rthlisberger1">[4]</xref>–<xref ref-type="bibr" rid="pone.0052505-Korendovych1">[5]</xref>, a diels-alderase <xref ref-type="bibr" rid="pone.0052505-Siegel1">[6]</xref>, and a retro-aldolase <xref ref-type="bibr" rid="pone.0052505-Jiang1">[7]</xref>. It has also been used to design a metalloenzyme by repurposing parts of the already existing catalytic machinery in the scaffold protein, namely the reactivity of a zinc metal center to hydrolyze organophosphates <xref ref-type="bibr" rid="pone.0052505-Khare1">[8]</xref>. Furthermore, similar methods have been applied to change substrate specificities as well as affinities. For example human guanine deaminase was changed to bind ammelide through the remodeling of a loop that now provides a key interaction to the new target substrate <xref ref-type="bibr" rid="pone.0052505-Murphy1">[9]</xref>, the substrate specificity of gramicidin S synthetase was changed from phenylalanine to leucine <xref ref-type="bibr" rid="pone.0052505-Chen1">[10]</xref>, and mutations in dihydrofolate reductase from <italic>Staphylococcus aureus</italic> were predicted that decrease binding to an inhibitor molecule while stabilizing native protein function <xref ref-type="bibr" rid="pone.0052505-Frey1">[11]</xref>.</p>
      <p>While these are impressive results, there is still much room for improvement in the computational methods. Specifically, it seems to be difficult to accurately design a protein for high affinity binding to a ligand or transition state <xref ref-type="bibr" rid="pone.0052505-Schreier1">[12]</xref>. The majority of the enzyme designs mentioned have low affinities for their substrates when compared to naturally occurring enzymes <xref ref-type="bibr" rid="pone.0052505-Baker1">[13]</xref>–<xref ref-type="bibr" rid="pone.0052505-Wang1">[14]</xref>. In a rare report of a failed attempt, the unsuccessful design of a high-affinity ligand binding site for a D-Ala-D-Ala dipeptide into an endo-1,4-xylanase scaffold was discussed. Designs by the employed design software R<sc>osetta</sc> did not show the predicted high affinity in the experimental tests, underscoring the challenge of protein-ligand interface design <xref ref-type="bibr" rid="pone.0052505-Morin1">[15]</xref>. In this respect long-range electrostatics and dynamics, accurate modeling of solvation and electrostatics at the interface, as well as the inclusion of explicit water molecules have been named as most problematic areas <xref ref-type="bibr" rid="pone.0052505-Baker1">[13]</xref>–<xref ref-type="bibr" rid="pone.0052505-Morin2">[16]</xref>. In order to improve protein-ligand interface design and to overcome current limitations it will be necessary to test design protocols more systematically.</p>
      <p>In this respect, we noticed that in computational design studies there is a lack of more general benchmark sets. Related molecular modeling techniques are regularly assessed using test sets. For example protein-ligand docking algorithms have been compared in detail <xref ref-type="bibr" rid="pone.0052505-Plewczynski1">[17]</xref>–<xref ref-type="bibr" rid="pone.0052505-Cole1">[18]</xref> <xref ref-type="bibr" rid="pone.0052505-Zavodszky1">[19]</xref>–<xref ref-type="bibr" rid="pone.0052505-Perola1">[20]</xref>. Also the CASP and CAPRI experiments allow unbiased testing of protein structure prediction and protein-protein docking methods <xref ref-type="bibr" rid="pone.0052505-Moult1">[21]</xref>. In contrast only a few computational design studies tested their employed methodology. One example is the redesign of the binding pocket of ribose binding protein for its native ligand using molecular mechanics methods. Among the resulting binding pocket sequences, the wild type sequence was ranked second best, while the first and third ranks had only a single mutation and bound ribose with tenfold decreased affinity <xref ref-type="bibr" rid="pone.0052505-Boas1">[22]</xref>. Also the aforementioned algorithm to introduce one key interaction to a ligand using loop modeling techniques was tested on eight proteins. For six of them the method produced a loop of the same length and similar configuration as in the crystal structures <xref ref-type="bibr" rid="pone.0052505-Murphy1">[9]</xref>. Both benchmark tests are very specific; they cannot be used to generally and systematically assess a method’s proficiency in designing binding to a small molecule. 
Also the broader benchmark set that was used to assess the ability of the enzyme design methods R<sc>osetta</sc>M<sc>atch</sc> and S<sc>caffold</sc>S<sc>election</sc> to identify suitable scaffold proteins that can host a desired catalytic machinery <xref ref-type="bibr" rid="pone.0052505-Zanghellini1">[23]</xref>–<xref ref-type="bibr" rid="pone.0052505-Malisi1">[24]</xref> is not suited for this purpose. Such a test set, however, would be very helpful for assessing the potential and the shortcomings of available methods.</p>
      <p>In this study, we present P<sc>ocket</sc>O<sc>ptimizer</sc>, a computational pipeline that can be used to predict mutations in the binding pocket of proteins, which increase the affinity of the protein to a given small molecule ligand. It can be used for the analysis of few mutations as well as for the design of an entire binding pocket. It uses several molecular modeling modules. Side chain flexibility is sampled by a conformer library, which we compiled following Boas and Harbury <xref ref-type="bibr" rid="pone.0052505-Boas1">[22]</xref>. The use of conformer libraries has been reported to be advantageous, especially in the context of binding-site geometries <xref ref-type="bibr" rid="pone.0052505-Shetty1">[25]</xref> <xref ref-type="bibr" rid="pone.0052505-Lassila1">[26]</xref>–<xref ref-type="bibr" rid="pone.0052505-Xiang1">[27]</xref>. A receptor-ligand scoring function is used to calculate protein ligand binding strength. The modular architecture of P<sc>ocket</sc>O<sc>ptimizer</sc> allows easy and systematic comparison of methods that perform the same task. As the first test we utilize this to examine two scoring functions in this study, the scoring function provided by CADDSuite <xref ref-type="bibr" rid="pone.0052505-Schumann1">[28]</xref> and Autodock Vina <xref ref-type="bibr" rid="pone.0052505-Trott1">[29]</xref>. In order to assess the performance of P<sc>ocket</sc>O<sc>ptimizer</sc> and other methods that address the same task, we compiled a benchmark set. It consists of mutational variants of proteins and their small ligands with available experimental structural and binding affinity data. We also used this benchmark to test the enzyme design application included in the R<sc>osetta</sc> molecular modeling software. R<sc>osetta</sc> was used for the majority of the design studies mentioned earlier, and it is the most successful freely available protein design software to date <xref ref-type="bibr" rid="pone.0052505-Richter1">[30]</xref>. 
We find that both methods perform similarly. In our benchmark P<sc>ocket</sc>O<sc>ptimizer</sc> succeeds slightly better in predicting the correct affinity-enhancing mutations. We discuss the strengths and weaknesses of our method and describe to which protein design problems it can be applied with good chances of success. The findings emphasize the merit of a systematic approach to evaluate computational protein design methodologies, to identify their strengths, and to pinpoint possibilities for improvement. And our modular program P<sc>ocket</sc>O<sc>ptimizer</sc> provides a suitable framework to test and implement these approaches.</p>
    </sec>
    <sec id="s2">
      <title>Results and Discussion</title>
      <sec id="s2a">
        <title>Computational Receptor Design Pipeline PocketOptimizer</title>
        <p>We developed P<sc>ocket</sc>O<sc>ptimizer</sc> for the design of protein-ligand interactions. In combination with a program such as S<sc>caffold</sc>S<sc>election</sc> <xref ref-type="bibr" rid="pone.0052505-Malisi1">[24]</xref> it can also be used for enzyme design. P<sc>ocket</sc>O<sc>ptimizer</sc> is a combination of customizable molecular modeling components. Amino acid flexibility is modeled by a side chain conformer library, ligand flexibility is addressed by systematically sampling poses of the ligand in the binding pocket. The score that is optimized is a combination of protein packing energy calculated with the AMBER force field <xref ref-type="bibr" rid="pone.0052505-Ponder1">[31]</xref>, and protein-ligand binding energy calculated using a scoring function. To identify the most promising design, the global minimum energy conformation of a protein pocket with the ligand based on the combined energy score is calculated <xref ref-type="bibr" rid="pone.0052505-Kingsford1">[32]</xref>–<xref ref-type="bibr" rid="pone.0052505-Sontag1">[33]</xref>. Intermediate results like conformers or score tables are stored in standard file formats, making it easy to compare different approaches for a given subtask. Notably, we used two receptor-ligand scoring functions in this study, the scoring function included in CADDSuite <xref ref-type="bibr" rid="pone.0052505-Schumann1">[28]</xref> and Autodock Vina <xref ref-type="bibr" rid="pone.0052505-Trott1">[29]</xref>. <xref ref-type="fig" rid="pone-0052505-g001">Figure 1</xref> depicts the workflow of the P<sc>ocket</sc>O<sc>ptimizer</sc> pipeline.</p>
        <fig id="pone-0052505-g001" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0052505.g001</object-id>
          <label>Figure 1</label>
          <caption>
            <title>Workflow of PocketOptimizer.</title>
            <p>The input specific for a design is depicted in circles, parts of the pipeline are shown in pointed rectangles, and output components in rounded rectangles. The output is stored in standard file formats (SDF and PDB for structural data, csv for energy tables). This allows the easy replacement of a component with another that solves the same task (e.g. replacing the binding score function).</p>
          </caption>
          <graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0052505.g001" position="float" xlink:type="simple"/>
        </fig>
        <p>The program P<sc>ocket</sc>O<sc>ptimizer</sc> is designed as a modular pipeline that allows exchange of program parts, e.g. the use of different available docking functions or force-fields. In contrast to other existing design programs this pipeline aims to provide a platform for the incorporation and testing of available modules so that the contribution of individual parts can be distinguished. In the current implementation of P<sc>ocket</sc>O<sc>ptimizer</sc> we chose to use a conformer library over rotamers. The program is geared towards the design of protein-ligand interaction; however, it can also be used for prediction of protein packing only. Currently not incorporated are backbone flexibility and negative design capabilities.</p>
        <p>P<sc>ocket</sc>O<sc>ptimizer</sc> source code and documentation can be obtained from the authors or from <ext-link ext-link-type="uri" xlink:href="http://www.eb.mpg.de/research-groups/birte-hoecker/algorithms-and-software.html" xlink:type="simple">www.eb.mpg.de/research-groups/birte-hoecker/algorithms-and-software.html</ext-link>.</p>
      </sec>
      <sec id="s2b">
        <title>Benchmark Set</title>
        <p>We compiled a set of twelve proteins with structural and experimental affinity data for the assessment of computational design methods for protein-ligand binding. For this, we systematically searched the PDBbind database <xref ref-type="bibr" rid="pone.0052505-Wang2">[34]</xref>, which lists high quality crystal structures of protein-ligand complexes together with experimentally determined binding data. Each protein in our set has at least two mutational variants (usually the wild type and one or more mutants) accompanied by an affinity measure (the inhibitory constant <inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0052505.e001" xlink:type="simple"/></inline-formula> or dissociation constant <inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0052505.e002" xlink:type="simple"/></inline-formula>) for the same ligand. The positions of amino acids that differ between the variants are always located in the binding pocket or active site. For each protein, there is at least one crystal structure of a variant with the ligand, for ten of the twelve there are two or more crystal structures that allow us to compare a design model of a variant with the respective crystal structure. The proteins and ligands in our benchmark set are very diverse. All ligands are shown in <xref ref-type="fig" rid="pone-0052505-g002">Figure 2</xref>. Each protein in the set belongs to a different fold as defined by SCOP <xref ref-type="bibr" rid="pone.0052505-Murzin1">[35]</xref>, underscoring their structural diversity. This diversity allows design methods to be tested on a wide range of problems and avoids bias. <xref ref-type="table" rid="pone-0052505-t001">Table 1</xref> lists the benchmark proteins and their associated data.</p>
        <fig id="pone-0052505-g002" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0052505.g002</object-id>
          <label>Figure 2</label>
          <caption>
            <title>Two-dimensional structures of benchmark set ligands.</title>
            <p>The ligands of the test cases of our benchmark sets. See <xref ref-type="table" rid="pone-0052505-t001">Table 1</xref> for which ligand belongs to which test case.</p>
          </caption>
          <graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0052505.g002" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap id="pone-0052505-t001" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0052505.t001</object-id>
          <label>Table 1</label>
          <caption>
            <title>Benchmark set.</title>
          </caption>
          <alternatives>
            <graphic id="pone-0052505-t001-1" position="float" mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0052505.t001" xlink:type="simple"/>
            <table>
              <colgroup span="1">
                <col align="left" span="1"/>
                <col align="center" span="1"/>
                <col align="center" span="1"/>
                <col align="center" span="1"/>
                <col align="center" span="1"/>
                <col align="center" span="1"/>
              </colgroup>
              <thead>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td colspan="3" align="left" rowspan="1">Mutants</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Protein</td>
                  <td align="left" rowspan="1" colspan="1">Ligand</td>
                  <td align="left" rowspan="1" colspan="1">Positions</td>
                  <td align="left" rowspan="1" colspan="1">AA</td>
                  <td align="left" rowspan="1" colspan="1">aff. [nM]</td>
                  <td align="left" rowspan="1" colspan="1">PDB</td>
                </tr>
              </thead>
              <tbody>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">F</td>
                  <td align="left" rowspan="1" colspan="1">5.8</td>
                  <td align="left" rowspan="1" colspan="1">1ydb</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">W</td>
                  <td align="left" rowspan="1" colspan="1">8.6</td>
                  <td align="left" rowspan="1" colspan="1">–</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">L</td>
                  <td align="left" rowspan="1" colspan="1">9.6</td>
                  <td align="left" rowspan="1" colspan="1">–</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">R</td>
                  <td align="left" rowspan="1" colspan="1">86</td>
                  <td align="left" rowspan="1" colspan="1">1ydd</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Carbonic anhydrase II</td>
                  <td align="left" rowspan="1" colspan="1">Acetazolamide</td>
                  <td align="left" rowspan="1" colspan="1">198</td>
                  <td align="left" rowspan="1" colspan="1">E</td>
                  <td align="left" rowspan="1" colspan="1">280</td>
                  <td align="left" rowspan="1" colspan="1">1yda</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">D</td>
                  <td align="left" rowspan="1" colspan="1">53</td>
                  <td align="left" rowspan="1" colspan="1">2pql</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">D7r4 amine binding protein</td>
                  <td align="left" rowspan="1" colspan="1">Tryptamine</td>
                  <td align="left" rowspan="1" colspan="1">111</td>
                  <td align="left" rowspan="1" colspan="1">L</td>
                  <td align="left" rowspan="1" colspan="1">inf</td>
                  <td align="left" rowspan="1" colspan="1">–</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">E</td>
                  <td align="left" rowspan="1" colspan="1">0.29</td>
                  <td align="left" rowspan="1" colspan="1">1gwr</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">Q</td>
                  <td align="left" rowspan="1" colspan="1">3.53</td>
                  <td align="left" rowspan="1" colspan="1"/>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"><inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0052505.e003" xlink:type="simple"/></inline-formula>Estrogen receptor</td>
                  <td align="left" rowspan="1" colspan="1">Estradiol</td>
                  <td align="left" rowspan="1" colspan="1">353</td>
                  <td align="left" rowspan="1" colspan="1">A</td>
                  <td align="left" rowspan="1" colspan="1">60</td>
                  <td align="left" rowspan="1" colspan="1">–</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">FIFI</td>
                  <td align="left" rowspan="1" colspan="1">0.4</td>
                  <td align="left" rowspan="1" colspan="1">1met</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">VIVI</td>
                  <td align="left" rowspan="1" colspan="1">0.8</td>
                  <td align="left" rowspan="1" colspan="1">–</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">VVVV</td>
                  <td align="left" rowspan="1" colspan="1">20</td>
                  <td align="left" rowspan="1" colspan="1">1mes</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">HIV-1 protease</td>
                  <td align="left" rowspan="1" colspan="1">DMP323</td>
                  <td align="left" rowspan="1" colspan="1">A:82, A:84, B:82, B:84</td>
                  <td align="left" rowspan="1" colspan="1">FVFV</td>
                  <td align="left" rowspan="1" colspan="1">800</td>
                  <td align="left" rowspan="1" colspan="1">1meu</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">N</td>
                  <td align="left" rowspan="1" colspan="1">810</td>
                  <td align="left" rowspan="1" colspan="1">1ogx</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Ketosteroid isomerase</td>
                  <td align="left" rowspan="1" colspan="1">Equilenin</td>
                  <td align="left" rowspan="1" colspan="1">240</td>
                  <td align="left" rowspan="1" colspan="1">D</td>
                  <td align="left" rowspan="1" colspan="1">45750</td>
                  <td align="left" rowspan="1" colspan="1">1oh0</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">AG</td>
                  <td align="left" rowspan="1" colspan="1">2780</td>
                  <td align="left" rowspan="1" colspan="1">2jdn</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Lectin II</td>
                  <td align="left" rowspan="1" colspan="1">O1-methyl-mannose</td>
                  <td align="left" rowspan="1" colspan="1">22, 24</td>
                  <td align="left" rowspan="1" colspan="1">SN</td>
                  <td align="left" rowspan="1" colspan="1">42900</td>
                  <td align="left" rowspan="1" colspan="1">2jdy</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">H</td>
                  <td align="left" rowspan="1" colspan="1">2000</td>
                  <td align="left" rowspan="1" colspan="1">1egh</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">N</td>
                  <td align="left" rowspan="1" colspan="1">5800</td>
                  <td align="left" rowspan="1" colspan="1">1s89</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Methylglyoxal synthase</td>
                  <td align="left" rowspan="1" colspan="1">2-Phospho-glycolate</td>
                  <td align="left" rowspan="1" colspan="1">98</td>
                  <td align="left" rowspan="1" colspan="1">Q</td>
                  <td align="left" rowspan="1" colspan="1">46000</td>
                  <td align="left" rowspan="1" colspan="1">1s8a</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">H</td>
                  <td align="left" rowspan="1" colspan="1">0.32</td>
                  <td align="left" rowspan="1" colspan="1">2hu4</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Neuroaminidase test 1</td>
                  <td align="left" rowspan="1" colspan="1">Oseltamivir</td>
                  <td align="left" rowspan="1" colspan="1">274</td>
                  <td align="left" rowspan="1" colspan="1">Y</td>
                  <td align="left" rowspan="1" colspan="1">84.8</td>
                  <td align="left" rowspan="1" colspan="1">3cl0</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">N</td>
                  <td align="left" rowspan="1" colspan="1">0.32</td>
                  <td align="left" rowspan="1" colspan="1">2hu4</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Neuroaminidase test 2</td>
                  <td align="left" rowspan="1" colspan="1">Oseltamivir</td>
                  <td align="left" rowspan="1" colspan="1">294</td>
                  <td align="left" rowspan="1" colspan="1">S</td>
                  <td align="left" rowspan="1" colspan="1">25.9</td>
                  <td align="left" rowspan="1" colspan="1">3cl2</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">H</td>
                  <td align="left" rowspan="1" colspan="1">0.01</td>
                  <td align="left" rowspan="1" colspan="1">1rsz</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">G</td>
                  <td align="left" rowspan="1" colspan="1">0.27</td>
                  <td align="left" rowspan="1" colspan="1">2a0w</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">D</td>
                  <td align="left" rowspan="1" colspan="1">0.9</td>
                  <td align="left" rowspan="1" colspan="1">2a0y</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Purine nucleoside phosphorylase</td>
                  <td align="left" rowspan="1" colspan="1">DADMe-Immucillin-H</td>
                  <td align="left" rowspan="1" colspan="1">257</td>
                  <td align="left" rowspan="1" colspan="1">F</td>
                  <td align="left" rowspan="1" colspan="1">0.95</td>
                  <td align="left" rowspan="1" colspan="1">2a0x</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">N</td>
                  <td align="left" rowspan="1" colspan="1">0.0001</td>
                  <td align="left" rowspan="1" colspan="1">1swe</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">E</td>
                  <td align="left" rowspan="1" colspan="1">0.0069</td>
                  <td align="left" rowspan="1" colspan="1">–</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Streptavidin test 1</td>
                  <td align="left" rowspan="1" colspan="1">Biotin</td>
                  <td align="left" rowspan="1" colspan="1">23</td>
                  <td align="left" rowspan="1" colspan="1">A</td>
                  <td align="left" rowspan="1" colspan="1">0.028</td>
                  <td align="left" rowspan="1" colspan="1">1n43</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">S</td>
                  <td align="left" rowspan="1" colspan="1">0.0001</td>
                  <td align="left" rowspan="1" colspan="1">1swe</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Streptavidin test 2</td>
                  <td align="left" rowspan="1" colspan="1">Biotin</td>
                  <td align="left" rowspan="1" colspan="1">27</td>
                  <td align="left" rowspan="1" colspan="1">A</td>
                  <td align="left" rowspan="1" colspan="1">0.01</td>
                  <td align="left" rowspan="1" colspan="1">1n9m</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">C</td>
                  <td align="left" rowspan="1" colspan="1">490</td>
                  <td align="left" rowspan="1" colspan="1">1nja</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">D</td>
                  <td align="left" rowspan="1" colspan="1">2800</td>
                  <td align="left" rowspan="1" colspan="1">1njc</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Thymidylate synthase</td>
                  <td align="left" rowspan="1" colspan="1">dCMP</td>
                  <td align="left" rowspan="1" colspan="1">229</td>
                  <td align="left" rowspan="1" colspan="1">N</td>
                  <td align="left" rowspan="1" colspan="1">160000</td>
                  <td align="left" rowspan="1" colspan="1">1nje</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">DG</td>
                  <td align="left" rowspan="1" colspan="1">12000</td>
                  <td align="left" rowspan="1" colspan="1">1ane</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Trypsin</td>
                  <td align="left" rowspan="1" colspan="1">Benzamidine</td>
                  <td align="left" rowspan="1" colspan="1">189, 226</td>
                  <td align="left" rowspan="1" colspan="1">GD</td>
                  <td align="left" rowspan="1" colspan="1">15000000</td>
                  <td align="left" rowspan="1" colspan="1">1bra</td>
                </tr>
              </tbody>
            </table>
          </alternatives>
          <table-wrap-foot>
            <fn id="nt101">
              <label/>
              <p>Each row lists a test case. Columns <bold>Protein</bold> and <bold>Ligand</bold> contain the name of protein or ligand, <bold>Positions</bold> the indices of the mutable positions (for HIV protease along with the chain identifier, in the other cases the pocket is formed by one chain only), <bold>Mutants</bold> lists the variants: in subcolumn <bold>AA</bold> the amino acids at the mutable positions, in <bold>aff.</bold> the affinities of the variants, and in <bold>PDB</bold> the PDB identifier of the corresponding crystal structure, should one exist.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec id="s2c">
        <title>Benchmark Results</title>
        <p>The optimization scheme of P<sc>ocket</sc>O<sc>ptimizer</sc> simultaneously chooses sequence and conformation. It can go over many alternatives. For the benchmark, however, it was necessary to restrict the sequence to the mutations for which experimental data was available. We tested the performance of P<sc>ocket</sc>O<sc>ptimizer</sc> on the benchmark set using Autodock Vina and CADDSuite receptor-ligand scores as well as R<sc>osetta</sc>’s enzyme design application. Each method was used for the same set of design calculations. Each available crystal structure was used as a scaffold for the design of each mutational variant. We obtained a design for each mutation in each scaffold structure by forcing the methods to select a particular mutation in a separate run. This allowed us to compare the predicted binding and total energy scores as well as the designed conformations with the experimental data. <xref ref-type="fig" rid="pone-0052505-g003">Figure 3</xref> shows the RMSD values between the designs and the respective crystal structures. This is a measure of how well the respective method models the conformation of the binding pocket residues and the ligand pose in the pocket. R<sc>osetta</sc> performs better in modeling side chains in the binding pocket. The difference between the pocket RMSDs of R<sc>osetta</sc> and each of the two P<sc>ocket</sc>O<sc>ptimizer</sc> variants is statistically significant with a p-value &lt;0.01 according to a Mann-Whitney test. This might not come as a surprise considering that the R<sc>osetta</sc> molecular modeling software is extensively used and optimized for protein packing tasks, especially protein structure prediction. P<sc>ocket</sc>O<sc>ptimizer</sc> on the other hand focuses on the identification of residues interacting favorably with the ligand. The observed differences in ligand pose RMSD are not statistically significant (<xref ref-type="fig" rid="pone-0052505-g003">Figure 3</xref>). 
To assess whether the methods can differentiate correctly between protein variants that have a large affinity difference, we looked at pairs that have an affinity difference of at least 50-fold. This cutoff translates to roughly 2.3 kcal/mol and was chosen to make sure that only pairs with clear, trustworthy affinity differences well outside experimental error are investigated. <xref ref-type="table" rid="pone-0052505-t002">Table 2</xref> lists the number of pairs in which the order of the mutants according to energy score is the same as the order according to affinity, meaning the design method would produce the correct ranking. Here, P<sc>ocket</sc>O<sc>ptimizer</sc> performs in the same range as R<sc>osetta</sc>, with 69% correctly predicted pairs as opposed to 64%. When comparing the two receptor-ligand score functions we used in our approach, it seems that Autodock Vina has some advantage over the CADDSuite score. The total scores of the different methods are also listed. Based on these scores, P<sc>ocket</sc>O<sc>ptimizer</sc> performs even better with 71% and 76% correctly predicted pairs. However, since we are looking at affinity prediction, the binding score appears to be more appropriate for the comparison.</p>
        <fig id="pone-0052505-g003" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0052505.g003</object-id>
          <label>Figure 3</label>
          <caption>
            <title>Differences of the ligand poses and pocket side chains in the benchmark designs compared to the crystal structures.</title>
            <p>The upper graph shows the average RMSDs and standard deviation between the ligand pose in the designs and in the crystal structures. The lower graph shows the average RMSD and standard deviation between the binding pocket side chain heavy atoms of designs and the corresponding crystal structure. The RMSDs are calculated after superimposing the structures using the backbone to make sure that the differences come from pocket/ligand pose differences only. RMSDs from P<sc>ocket</sc>O<sc>ptimizer</sc> CADDSuite score designs are plotted in blue, from P<sc>ocket</sc>O<sc>ptimizer</sc> Vina designs in green, and from Rosetta designs in red. Each point marks the average RMSD for all designs of a test case using one score. The number of designs that contribute to a value depends on the number of mutations with a crystal structure; it is the square of this number (because each structure is used as a design scaffold for each mutation). Test cases are: <italic>CA</italic>: Carbonic anhydrase II, <italic>ABP</italic>: D7r4 amine binding protein, <italic>ER</italic>: Estrogen receptor <inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0052505.e004" xlink:type="simple"/></inline-formula>, <italic>HP</italic>: HIV-1 protease, <italic>KI</italic>: Ketosteroid isomerase, <italic>L</italic>: Lectin, <italic>MS</italic>: Methylglyoxal synthase, <italic>N1</italic>: Neuroaminidase test 1, <italic>N2</italic>: Neuroaminidase test 2, <italic>PNP</italic>: Purine nucleoside phosphorylase, <italic>S1</italic>: Streptavidin test 1, <italic>S2</italic>: Streptavidin test 2, <italic>TS</italic>: Thymidylate synthase, <italic>T</italic>: Trypsin.</p>
          </caption>
          <graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0052505.g003" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap id="pone-0052505-t002" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0052505.t002</object-id>
          <label>Table 2</label>
          <caption>
            <title>Order of designs by predicted binding score.</title>
          </caption>
          <alternatives>
            <graphic id="pone-0052505-t002-2" position="float" mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0052505.t002" xlink:type="simple"/>
            <table>
              <colgroup span="1">
                <col align="left" span="1"/>
                <col align="center" span="1"/>
                <col align="center" span="1"/>
                <col align="center" span="1"/>
                <col align="center" span="1"/>
                <col align="center" span="1"/>
                <col align="center" span="1"/>
              </colgroup>
              <thead>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Test Cases</td>
                  <td colspan="2" align="left" rowspan="1">CADDSuite</td>
                  <td colspan="2" align="left" rowspan="1">Vina</td>
                  <td colspan="2" align="left" rowspan="1">Rosetta</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1"/>
                  <td align="left" rowspan="1" colspan="1">Total</td>
                  <td align="left" rowspan="1" colspan="1">Binding</td>
                  <td align="left" rowspan="1" colspan="1">Total</td>
                  <td align="left" rowspan="1" colspan="1">Binding</td>
                  <td align="left" rowspan="1" colspan="1">Total</td>
                  <td align="left" rowspan="1" colspan="1">Binding</td>
                </tr>
              </thead>
              <tbody>
                <tr>
                  <td align="left" rowspan="1" colspan="1">D7r4 amine binding protein</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Estrogen receptor</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                  <td align="left" rowspan="1" colspan="1">1/1</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">HIV-1 protease</td>
                  <td align="left" rowspan="1" colspan="1">6/9</td>
                  <td align="left" rowspan="1" colspan="1">6/9</td>
                  <td align="left" rowspan="1" colspan="1">9/9</td>
                  <td align="left" rowspan="1" colspan="1">9/9</td>
                  <td align="left" rowspan="1" colspan="1">5/9</td>
                  <td align="left" rowspan="1" colspan="1">8/9</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Ketosteroid isomerase</td>
                  <td align="left" rowspan="1" colspan="1">2/2</td>
                  <td align="left" rowspan="1" colspan="1">2/2</td>
                  <td align="left" rowspan="1" colspan="1">2/2</td>
                  <td align="left" rowspan="1" colspan="1">2/2</td>
                  <td align="left" rowspan="1" colspan="1">1/2</td>
                  <td align="left" rowspan="1" colspan="1">1/2</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Neuroaminidase test 1</td>
                  <td align="left" rowspan="1" colspan="1">0/2</td>
                  <td align="left" rowspan="1" colspan="1">0/2</td>
                  <td align="left" rowspan="1" colspan="1">0/2</td>
                  <td align="left" rowspan="1" colspan="1">0/2</td>
                  <td align="left" rowspan="1" colspan="1">1/2</td>
                  <td align="left" rowspan="1" colspan="1">0/2</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Neuroaminidase test 2</td>
                  <td align="left" rowspan="1" colspan="1">2/2</td>
                  <td align="left" rowspan="1" colspan="1">1/2</td>
                  <td align="left" rowspan="1" colspan="1">1/2</td>
                  <td align="left" rowspan="1" colspan="1">0/2</td>
                  <td align="left" rowspan="1" colspan="1">0/2</td>
                  <td align="left" rowspan="1" colspan="1">2/2</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Purine nucleoside phosphorylase</td>
                  <td align="left" rowspan="1" colspan="1">6/8</td>
                  <td align="left" rowspan="1" colspan="1">6/8</td>
                  <td align="left" rowspan="1" colspan="1">7/8</td>
                  <td align="left" rowspan="1" colspan="1">6/8</td>
                  <td align="left" rowspan="1" colspan="1">4/8</td>
                  <td align="left" rowspan="1" colspan="1">2/8</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Streptavidin test 1</td>
                  <td align="left" rowspan="1" colspan="1">4/4</td>
                  <td align="left" rowspan="1" colspan="1">4/4</td>
                  <td align="left" rowspan="1" colspan="1">4/4</td>
                  <td align="left" rowspan="1" colspan="1">4/4</td>
                  <td align="left" rowspan="1" colspan="1">3/4</td>
                  <td align="left" rowspan="1" colspan="1">3/4</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Streptavidin test 2</td>
                  <td align="left" rowspan="1" colspan="1">2/2</td>
                  <td align="left" rowspan="1" colspan="1">2/2</td>
                  <td align="left" rowspan="1" colspan="1">2/2</td>
                  <td align="left" rowspan="1" colspan="1">2/2</td>
                  <td align="left" rowspan="1" colspan="1">2/2</td>
                  <td align="left" rowspan="1" colspan="1">1/2</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Thymidylate synthase</td>
                  <td align="left" rowspan="1" colspan="1">1/6</td>
                  <td align="left" rowspan="1" colspan="1">0/6</td>
                  <td align="left" rowspan="1" colspan="1">1/6</td>
                  <td align="left" rowspan="1" colspan="1">0/6</td>
                  <td align="left" rowspan="1" colspan="1">6/6</td>
                  <td align="left" rowspan="1" colspan="1">3/6</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">Trypsin</td>
                  <td align="left" rowspan="1" colspan="1">1/2</td>
                  <td align="left" rowspan="1" colspan="1">1/2</td>
                  <td align="left" rowspan="1" colspan="1">1/2</td>
                  <td align="left" rowspan="1" colspan="1">1/2</td>
                  <td align="left" rowspan="1" colspan="1">0/2</td>
                  <td align="left" rowspan="1" colspan="1">1/2</td>
                </tr>
                <tr>
                  <td align="left" rowspan="1" colspan="1">
                    <bold>Mean</bold>
                  </td>
                  <td align="left" rowspan="1" colspan="1">
                    <bold>70.8%</bold>
                  </td>
                  <td align="left" rowspan="1" colspan="1">
                    <bold>65.6%</bold>
                  </td>
                  <td align="left" rowspan="1" colspan="1">
                    <bold>75.5%</bold>
                  </td>
                  <td align="left" rowspan="1" colspan="1">
                    <bold>68.8%</bold>
                  </td>
                  <td align="left" rowspan="1" colspan="1">
                    <bold>63.5%</bold>
                  </td>
                  <td align="left" rowspan="1" colspan="1">
                    <bold>63.5%</bold>
                  </td>
                </tr>
              </tbody>
            </table>
          </alternatives>
          <table-wrap-foot>
            <fn id="nt102">
              <label/>
              <p><bold>Numbers of correctly ranked design mutation pairs with large affinity difference.</bold> All mutation pairs for which there is an affinity difference of at least 50-fold are investigated. All design pairs with these mutations (i.e. for each of these pairs there are as many design pairs as scaffold crystal structures) are checked to see whether the order of the mutations by total score or binding score is the same as the order by affinity. A cell shows the number of correctly ordered design pairs, and the number of all design pairs. The mean for this part is calculated by scaling the percentage of a test case by the number of mutation pairs (i.e. NOT by design pairs, which would bias the value too much towards test cases with many crystal structures).</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>We further examined how well the energy scores correlate with the affinities. For this we plotted the predicted energy of each design against the logarithmic affinities for all seven test cases with more than two mutations (<xref ref-type="fig" rid="pone-0052505-g004">Figure 4</xref>). The scores should correspond to the binding free energy, which in turn is proportional to the logarithm of the affinity of binding. Here, all mutants with experimental affinity values of a test case are included, regardless of the extent of the affinity difference. Overall we find that the energy values follow the affinity logarithm only in some cases.</p>
        <fig id="pone-0052505-g004" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0052505.g004</object-id>
          <label>Figure 4</label>
          <caption>
            <title>Comparison of the energy scores versus the affinities of the mutations shows how well the programs reproduce the differences.</title>
            <p>For each test case with more than two mutations, we plotted the top binding scores of CADDSuite, Vina, and Rosetta designs for each mutation on each scaffold structure together with the logarithm of the affinity. Here we show plots for Carbonic anhydrase II, HIV-1 protease, and Streptavidin test 1. All other plots are shown in <xref ref-type="supplementary-material" rid="pone.0052505.s001">Information S1</xref>. Values are scaled to fit in the same range. Shown on the x-axis of a plot are the mutants in order of affinity to the ligand (the leftmost has the lowest affinity, compare <xref ref-type="table" rid="pone-0052505-t001">Table 1</xref> for the actual values). The y-axis measures predicted binding scores for the designs, and the log affinities, scaled between 0 and 1. Both are proportional to the binding free energy, and can therefore be compared when scaled to the same range. The lowest predicted binding score or log affinity is set to 0, the highest respective value to 1. Each plot contains a line for the affinity logarithm (solid, black, no marker). This line represents the goal: if a method predicts binding well, the binding score lines should closely follow the log affinity line. The other markers and lines show the scaled predicted binding scores. One line represents the designs calculated for all available mutants, calculated by using one crystal structure as the scaffold. (Crystal structure 1: dashed, blue, circle markers; structure 2: red, dotted, square markers; structure 3: green, dash-dot pattern, diamond markers; structure 4: cyan, two dashes one dot pattern, star markers). We chose to use lines for representation, because this makes it easy to visually compare the shape of the black log affinity line to the lines representing the design binding scores. 
Each row has plots for one test case, in parentheses the order of scaffold structures is listed: <italic>CA</italic>: Carbonic anhydrase II (1ydb, 1yda, 1ydd), <italic>HP</italic>: HIV-1 protease (1met, 1meu, 1mes), <italic>S1</italic>: Streptavidin test 1 (1swe, 1n43).</p>
          </caption>
          <graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0052505.g004" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec id="s2d">
        <title>Discussion of Benchmark Results</title>
        <p>When looking at a pair of protein variants, P<sc>ocket</sc>O<sc>ptimizer</sc> is able to correctly predict which variant has a better binding affinity if that difference is based on the introduction or abolition of a direct interaction of the mutable residue’s side chain with the ligand. This is especially noteworthy for pairs where one residue forms a hydrogen bond with the ligand, while the other does not. This was predicted correctly in seven of eight cases where the better binding variant forms an additional hydrogen bond. It also works well if the variable side chain of one mutation variant is bulkier than its counterpart in another variant, and therefore packs better against the ligand, i.e. forms more van der Waals (vdW) interactions with the ligand and shields it better from solvent, improving the solvation energy contribution. A potential downside of this effect of vdW contact improvement is that P<sc>ocket</sc>O<sc>ptimizer</sc> sometimes seems to prefer larger side chains even if they are detrimental to binding for other reasons. This tendency could lead to an overpacking of the designed pocket. When differences in binding have more complex causes, such as rearrangements in the pocket’s side chains that affect the ligand interaction indirectly by influencing other pocket side chains, the program generally fails to capture these differences.</p>
        <p>Both scoring functions used within P<sc>ocket</sc>O<sc>ptimizer</sc>, from Autodock Vina and CADDSuite, produce results that are quite similar. The overpacking effect discussed before is less pronounced in Vina, which explains its slightly better performance in predicting which variant of a pair binds better (see <xref ref-type="table" rid="pone-0052505-t002">Table 2</xref>). Generally, the order of the designs by energy scores calculated by our method does not depend on which variant’s crystal structure was used as the scaffold. Only in a few cases a significant difference can be observed, notably for carbonic anhydrase II and trypsin.</p>
        <p>In some cases, the P<sc>ocket</sc>O<sc>ptimizer</sc> designs did not contain a conformational configuration that avoids vdW clashes in the binding pocket. In one test case, namely for neuraminidase, the program was unable to identify any acceptable pocket conformation. One limitation of P<sc>ocket</sc>O<sc>ptimizer</sc> and a probable cause for such problems is the assumption of a fixed backbone in our designs. An adjustment of the backbone conformation might have helped to accommodate the tyrosine. It is also conceivable that our way of systematically sampling possible ligand poses could have failed to generate a pose that is sterically compatible in the neuraminidase case.</p>
        <p>Rosetta’s enzyme design application does not suffer from unresolvable vdW clashes. It includes minimization steps in its algorithm that can resolve potential clashes introduced by discrete conformational sampling. However, Rosetta apparently cannot convey its superiority in modeling the binding pocket side chains to the prediction of the correct binding score order. It is unable to predict the rearrangements of side chain conformations that lead to binding affinity changes in the more complicated test cases. The energy term for hydrogen bonds in R<sc>osetta</sc> seems to have less influence on the output than in our program. This causes R<sc>osetta</sc> to miss existing hydrogen bonds between ligand and side chains. The binding scores and their differences predicted for different mutants are more dependent on the scaffold structure used in Rosetta designs than they are in P<sc>ocket</sc>O<sc>ptimizer</sc>. This can be seen in <xref ref-type="fig" rid="pone-0052505-g004">Figure 4</xref>: the lines for designs of both P<sc>ocket</sc>O<sc>ptimizer</sc> variants, Vina and CADDSuite, are more similar to each other than the ones for R<sc>osetta</sc> designs. This is rather surprising, as we anticipated that the limited backbone flexibility included in the R<sc>osetta</sc> enzyme design protocol would lead to less dependency on these small input structure differences.</p>
        <p>A more detailed description of each test case, including what is known from experimental and structural studies about the factors that influence binding differences in the test cases, as well as the success of the methods in reproducing these factors, is provided in the <xref ref-type="supplementary-material" rid="pone.0052505.s001">Information S1</xref>.</p>
      </sec>
      <sec id="s2e">
        <title>Conclusion</title>
        <p>We developed a pipeline of molecular modeling tools named P<sc>ocket</sc>O<sc>ptimizer</sc>. The program can be used to predict affinity altering mutations in existing protein binding pockets. For enzyme design applications it can be combined with a program such as S<sc>caffold</sc>S<sc>election</sc> <xref ref-type="bibr" rid="pone.0052505-Malisi1">[24]</xref>. In P<sc>ocket</sc>O<sc>ptimizer</sc> receptor-ligand scoring functions are used to assess binding. For its evaluation, we compiled a benchmark set of proteins for which crystal structures and experimental affinity data are available and that can be used to test our and other methodologies. We subjected P<sc>ocket</sc>O<sc>ptimizer</sc> as well as the state-of-the-art method R<sc>osetta</sc> to our benchmark test. The overall performance of both approaches was similar, but in detail both had different benefits. R<sc>osetta</sc> handles the conformational modeling of the binding pocket better, while P<sc>ocket</sc>O<sc>ptimizer</sc> has the advantage in predicting which of a pair of mutants of the same protein binds the ligand better. This prediction was correct in 66 or 69% of the tested cases using P<sc>ocket</sc>O<sc>ptimizer</sc> (CADDSuite or Vina score, respectively) and in 64% of the cases using R<sc>osetta</sc>.</p>
        <p>The results show that P<sc>ocket</sc>O<sc>ptimizer</sc> is a well performing tool for the design of protein-ligand interactions. It is especially suited for the introduction of a hydrogen bond if there is an unsatisfied hydrogen donor or acceptor group in the ligand, and for filling voids between the protein and the ligand to improve vdW interactions. For affinity design problems that require a more complex rearrangement of the binding pocket, e.g. a mutation making room for another side chain to interact with the ligand, none of the tested methods appear to perform well.</p>
        <p>There are also some other obvious effects that can influence binding, but that are not addressable with the current methods, e.g. protein dynamics or rearrangements of the backbone. Such problems are probably harder to address than the more complicated test cases dealt with in this study, so that we do not expect that current methods can tackle them with much success. Some apparent problems of P<sc>ocket</sc>O<sc>ptimizer</sc>, however, such as the occurrence of unresolvable steric clashes between ligand and side chains should be mendable by better sampling of the conformational space and the introduction of backbone flexibility <xref ref-type="bibr" rid="pone.0052505-Georgiev1">[36]</xref> <xref ref-type="bibr" rid="pone.0052505-Smith1">[37]</xref>–<xref ref-type="bibr" rid="pone.0052505-Kellogg1">[38]</xref>. It is conceivable that a continuous minimization step at the end of the design calculation could also be beneficial.</p>
        <p>In conclusion, it seems that although P<sc>ocket</sc>O<sc>ptimizer</sc> performs well, and even better in some respects than the state-of-the-art method R<sc>osetta</sc>, there is still room for improvement in computational design of protein-ligand binding. Our study highlights the usefulness of benchmark data sets and systematic testing in order to arrive at an informed assessment of computational design methods. In fact it would be interesting to test other available protein design schemes using our benchmark. A comparison of their performance should be very informative. Further, the benchmark will be useful in future tests of parts of our modular design pipeline, e.g. by exchanging the force-field in P<sc>ocket</sc>O<sc>ptimizer</sc>, its contribution can be tested rather than the overall design approach.</p>
        <p>When we started to compile our benchmark set, we were hoping for considerably more test cases. The fact that out of the 6,005 protein structures currently contained in the PDBbind database, only ten suitable test cases could be extracted (twelve if the double cases of neuraminidase and streptavidin are counted), was rather surprising to us. This emphasizes the need for more benchmark data. Thus, an explicit effort to systematically create experimental and structural data is required. For protein-ligand interaction design it would be desirable to have data that covers many mutations of several pocket positions, ideally also of a set of different proteins.</p>
      </sec>
    </sec>
    <sec id="s3" sec-type="materials|methods">
      <title>Materials and Methods</title>
      <sec id="s3a">
        <title>Benchmark Set</title>
        <p>The basis for the benchmark set is the PDBbind database. It contains a set of crystal structures of proteins complexed with small ligands, and the corresponding experimentally determined binding affinity <xref ref-type="bibr" rid="pone.0052505-Wang2">[34]</xref>. Our analysis is based on release 2010. First, we aligned the sequences of all proteins in the database to each other, using the Needleman-Wunsch algorithm <xref ref-type="bibr" rid="pone.0052505-Needleman1">[39]</xref> as implemented in the EMBOSS suite <xref ref-type="bibr" rid="pone.0052505-Rice1">[40]</xref>. The proteins were then clustered with single linkage clustering; a link was assumed if the sequence identity was ≥95%. One cluster was assumed to contain structures of variants of the same protein with some mutations. Several descriptors were calculated for the protein-ligand complexes. If the crystal structure contains water molecules in the binding pocket, waters that have a high probability to play a role in binding were identified and counted. This was done with the tool W<sc>ater</sc>F<sc>inder</sc> included in CADDSuite <xref ref-type="bibr" rid="pone.0052505-Schumann1">[28]</xref>, <xref ref-type="bibr" rid="pone.0052505-Hildebrandt1">[41]</xref> that estimates the strength of binding of a water molecule observed in a crystal structure to the protein. The number of rotatable bonds in the ligand is used as a measure of ligand size and flexibility. The ligands of all proteins in a cluster were pairwise compared using ligand fingerprints as implemented in OpenBabel <xref ref-type="bibr" rid="pone.0052505-OBoyle1">[42]</xref> to measure their similarity and identity. For protein pairs of the same cluster with identical ligands, the pockets as defined by PDBbind were investigated for any mismatches corresponding to mutations. 
To identify suitable protein pairs, we searched our dataset for protein variants within a cluster that (1) have the same ligand bound, (2) contain at least one mutation in the binding pocket, (3) have no mutations elsewhere, (4) contain fewer than four water molecules potentially involved in binding, and (5) have a ligand with fewer than 15 rotatable bonds. As the results contained mostly single mutants, an additional search was performed looking for mutants with (1) at least two mutations in the pocket, (2) no mutations elsewhere, (3) allowing for fewer than 15 rotatable ligand bonds and (4) fewer than 7 potential binding water molecules. The proteins identified by these searches were investigated further by visually inspecting their structure and looking at the corresponding literature. Suitable proteins were included in our set. Reasons for rejecting a protein were large conformational differences of the backbone in the binding pocket, the fact that affinity differences between variants are not caused by any protein-ligand interaction, but for example by changes in protein dynamics, and missing atoms of residues in the binding pocket in a crystal structure.</p>
      </sec>
      <sec id="s3b">
        <title>Design Pipeline PocketOptimizer</title>
        <p>A diagram of the P<sc>ocket</sc>O<sc>ptimizer</sc> workflow is shown in <xref ref-type="fig" rid="pone-0052505-g001">Figure 1</xref>. The backbone conformation of the protein stays fixed in the calculations, as do the side chain conformations of residues that do not contact the ligand or a residue that is mutated between variants. Amino acid side chain flexibility is sampled by a conformer library we compiled for this purpose <xref ref-type="bibr" rid="pone.0052505-Shetty1">[25]</xref>–<xref ref-type="bibr" rid="pone.0052505-Xiang1">[27]</xref>. For this, a set of high-quality protein structures from the PDB was selected by requiring a maximal resolution of 1.2 Å, at least 40 residues, and no CAVEAT record. Hydrogen atoms were added using reduce <xref ref-type="bibr" rid="pone.0052505-Word1">[43]</xref>. Side chain conformers of these structures were further filtered by requiring a temperature factor below 30, no alternative conformations and no overlaps with other atoms in the structure according to probe <xref ref-type="bibr" rid="pone.0052505-Word2">[44]</xref>. The conformers were superimposed at the backbone atoms and clustered as described in reference <xref ref-type="bibr" rid="pone.0052505-Boas1">[22]</xref>, resulting in 2211 conformers. The generation of ligand conformers and binding pocket poses also closely follows reference <xref ref-type="bibr" rid="pone.0052505-Boas1">[22]</xref>. Ligand conformers are created with <sc>omega</sc>2 by OpenEye Software <xref ref-type="bibr" rid="pone.0052505-Hawkins1">[45]</xref>. These are superimposed onto the ligand in the crystal structure, rotated around 6 approximately equally distributed axes through the ligand center of mass, and translated in x, y, z directions. The resulting ligand poses are filtered to exclude poses with obvious clashes with the protein backbone.</p>
        <p>Binding energy scores between protein and ligand are calculated by a receptor-ligand scoring function. The first one is contained in CADDSuite <xref ref-type="bibr" rid="pone.0052505-Schumann1">[28]</xref>. It is composed of terms for electrostatic, vdW, solvation and hydrogen bond energy scores. The second score used by P<sc>ocket</sc>O<sc>ptimizer</sc> is Autodock Vina <xref ref-type="bibr" rid="pone.0052505-Trott1">[29]</xref>. Protein packing energies are calculated using the AMBER force field <xref ref-type="bibr" rid="pone.0052505-Ponder1">[31]</xref> with electrostatics scaled by a factor of 0.01. In order to be compatible with the energy score optimization algorithm, the energy values have to be pairwise decomposable, i.e. of the form <inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0052505.e005" xlink:type="simple"/></inline-formula>. <inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0052505.e006" xlink:type="simple"/></inline-formula> are the self energies of the variables (side chain conformers or ligand poses), i.e. their inherent energies and the energies with the fixed protein parts, and <inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0052505.e007" xlink:type="simple"/></inline-formula> the pairwise energies between the variables. As we are interested in improving binding affinity, we chose to upscale the binding energies by a factor of ten for CADDSuite scores and a factor of 100 for Autodock Vina scores to arrive at absolute values that are in the same range as the AMBER packing energies. The <inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0052505.e008" xlink:type="simple"/></inline-formula> and <inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0052505.e009" xlink:type="simple"/></inline-formula> energy tables are computed for all side chain conformers at the pocket positions and the ligand poses. 
The problem of finding the minimum energy conformation is formulated in graph-theoretic terms <xref ref-type="bibr" rid="pone.0052505-Kingsford1">[32]</xref> and solved using the MPLP algorithm by Sontag et al. <xref ref-type="bibr" rid="pone.0052505-Sontag1">[33]</xref>. The energy minimum identifies the best design with corresponding score values and conformation.</p>
        <p>P<sc>ocket</sc>O<sc>ptimizer</sc> is realized as a collection of binaries and scripts that perform the different subtasks. It was developed and tested on Ubuntu Linux 10.04 operating system. AMBER packing energy calculations are implemented in C++ using BALL <xref ref-type="bibr" rid="pone.0052505-Hildebrandt1">[41]</xref>, so is the ligand pose generation tool. Protein-ligand energies for CADDSuite are calculated with a scorer binary implemented in C++ as well; Vina energies are calculated using the vina binary provided with the Autodock Vina software distribution. The side chain conformer library contains the structures of the amino acid side chains in PDB and SDF formats. Several Python scripts are provided that interface between the different parts and allow a convenient conducting of a protein design task with the P<sc>ocket</sc>O<sc>ptimizer</sc> pipeline. Intermediate results are stored in standard file formats, SDF and PDB formats for structural data, and CSV files for energy tables. This allows the user to easily inspect this data with standard tools. It also facilitates the possibility to use a different approach for one of the modules, e.g. a different docking function, while the rest of the pipeline can remain unaltered.</p>
      </sec>
      <sec id="s3c">
        <title>Setup for PocketOptimizer Benchmark</title>
        <p>The protein structures were briefly minimized using C<sc>himera</sc>’s <xref ref-type="bibr" rid="pone.0052505-Pettersen1">[46]</xref> AMBER implementation. Amino acids of the binding pocket positions that were allowed to change conformations in the calculations had to have a distance smaller than 4 Å of at least one side chain atom to the ligand or to one of the residues that are mutable. Ligand conformers were rotated by ±20° around each axis and translated by 0.5 Å in each direction to create the ligand poses. If this resulted in more than 3000 poses, the conformers were filtered by similarity to the crystal structure conformation until meeting the max 3000 poses criterion. For proteins that contain metals in their binding pocket that are coordinated by the ligand, the ligand poses were filtered for poses that are geometrically compatible for coordination.</p>
      </sec>
      <sec id="s3d">
        <title>Rosetta Design Setup</title>
        <p>The R<sc>osetta</sc> enzyme design application as implemented in R<sc>osetta</sc> 3.3 <xref ref-type="bibr" rid="pone.0052505-Richter1">[30]</xref> was used with parameters closely following the relevant documentation. Protein structures were briefly minimized using the R<sc>osetta</sc> receptor preparation application provided for this task, generating ten resulting structures of which the one with the best energy was used for the design runs. Ligand conformers were generated using <sc>omega</sc>2, ligand charges added with the <sc>quacpac</sc> program of OpenEye software <xref ref-type="bibr" rid="pone.0052505-Hawkins1">[45]</xref>, and R<sc>osetta</sc> ligand params files generated with the provided molfile_to_params python script as included in the 3.3 distribution. No catalytic constraints were used for the enzyme design application runs, effectively making it a receptor design application. 1000 designs were created for every protein and every mutation on that protein with experimental affinity data in the test set. The best design was determined by the ranking scheme suggested in the documentation: it is the design with the best predicted binding energy among the designs with the 10% top total scores.</p>
      </sec>
    </sec>
    <sec id="s4">
      <title>Supporting Information</title>
      <supplementary-material id="pone.0052505.s001" mimetype="application/pdf" xlink:href="info:doi/10.1371/journal.pone.0052505.s001" position="float" xlink:type="simple">
        <label>Information S1</label>
        <caption>
          <p>(PDF)</p>
        </caption>
      </supplementary-material>
    </sec>
  </body>
  <back>
    <ref-list>
      <title>References</title>
      <ref id="pone.0052505-ValleBlisle1">
        <label>1</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Vallée-Bélisle</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Plaxco</surname><given-names>KW</given-names></name> (<year>2010</year>) <article-title>Structure-switching biosensors: inspired by nature</article-title>. <source>Curr Opin Struct Biol</source> <volume>20</volume>: <fpage>518</fpage>–<lpage>526</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Benson1">
        <label>2</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Benson</surname><given-names>DE</given-names></name>, <name name-style="western"><surname>Wisz</surname><given-names>MS</given-names></name>, <name name-style="western"><surname>Hellinga</surname><given-names>HW</given-names></name> (<year>2000</year>) <article-title>Rational design of nascent metalloenzymes</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>97</volume>: <fpage>6292</fpage>–<lpage>6297</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Bolon1">
        <label>3</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Bolon</surname><given-names>DN</given-names></name>, <name name-style="western"><surname>Mayo</surname><given-names>SL</given-names></name> (<year>2001</year>) <article-title>Enzyme-like proteins by computational design</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>98</volume>: <fpage>14274</fpage>–<lpage>14279</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Rthlisberger1">
        <label>4</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Röthlisberger</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Khersonsky</surname><given-names>O</given-names></name>, <name name-style="western"><surname>Wollacott</surname><given-names>AM</given-names></name>, <name name-style="western"><surname>Jiang</surname><given-names>L</given-names></name>, <name name-style="western"><surname>DeChancie</surname><given-names>J</given-names></name>, <etal>et al</etal>. (<year>2008</year>) <article-title>Kemp elimination catalysts by computational enzyme design</article-title>. <source>Nature</source> <volume>453</volume>: <fpage>190</fpage>–<lpage>195</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Korendovych1">
        <label>5</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Korendovych</surname><given-names>IV</given-names></name>, <name name-style="western"><surname>Kulp</surname><given-names>DW</given-names></name>, <name name-style="western"><surname>Wu</surname><given-names>Y</given-names></name>, <name name-style="western"><surname>Cheng</surname><given-names>H</given-names></name>, <name name-style="western"><surname>Roder</surname><given-names>H</given-names></name>, <etal>et al</etal>. (<year>2011</year>) <article-title>Design of a switchable eliminase</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>108</volume>: <fpage>6823</fpage>–<lpage>7</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Siegel1">
        <label>6</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Siegel</surname><given-names>JB</given-names></name>, <name name-style="western"><surname>Zanghellini</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Lovick</surname><given-names>HM</given-names></name>, <name name-style="western"><surname>Kiss</surname><given-names>G</given-names></name>, <name name-style="western"><surname>Lambert</surname><given-names>AR</given-names></name>, <etal>et al</etal>. (<year>2010</year>) <article-title>Computational design of an enzyme catalyst for a stereoselective bimolecular diels-alder reaction</article-title>. <source>Science</source> <volume>329</volume>: <fpage>309</fpage>–<lpage>313</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Jiang1">
        <label>7</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Jiang</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Althoff</surname><given-names>EA</given-names></name>, <name name-style="western"><surname>Clemente</surname><given-names>FR</given-names></name>, <name name-style="western"><surname>Doyle</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Röthlisberger</surname><given-names>D</given-names></name>, <etal>et al</etal>. (<year>2008</year>) <article-title>De novo computational design of retro-aldol enzymes</article-title>. <source>Science</source> <volume>319</volume>: <fpage>1387</fpage>–<lpage>1391</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Khare1">
        <label>8</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Khare</surname><given-names>SD</given-names></name>, <name name-style="western"><surname>Kipnis</surname><given-names>Y</given-names></name>, <name name-style="western"><surname>Greisen</surname><given-names>PJ</given-names></name>, <name name-style="western"><surname>Takeuchi</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Ashani</surname><given-names>Y</given-names></name>, <etal>et al</etal>. (<year>2012</year>) <article-title>Computational redesign of a mononuclear zinc metalloenzyme for organophosphate hydrolysis</article-title>. <source>Nat Chem Biol</source> <volume>8</volume>: <fpage>294</fpage>–<lpage>300</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Murphy1">
        <label>9</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Murphy</surname><given-names>PM</given-names></name>, <name name-style="western"><surname>Bolduc</surname><given-names>JM</given-names></name>, <name name-style="western"><surname>Gallaher</surname><given-names>JL</given-names></name>, <name name-style="western"><surname>Stoddard</surname><given-names>BL</given-names></name>, <name name-style="western"><surname>Baker</surname><given-names>D</given-names></name> (<year>2009</year>) <article-title>Alteration of enzyme specificity by computational loop remodeling and design</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>106</volume>: <fpage>9215</fpage>–<lpage>9220</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Chen1">
        <label>10</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Chen</surname><given-names>CY</given-names></name>, <name name-style="western"><surname>Georgiev</surname><given-names>I</given-names></name>, <name name-style="western"><surname>Anderson</surname><given-names>AC</given-names></name>, <name name-style="western"><surname>Donald</surname><given-names>BR</given-names></name> (<year>2009</year>) <article-title>Computational structure-based redesign of enzyme activity</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>106</volume>: <fpage>3764</fpage>–<lpage>3769</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Frey1">
        <label>11</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Frey</surname><given-names>KM</given-names></name>, <name name-style="western"><surname>Georgiev</surname><given-names>I</given-names></name>, <name name-style="western"><surname>Donald</surname><given-names>BR</given-names></name>, <name name-style="western"><surname>Anderson</surname><given-names>AC</given-names></name> (<year>2010</year>) <article-title>Predicting resistance mutations using protein design algorithms</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>107</volume>: <fpage>13707</fpage>–<lpage>13712</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Schreier1">
        <label>12</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Schreier</surname><given-names>B</given-names></name>, <name name-style="western"><surname>Stumpp</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Wiesner</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Hocker</surname><given-names>B</given-names></name> (<year>2009</year>) <article-title>Computational design of ligand binding is not a solved problem</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>106</volume>: <fpage>18491</fpage>–<lpage>18496</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Baker1">
        <label>13</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Baker</surname><given-names>D</given-names></name> (<year>2010</year>) <article-title>An exciting but challenging road ahead for computational enzyme design</article-title>. <source>Protein Sci</source> <volume>19</volume>: <fpage>1817</fpage>–<lpage>1819</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Wang1">
        <label>14</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wang</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Althoff</surname><given-names>EA</given-names></name>, <name name-style="western"><surname>Bolduc</surname><given-names>J</given-names></name>, <name name-style="western"><surname>Jiang</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Moody</surname><given-names>J</given-names></name>, <etal>et al</etal>. (<year>2012</year>) <article-title>Structural analyses of covalent enzyme-substrate analog complexes reveal strengths and limitations of de novo enzyme design</article-title>. <source>J Mol Biol</source> <volume>415</volume>: <fpage>615</fpage>–<lpage>625</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Morin1">
        <label>15</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Morin</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Kaufmann</surname><given-names>KW</given-names></name>, <name name-style="western"><surname>Fortenberry</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Harp</surname><given-names>JM</given-names></name>, <name name-style="western"><surname>Mizoue</surname><given-names>LS</given-names></name>, <etal>et al</etal>. (<year>2011</year>) <article-title>Computational design of an endo-1,4-beta-xylanase ligand binding site</article-title>. <source>Protein Eng Des Sel</source> <volume>24</volume>: <fpage>503</fpage>–<lpage>516</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Morin2">
        <label>16</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Morin</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Meiler</surname><given-names>J</given-names></name>, <name name-style="western"><surname>Mizoue</surname><given-names>LS</given-names></name> (<year>2011</year>) <article-title>Computational design of protein-ligand interfaces: potential in therapeutic development</article-title>. <source>Trends Biotechnol</source> <volume>29</volume>: <fpage>159</fpage>–<lpage>66</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Plewczynski1">
        <label>17</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Plewczynski</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Łaźniewski</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Augustyniak</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Ginalski</surname><given-names>K</given-names></name> (<year>2011</year>) <article-title>Can we trust docking results? evaluation of seven commonly used programs on pdbbind database</article-title>. <source>J Comput Chem</source> <volume>32</volume>: <fpage>742</fpage>–<lpage>755</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Cole1">
        <label>18</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Cole</surname><given-names>JC</given-names></name>, <name name-style="western"><surname>Murray</surname><given-names>CW</given-names></name>, <name name-style="western"><surname>Nissink</surname><given-names>JWM</given-names></name>, <name name-style="western"><surname>Taylor</surname><given-names>RD</given-names></name>, <name name-style="western"><surname>Taylor</surname><given-names>R</given-names></name> (<year>2005</year>) <article-title>Comparing protein-ligand docking programs is difficult</article-title>. <source>Proteins</source> <volume>60</volume>: <fpage>325</fpage>–<lpage>32</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Zavodszky1">
        <label>19</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Zavodszky</surname><given-names>MI</given-names></name>, <name name-style="western"><surname>Rohatgi</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Van Voorst</surname><given-names>JR</given-names></name>, <name name-style="western"><surname>Yan</surname><given-names>H</given-names></name>, <name name-style="western"><surname>Kuhn</surname><given-names>LA</given-names></name> (<year>2009</year>) <article-title>Scoring ligand similarity in structure-based virtual screening</article-title>. <source>J Mol Recognit</source> <volume>22</volume>: <fpage>280</fpage>–<lpage>92</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Perola1">
        <label>20</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Perola</surname><given-names>E</given-names></name>, <name name-style="western"><surname>Walters</surname><given-names>WP</given-names></name>, <name name-style="western"><surname>Charifson</surname><given-names>PS</given-names></name> (<year>2004</year>) <article-title>A detailed comparison of current docking and scoring methods on systems of pharmaceutical relevance</article-title>. <source>Proteins</source> <volume>56</volume>: <fpage>235</fpage>–<lpage>49</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Moult1">
        <label>21</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Moult</surname><given-names>J</given-names></name>, <name name-style="western"><surname>Fidelis</surname><given-names>K</given-names></name>, <name name-style="western"><surname>Kryshtafovych</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Tramontano</surname><given-names>A</given-names></name> (<year>2011</year>) <article-title>Critical assessment of methods of protein structure prediction (casp) – round ix</article-title>. <source>Proteins</source> <volume>79</volume> Suppl 10: <fpage>1</fpage>–<lpage>5</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Boas1">
        <label>22</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Boas</surname><given-names>FE</given-names></name>, <name name-style="western"><surname>Harbury</surname><given-names>PB</given-names></name> (<year>2008</year>) <article-title>Design of protein-ligand binding based on the molecular-mechanics energy model</article-title>. <source>J Mol Biol</source> <volume>380</volume>: <fpage>415</fpage>–<lpage>424</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Zanghellini1">
        <label>23</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Zanghellini</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Jiang</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Wollacott</surname><given-names>AM</given-names></name>, <name name-style="western"><surname>Cheng</surname><given-names>G</given-names></name>, <name name-style="western"><surname>Meiler</surname><given-names>J</given-names></name>, <etal>et al</etal>. (<year>2006</year>) <article-title>New algorithms and an in silico benchmark for computational enzyme design</article-title>. <source>Protein Sci</source> <volume>15</volume>: <fpage>2785</fpage>–<lpage>94</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Malisi1">
        <label>24</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Malisi</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Kohlbacher</surname><given-names>O</given-names></name>, <name name-style="western"><surname>Höcker</surname><given-names>B</given-names></name> (<year>2009</year>) <article-title>Automated scaffold selection for enzyme design</article-title>. <source>Proteins</source> <volume>77</volume>: <fpage>74</fpage>–<lpage>83</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Shetty1">
        <label>25</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Shetty</surname><given-names>RP</given-names></name>, <name name-style="western"><surname>de Bakker</surname><given-names>PIW</given-names></name>, <name name-style="western"><surname>DePristo</surname><given-names>MA</given-names></name>, <name name-style="western"><surname>Blundell</surname><given-names>TL</given-names></name> (<year>2003</year>) <article-title>Advantages of fine-grained side chain conformer libraries</article-title>. <source>Protein Eng</source> <volume>16</volume>: <fpage>963</fpage>–<lpage>969</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Lassila1">
        <label>26</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Lassila</surname><given-names>JK</given-names></name>, <name name-style="western"><surname>Privett</surname><given-names>HK</given-names></name>, <name name-style="western"><surname>Allen</surname><given-names>BD</given-names></name>, <name name-style="western"><surname>Mayo</surname><given-names>SL</given-names></name> (<year>2006</year>) <article-title>Combinatorial methods for small-molecule placement in computational enzyme design</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>103</volume>: <fpage>16710</fpage>–<lpage>16715</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Xiang1">
        <label>27</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Xiang</surname><given-names>Z</given-names></name>, <name name-style="western"><surname>Honig</surname><given-names>B</given-names></name> (<year>2001</year>) <article-title>Extending the accuracy limits of prediction for side-chain conformations</article-title>. <source>J Mol Biol</source> <volume>311</volume>: <fpage>421</fpage>–<lpage>430</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Schumann1">
        <label>28</label>
        <mixed-citation publication-type="other" xlink:type="simple">Schumann M (2012). Caddsuite 1.0. URL <ext-link ext-link-type="uri" xlink:href="http://caddsuite.github.com/" xlink:type="simple">http://caddsuite.github.com/</ext-link>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Trott1">
        <label>29</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Trott</surname><given-names>O</given-names></name>, <name name-style="western"><surname>Olson</surname><given-names>AJ</given-names></name> (<year>2010</year>) <article-title>Autodock vina: improving the speed and accuracy of docking with a new scoring function, efficient optimization, and multithreading</article-title>. <source>J Comput Chem</source> <volume>31</volume>: <fpage>455</fpage>–<lpage>461</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Richter1">
        <label>30</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Richter</surname><given-names>F</given-names></name>, <name name-style="western"><surname>Leaver-Fay</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Khare</surname><given-names>SD</given-names></name>, <name name-style="western"><surname>Bjelic</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Baker</surname><given-names>D</given-names></name> (<year>2011</year>) <article-title>De novo enzyme design using rosetta3</article-title>. <source>PLoS One</source> <volume>6</volume>: <fpage>e19230</fpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Ponder1">
        <label>31</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Ponder</surname><given-names>JW</given-names></name>, <name name-style="western"><surname>Case</surname><given-names>DA</given-names></name> (<year>2003</year>) <article-title>Force fields for protein simulations</article-title>. <source>Adv Protein Chem</source> <volume>66</volume>: <fpage>27</fpage>–<lpage>85</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Kingsford1">
        <label>32</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kingsford</surname><given-names>CL</given-names></name>, <name name-style="western"><surname>Chazelle</surname><given-names>B</given-names></name>, <name name-style="western"><surname>Singh</surname><given-names>M</given-names></name> (<year>2005</year>) <article-title>Solving and analyzing side-chain positioning problems using linear and integer programming</article-title>. <source>Bioinformatics</source> <volume>21</volume>: <fpage>1028</fpage>–<lpage>1036</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Sontag1">
        <label>33</label>
        <mixed-citation publication-type="other" xlink:type="simple">Sontag D, Meltzer T, Globerson A, Weiss Y, Jaakkola T (2008) Tightening LP relaxations for MAP using message-passing. In: 24th Conference in Uncertainty in Artificial Intelligence. AUAI Press, 503–510.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Wang2">
        <label>34</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wang</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Fang</surname><given-names>X</given-names></name>, <name name-style="western"><surname>Lu</surname><given-names>Y</given-names></name>, <name name-style="western"><surname>Yang</surname><given-names>CY</given-names></name>, <name name-style="western"><surname>Wang</surname><given-names>S</given-names></name> (<year>2005</year>) <article-title>The pdbbind database: methodologies and updates</article-title>. <source>J Med Chem</source> <volume>48</volume>: <fpage>4111</fpage>–<lpage>4119</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Murzin1">
        <label>35</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Murzin</surname><given-names>AG</given-names></name>, <name name-style="western"><surname>Brenner</surname><given-names>SE</given-names></name>, <name name-style="western"><surname>Hubbard</surname><given-names>T</given-names></name>, <name name-style="western"><surname>Chothia</surname><given-names>C</given-names></name> (<year>1995</year>) <article-title>Scop: a structural classification of proteins database for the investigation of sequences and structures</article-title>. <source>J Mol Biol</source> <volume>247</volume>: <fpage>536</fpage>–<lpage>540</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Georgiev1">
        <label>36</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Georgiev</surname><given-names>I</given-names></name>, <name name-style="western"><surname>Keedy</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Richardson</surname><given-names>JS</given-names></name>, <name name-style="western"><surname>Richardson</surname><given-names>DC</given-names></name>, <name name-style="western"><surname>Donald</surname><given-names>BR</given-names></name> (<year>2008</year>) <article-title>Algorithm for backrub motions in protein design</article-title>. <source>Bioinformatics</source> <volume>24</volume>: <fpage>i196</fpage>–<lpage>204</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Smith1">
        <label>37</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Smith</surname><given-names>CA</given-names></name>, <name name-style="western"><surname>Kortemme</surname><given-names>T</given-names></name> (<year>2008</year>) <article-title>Backrub-like backbone simulation recapitulates natural protein conformational variability and improves mutant side-chain prediction</article-title>. <source>J Mol Biol</source> <volume>380</volume>: <fpage>742</fpage>–<lpage>56</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Kellogg1">
        <label>38</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kellogg</surname><given-names>EH</given-names></name>, <name name-style="western"><surname>Leaver-Fay</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Baker</surname><given-names>D</given-names></name> (<year>2011</year>) <article-title>Role of conformational sampling in computing mutation-induced changes in protein structure and stability</article-title>. <source>Proteins</source> <volume>79</volume>: <fpage>830</fpage>–<lpage>8</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Needleman1">
        <label>39</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Needleman</surname><given-names>SB</given-names></name>, <name name-style="western"><surname>Wunsch</surname><given-names>CD</given-names></name> (<year>1970</year>) <article-title>A general method applicable to the search for similarities in the amino acid sequence of two proteins</article-title>. <source>J Mol Biol</source> <volume>48</volume>: <fpage>443</fpage>–<lpage>453</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Rice1">
        <label>40</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rice</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Longden</surname><given-names>I</given-names></name>, <name name-style="western"><surname>Bleasby</surname><given-names>A</given-names></name> (<year>2000</year>) <article-title>Emboss: the european molecular biology open software suite</article-title>. <source>Trends Genet</source> <volume>16</volume>: <fpage>276</fpage>–<lpage>277</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Hildebrandt1">
        <label>41</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Hildebrandt</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Dehof</surname><given-names>AK</given-names></name>, <name name-style="western"><surname>Rurainski</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Bertsch</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Schumann</surname><given-names>M</given-names></name>, <etal>et al</etal>. (<year>2010</year>) <article-title>Ball–biochemical algorithms library 1.3</article-title>. <source>BMC Bioinformatics</source> <volume>11</volume>: <fpage>531</fpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-OBoyle1">
        <label>42</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>O'Boyle</surname><given-names>NM</given-names></name>, <name name-style="western"><surname>Banck</surname><given-names>M</given-names></name>, <name name-style="western"><surname>James</surname><given-names>CA</given-names></name>, <name name-style="western"><surname>Morley</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Vandermeersch</surname><given-names>T</given-names></name>, <etal>et al</etal>. (<year>2011</year>) <article-title>Open babel: An open chemical toolbox</article-title>. <source>J Cheminform</source> <volume>3</volume>: <fpage>33</fpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Word1">
        <label>43</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Word</surname><given-names>JM</given-names></name>, <name name-style="western"><surname>Lovell</surname><given-names>SC</given-names></name>, <name name-style="western"><surname>Richardson</surname><given-names>JS</given-names></name>, <name name-style="western"><surname>Richardson</surname><given-names>DC</given-names></name> (<year>1999</year>) <article-title>Asparagine and glutamine: using hydrogen atom contacts in the choice of side-chain amide orientation</article-title>. <source>J Mol Biol</source> <volume>285</volume>: <fpage>1735</fpage>–<lpage>1747</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Word2">
        <label>44</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Word</surname><given-names>JM</given-names></name>, <name name-style="western"><surname>Lovell</surname><given-names>SC</given-names></name>, <name name-style="western"><surname>LaBean</surname><given-names>TH</given-names></name>, <name name-style="western"><surname>Taylor</surname><given-names>HC</given-names></name>, <name name-style="western"><surname>Zalis</surname><given-names>ME</given-names></name>, <etal>et al</etal>. (<year>1999</year>) <article-title>Visualizing and quantifying molecular goodness-of-fit: small-probe contact dots with explicit hydrogen atoms</article-title>. <source>J Mol Biol</source> <volume>285</volume>: <fpage>1711</fpage>–<lpage>1733</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Hawkins1">
        <label>45</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Hawkins</surname><given-names>PCD</given-names></name>, <name name-style="western"><surname>Skillman</surname><given-names>AG</given-names></name>, <name name-style="western"><surname>Warren</surname><given-names>GL</given-names></name>, <name name-style="western"><surname>Ellingson</surname><given-names>BA</given-names></name>, <name name-style="western"><surname>Stahl</surname><given-names>MT</given-names></name> (<year>2010</year>) <article-title>Conformer generation with omega: algorithm and validation using high quality structures from the protein databank and cambridge structural database</article-title>. <source>J Chem Inf Model</source> <volume>50</volume>: <fpage>572</fpage>–<lpage>584</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0052505-Pettersen1">
        <label>46</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Pettersen</surname><given-names>EF</given-names></name>, <name name-style="western"><surname>Goddard</surname><given-names>TD</given-names></name>, <name name-style="western"><surname>Huang</surname><given-names>CC</given-names></name>, <name name-style="western"><surname>Couch</surname><given-names>GS</given-names></name>, <name name-style="western"><surname>Greenblatt</surname><given-names>DM</given-names></name>, <etal>et al</etal>. (<year>2004</year>) <article-title>Ucsf chimera–a visualization system for exploratory research and analysis</article-title>. <source>J Comput Chem</source> <volume>25</volume>: <fpage>1605</fpage>–<lpage>1612</lpage>.</mixed-citation>
      </ref>
    </ref-list>
  </back>
</article>