<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article
  PUBLIC "-//NLM//DTD Journal Publishing DTD v3.0 20080202//EN" "http://dtd.nlm.nih.gov/publishing/3.0/journalpublishing3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="3.0" xml:lang="EN"><front><journal-meta><journal-id journal-id-type="publisher-id">plos</journal-id><journal-id journal-id-type="publisher">pcbi</journal-id><journal-id journal-id-type="allenpress-id">plcb</journal-id><journal-id journal-id-type="nlm-ta">PLoS Comput Biol</journal-id><journal-id journal-id-type="pmc">ploscomp</journal-id><!--===== Grouping journal title elements =====--><journal-title-group><journal-title>PLoS Computational Biology</journal-title></journal-title-group><issn pub-type="ppub">1553-734X</issn><issn pub-type="epub">1553-7358</issn><publisher><publisher-name>Public Library of Science</publisher-name><publisher-loc>San Francisco, USA</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.1371/journal.pcbi.0030182</article-id><article-id pub-id-type="publisher-id">07-PLCB-RA-0166R2</article-id><article-id pub-id-type="sici">plcb-03-09-13</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="Discipline"><subject>Computational Biology</subject></subj-group><subj-group subj-group-type="System Taxonomy"><subject>Saccharomyces</subject></subj-group></article-categories><title-group><article-title>Structure-Templated Predictions of Novel Protein Interactions from Sequence Information</article-title><alt-title alt-title-type="running-head">Protein Interaction Prediction</alt-title></title-group><contrib-group><contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Betel</surname><given-names>Doron</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="aff" rid="aff2"><sup>2</sup></xref><xref ref-type="fn" rid="n103"><sup>¤</sup></xref><xref ref-type="corresp" rid="cor1"><sup>*</sup></xref></contrib><contrib 
contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Breitkreuz</surname><given-names>Kevin E</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib><contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Isserlin</surname><given-names>Ruth</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="aff" rid="aff2"><sup>2</sup></xref></contrib><contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Dewar-Darch</surname><given-names>Danielle</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib><contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Tyers</surname><given-names>Mike</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="aff" rid="aff3"><sup>3</sup></xref></contrib><contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Hogue</surname><given-names>Christopher W. V</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref></contrib></contrib-group><aff id="aff1">
				<label>1</label><addr-line> Samuel Lunenfeld Research Institute, Mt. Sinai Hospital, Toronto, Ontario, Canada
			</addr-line></aff><aff id="aff2">
				<label>2</label><addr-line> Department of Biochemistry, University of Toronto, Toronto, Ontario, Canada
			</addr-line></aff><aff id="aff3">
				<label>3</label><addr-line> Department of Medical Genetics and Microbiology, University of Toronto, Toronto, Ontario, Canada
			</addr-line></aff><contrib-group><contrib contrib-type="editor" xlink:type="simple"><name name-style="western"><surname>Lai</surname><given-names>Luhua</given-names></name><role>Editor</role><xref ref-type="aff" rid="edit1"/></contrib></contrib-group><aff id="edit1">Peking University, China</aff><author-notes><fn fn-type="con" id="ack1"><p>DB and MT conceived and designed the experiments and wrote the paper. KEB and DDD performed the experiments. DB and RI analyzed the data. RI contributed reagents/materials/analysis tools. DB conceived and designed the project, and performed the computational work. MT and CWVH directed the study.</p></fn><fn fn-type="current-aff" id="n103"><p>¤ Current address: Computational and Systems Biology Center, Memorial Sloan-Kettering Cancer Center, New York, New York, United States of America</p></fn><corresp id="cor1">* To whom correspondence should be addressed. E-mail: <email xlink:type="simple">betel@cbio.mskcc.org</email></corresp><fn fn-type="conflict" id="ack3"><p> The authors have declared that no competing interests exist.</p></fn></author-notes><pub-date pub-type="ppub"><month>9</month><year>2007</year></pub-date><pub-date pub-type="epub"><day>21</day><month>9</month><year>2007</year></pub-date><volume>3</volume><issue>9</issue><elocation-id>e182</elocation-id><history><date date-type="received"><day>4</day><month>4</month><year>2007</year></date><date date-type="accepted"><day>2</day><month>8</month><year>2007</year></date></history><!--===== Grouping copyright info into permissions =====--><permissions><copyright-year>2007</copyright-year><copyright-holder>Betel et al</copyright-holder><license><license-p>This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p></license></permissions><abstract><p>The multitude of functions performed in 
the cell are largely controlled by a set of carefully orchestrated protein interactions often facilitated by specific binding of conserved domains in the interacting proteins. Interacting domains commonly exhibit distinct binding specificity to short and conserved recognition peptides called binding profiles. Although many conserved domains are known in nature, only a few have well-characterized binding profiles. Here, we describe a novel predictive method known as domain–motif interactions from structural topology (D-MIST) for elucidating the binding profiles of interacting domains. A set of domains and their corresponding binding profiles were derived from extant protein structures and protein interaction data and then used to predict novel protein interactions in yeast. A number of the predicted interactions were verified experimentally, including new interactions of the mitotic exit network, RNA polymerases, nucleotide metabolism enzymes, and the chaperone complex. These results demonstrate that new protein interactions can be predicted exclusively from sequence information.</p></abstract><abstract abstract-type="summary"><title>Author Summary</title><sec id="st1"><title/><p>Many functions performed within a living cell are mediated by specific interactions between proteins. Precise geometric and chemical matches between segments of the protein structures facilitate those interactions. Such binding surfaces are often evolutionarily conserved elements of protein structures known as conserved domains that recognize specific binding elements on the interacting proteins. Binding domains and their corresponding interacting profiles constitute basic interacting modules that are replicated in multiple protein pairs, where they mediate similar interactions. Although many conserved domains are identified, only a handful have known, well-characterized binding elements. 
This paper describes a computational method that aims to elucidate the binding specificity of many domains. The utility of the derived binding specificity is demonstrated by predicting new interactions between yeast proteins. The predictions are based solely on sequence information by identifying the conserved domains and their corresponding binding sequences. A number of the predicted interactions were confirmed experimentally, demonstrating the feasibility of this approach.</p></sec></abstract><funding-group><funding-statement>DB was supported by Ontario Graduate Scholarship, and KB was supported by a Canadian Institute of Health Research (CIHR) Training Grant. MT's research is supported by CIHR and Genome Canada; MT holds a Canada Research Chair in Bioinformatics and Functional Genomics. CWVH's research is funded by the Ontario R&amp;D Challenge Fund and by Genome Canada through the Ontario Genomics Institute.</funding-statement></funding-group><counts><page-count count="7"/></counts><!--===== Restructure custom-meta-wrap to custom-meta-group =====--><custom-meta-group><custom-meta><meta-name>citation</meta-name><meta-value>Betel D, Breitkreuz KE, Isserlin R, Dewar-Darch D, Tyers M, et al. (2007) Structure-templated predictions of novel protein interactions from sequence information. PLoS Comput Biol 3(9): e182. doi:<ext-link ext-link-type="doi" xlink:href="http://dx.doi.org/10.1371/journal.pcbi.0030182" xlink:type="simple">10.1371/journal.pcbi.0030182</ext-link></meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec id="s1"><title>Introduction</title><p>The interaction between two proteins is a geometric and electrostatic match between two polypeptide surfaces that results in a stable set of bonds between amino acid side chains or backbone atoms. The interacting amino acids are often part of conserved sequence features such as domains or short linear motifs that constitute the interaction site between the two proteins. 
Despite the increased coverage and sensitivity of experimental techniques for detecting protein interactions [<xref ref-type="bibr" rid="pcbi-0030182-b001">1</xref>–<xref ref-type="bibr" rid="pcbi-0030182-b006">6</xref>] (reviewed in [<xref ref-type="bibr" rid="pcbi-0030182-b007">7</xref>]), elucidating the precise interacting residues remains experimentally difficult. In most cases, all that is known about an interaction is the identity of the two interacting proteins, with little information about the underlying binding site. However, detailed knowledge of interaction specificity is important for understanding reaction mechanism, interaction prediction, and drug development.</p><p>Interacting domains are autonomous structural elements that exhibit distinct binding specificity to a multitude of target polypeptides. Such domains act as independent elements that can be “plugged” into a new protein and thereby introduce new functionality to the emerging protein [<xref ref-type="bibr" rid="pcbi-0030182-b008">8</xref>]. From an evolutionary perspective, such rearrangements and the multiplication of existing conserved domains is a likely mechanism by which organisms generate new proteins, pathways, and novel functionalities [<xref ref-type="bibr" rid="pcbi-0030182-b009">9</xref>,<xref ref-type="bibr" rid="pcbi-0030182-b010">10</xref>]. Several protein interaction prediction methods exploit the conservation of protein-binding interfaces by identifying domain pairs that consistently co-occur in interacting proteins or coevolve, which are then used to predict new interactions [<xref ref-type="bibr" rid="pcbi-0030182-b011">11</xref>–<xref ref-type="bibr" rid="pcbi-0030182-b016">16</xref>]. Structure-based prediction methods use known protein complexes to model interactions between proteins that are homologous to the complex components [<xref ref-type="bibr" rid="pcbi-0030182-b017">17</xref>,<xref ref-type="bibr" rid="pcbi-0030182-b018">18</xref>]. 
Other prediction methods use integrative approaches that incorporate interaction experiments with additional functional information such as correlated expression level, common functional annotation [<xref ref-type="bibr" rid="pcbi-0030182-b019">19</xref>,<xref ref-type="bibr" rid="pcbi-0030182-b020">20</xref>], and cross-species comparisons [<xref ref-type="bibr" rid="pcbi-0030182-b021">21</xref>]. Alternative approaches attempt to identify correlated sequence motifs that represent generic interacting sequence elements that may or may not be components of conserved domains [<xref ref-type="bibr" rid="pcbi-0030182-b022">22</xref>–<xref ref-type="bibr" rid="pcbi-0030182-b025">25</xref>]. In a few limited cases, detailed experimental data are used to generate high-resolution definition of domain binding profiles; however, such information is available only for a small number of domains [<xref ref-type="bibr" rid="pcbi-0030182-b026">26</xref>,<xref ref-type="bibr" rid="pcbi-0030182-b027">27</xref>].</p><p>Our primary objective is to predict interaction between proteins strictly from sequence information. Our approach is based on identifying the binding specificity of interacting domains that can then be used to predict new interactions. Here, we use existing physical interaction data to derive sequence profiles of the binding sequences that are presumed to determine the binding specificity of interacting domains. Our method, called domain–motif interactions from structural topology (D-MIST), is based on a two-step approach. First, potential domain-binding motifs are extracted from structural data. Second, these motifs are converted to sequence profiles in the form of position-specific scoring matrices (PSSMs). These PSSMs are derived using a subset of experimentally determined binary interactions that contain the domain of interest (<xref ref-type="fig" rid="pcbi-0030182-g001">Figure 1</xref>). 
Gibbs sampling, seeded with the motif extracted from structural data, is used to generate a PSSM from similar sequences that occur in a subset of established interacting proteins. We used the domain-binding profiles to predict protein interactions in yeast. The predictions were compared to a hidden set of known interactions reported in the literature, and several predicted interactions were confirmed directly by in vivo coprecipitation experiments.</p><fig id="pcbi-0030182-g001" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.0030182.g001</object-id><label>Figure 1</label><caption><title>Outline of D-MIST Method for Predicting Protein Interactions by Learned Binding Profiles</title><p>Identification of domain-binding profiles begins by extracting the short sequence motifs from structural complexes that contain the domain of interest.</p><p>(A) In this example, RhoGAP-interacting motifs are extracted from two structural complexes (PDB ID 1AM4, 1TX4) where RhoGAP is bound to small G proteins.</p><p>(B) Protein interactions containing the RhoGAP domain were collected from four databases to form the learning set for the Gibbs sampling to generate the binding profiles (shown here as sequence logos [<xref ref-type="bibr" rid="pcbi-0030182-b057">57</xref>]). The sampling step is biased towards motifs that are similar to those found in the structural dataset.</p><p>(C) The resulting PSSMs are used to predict interactions for proteins with RhoGAP domains, such as the human ARHGAP1. 
A subset of the predicted interactions is subsequently tested by two experimental methods.</p></caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0030182.g001" xlink:type="simple"/></fig></sec><sec id="s2"><title>Results</title><p>The library of 3-D structures of protein complexes contains a detailed description of the binding interfaces between interacting proteins that include atom contacts and residue side-chain interactions [<xref ref-type="bibr" rid="pcbi-0030182-b028">28</xref>]. Using more than 10,000 structural complexes, we identified the domains in the binding sites and extracted their associated sequence motifs on the opposing chain. Interacting residues were defined as two residues on opposite polypeptide chains separated by a maximum of 5 Å (<xref ref-type="fig" rid="pcbi-0030182-g001">Figure 1</xref>A). On average, each domain had two spatially separated interacting sequence motifs per interaction. Most domains were present in multiple 3-D structures in a variety of conformations, resulting in varied interacting sequence motifs with different levels of similarities.</p><p>The binding specificity of a domain is determined by a combination of physiochemical properties and structural constraints at the binding site that can be satisfied by multiple variations of the consensus sequence motif [<xref ref-type="bibr" rid="pcbi-0030182-b029">29</xref>]. The interacting sequence motifs extracted from the protein structures represent a first approximation of the binding specificity of the interacting domains, but do not represent the full evolutionary variations of the residue–residue interactions available in one binding topology. A more informative representation of the possible motif variations is a sequence profile in the form of a PSSM that captures the compositional variance by assigning probabilities to each amino acid at each position. 
These sequence variations of the binding profiles can be learned from proteins that are known to interact through the same domain.</p><p>We collected a set of 87,894 nonredundant protein interactions from four databases containing binary protein interactions from multiple species. Interactions derived from structural studies were excluded to preclude self-identification, as were interactions from high-throughput protein complex identification experiments [<xref ref-type="bibr" rid="pcbi-0030182-b030">30</xref>,<xref ref-type="bibr" rid="pcbi-0030182-b031">31</xref>] (see <xref ref-type="sec" rid="s4">Methods</xref>). Gibbs sampling [<xref ref-type="bibr" rid="pcbi-0030182-b032">32</xref>] was used to learn the PSSM binding profiles for a specific domain by sampling positions in the set of proteins that interact with proteins that contain the domain of interest. The majority of the proteins in the learning set are assumed to interact through the common domain, and the generated PSSM will represent its binding profile (<xref ref-type="fig" rid="pcbi-0030182-g001">Figure 1</xref>B). Gibbs sampling enables the incorporation of prior knowledge about the length and composition of the binding profiles. The motifs identified in the 3-D structural analysis were used as prior knowledge in seeding the profile detection step to bias the sampling towards similar sequence regions. The result is a set of sequence PSSMs that represent the binding profiles of the interacting domains (<xref ref-type="supplementary-material" rid="pcbi-0030182-se001">Text S1</xref>).</p><p>The learned PSSMs were used to predict interactions for 703 yeast proteins with domains for which we successfully derived binding profiles. A physical interaction was predicted between proteins containing interacting domains and proteins with one or more of the interacting profiles associated with those domains (<xref ref-type="fig" rid="pcbi-0030182-g001">Figure 1</xref>C). 
A total of 18,459 interactions were predicted between 2,313 proteins (<xref ref-type="supplementary-material" rid="pcbi-0030182-sd001">Dataset S1</xref>). We compared the predicted interactions to a comprehensive list of physical and genetic yeast interactions extracted from the literature [<xref ref-type="bibr" rid="pcbi-0030182-b033">33</xref>] and found that 609 predicted interactions have reported experimental evidence (∼3%; <italic>p =</italic> 1.0 × 10<sup>−13</sup>; <xref ref-type="supplementary-material" rid="pcbi-0030182-sg001">Figure S1</xref>). We note that 591 predicted interactions were found in both the 87,894 set of interactions used for the PSSM derivation and in the set of yeast literature curated interactions (∼32,000). However, none of the 609 predicted interactions that have supporting evidence in the literature overlap with those common 591 interactions. We did not incorporate additional experimental information such as cellular localization, functional annotation, surface accessibility, or gene expression data that would likely improve our prediction accuracy given that our primary goal was to predict novel interactions exclusively from sequence information.</p><p>Experimental verification of a subset of the predicted interactions was performed by a one-step immunoaffinity purification of one of the two interaction partners, followed by mass spectrometric identification of associated proteins (IP-MS) as previously described [<xref ref-type="bibr" rid="pcbi-0030182-b031">31</xref>]. The IP-MS method confirmed 37 predicted interactions, including 23 novel interactions (<xref ref-type="fig" rid="pcbi-0030182-g002">Figure 2</xref>). As a second means to experimentally verify our predictions, we immunoprecipitated one protein in the interacting pair, followed by antibody detection of the second protein (IP-western), also as described in [<xref ref-type="bibr" rid="pcbi-0030182-b031">31</xref>]. 
The IP-western method reaffirmed five of the interactions confirmed by IP-MS (yellow edges; <xref ref-type="fig" rid="pcbi-0030182-g003">Figure 3</xref>) and identified an additional four novel interactions (green edges; <xref ref-type="fig" rid="pcbi-0030182-g003">Figure 3</xref>). We note that six interactions confirmed by the IP-MS approach were not detected by IP-western (red dashed edges; <xref ref-type="fig" rid="pcbi-0030182-g003">Figure 3</xref>); this discrepancy may be due either to nonspecific interactions detected by IP-MS or to interference of the second epitope tag with some interactions and/or expression levels in vivo. Of the 18 predictions that were tested by IP-western, nine novel interactions were confirmed, and a total of 30 new interactions were identified by both the IP-MS and IP-western methods.</p><fig id="pcbi-0030182-g002" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.0030182.g002</object-id><label>Figure 2</label><caption><title>Predicted Interactions Verified by IP-MS</title><p>Immunoaffinity purification of bait protein complexes followed by mass spectrometry identification of associated proteins confirmed 37 predicted interactions. Predictions between proteins that were both co-purified with the tagged bait protein (i.e., both proteins were prey) were not considered validated. Proteins are coloured according to their Gene Ontology biological process annotation.</p></caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0030182.g002" xlink:type="simple"/></fig><fig id="pcbi-0030182-g003" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.0030182.g003</object-id><label>Figure 3</label><caption><title>Predicted Interactions Confirmed by Experiments or by Previously Published Results in the Primary Literature</title><p>Interactions are coloured according to their verification source. 
Dashed red lines are predictions that were confirmed by IP-MS but not confirmed by IP-western; dashed green lines are predictions that failed experimental validation by IP-western.</p></caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0030182.g003" xlink:type="simple"/></fig><sec id="s2a"><title>Experimentally Confirmed Predictions</title><p>Among the experimentally confirmed predictions were interactions between the five components of the PRS complex, which together compose the 5-phosphoribosyl-1(a)-pyrophosphate synthetase enzyme (EC number 2.7.6.1). This complex is a key component in the production of the precursors for purine, pyrimidine, and pyridine nucleotides [<xref ref-type="bibr" rid="pcbi-0030182-b034">34</xref>]. An additional interaction was confirmed between the alcohol dehydrogenase (NADP<sup>+</sup>) Adh7 and Prs5, the latter being a member of the PRS complex. This result suggests a possible direct link between NADP/NADPH balance, which is controlled by Adh7 [<xref ref-type="bibr" rid="pcbi-0030182-b035">35</xref>], and the biosynthesis of the purine and pyrimidine precursors. A predicted interaction between the histone H2A protein Hta1 and God1, a component of the SWR-C protein complex that incorporates Htz1 into the chromatin, was also confirmed. Chromatin remodelling by the exchange of Hta1 with Htz1 is thought to induce chromatin restructuring that favours gene transcription, RNA polymerase II recruitment, and gene expression induction near silent heterochromatin [<xref ref-type="bibr" rid="pcbi-0030182-b036">36</xref>]. Another confirmed interaction is between a member of the HSP40 family (Apj1) and two HSP70 proteins (Ssa1, Ssa2). HSP40 family members form complexes with HSP70 chaperone proteins, which facilitate the folding of specific proteins at various cellular locations [<xref ref-type="bibr" rid="pcbi-0030182-b037">37</xref>]. 
We also identified new interactions between the RNA polymerase II subunit Rpb2 and Rpb10, which is a common subunit of all three RNA polymerases [<xref ref-type="bibr" rid="pcbi-0030182-b038">38</xref>]. An additional interaction was demonstrated between Rpc40, a known shared subunit of RNA polymerases I and III, and Rpb2, an exclusive component of RNA polymerase II. It is possible that some of these interactions are bridged or stabilized by other RNA polymerase subunits [<xref ref-type="bibr" rid="pcbi-0030182-b039">39</xref>].</p><p>One might argue that the above successful predictions could be easily predicted from the orthology of the interacting proteins to the structural complexes used, such as the interactions between members of the PRS complex. We therefore tested several nonobvious predicted interactions that cannot be easily inferred from structural or sequence homology to other interacting pairs. The critical downstream effector of the mitotic exit network is the phosphatase Cdc14, which activates Clb degradation and Sic1 accumulation by dephosphorylation of key substrates [<xref ref-type="bibr" rid="pcbi-0030182-b040">40</xref>]. We confirmed an unexpected predicted interaction between Cdc14 and the protein kinase Cbk1, which functions in a parallel pathway (called RAM [regulation of Ace2p activity and cellular morphogenesis]) at the end of mitosis to facilitate cytokinesis and mother–daughter abscission [<xref ref-type="bibr" rid="pcbi-0030182-b041">41</xref>]. The Cdc14–Cbk1 interaction suggests that the activity of the mitotic exit network and RAM pathways may be coordinated via Cdc14-mediated dephosphorylation of RAM components and/or Cbk1-mediated phosphorylation of mitotic exit network components [<xref ref-type="bibr" rid="pcbi-0030182-b042">42</xref>]. 
Other nonobvious interactions between known components of clathrin-associated (AP-1) complex Apm1 and Apl2, as well as between components of the RNA splicing complex Smd2 and Lsm2, were detected by the IP-MS experiments but not by IP-western under the conditions used. Given the strength of the D-MIST predictions for these latter interactions, further investigation using more sensitive reagents seems warranted. These confirmed predictions of nonobvious interactions illustrate the potential of the D-MIST approach to generate new biological hypotheses.</p></sec></sec><sec id="s3"><title>Discussion</title><p>As noted previously, we excluded additional experimental evidence, such as localization and expression data from our prediction method. Although additional experimental information and functional annotation would likely improve prediction accuracy, it may also limit predictions only to those proteins with prior experimental or functional information. In addition, the use of functional annotation such as Gene Ontology terms (assigned by human experts or predicted computationally) in a prediction method will penalize predicted interactions between proteins with unrelated functions. Therefore, it restricts the ability to predict interactions between apparently unrelated proteins that could illuminate new cellular functions [<xref ref-type="bibr" rid="pcbi-0030182-b043">43</xref>].</p><p>The D-MIST method for identifying domain-binding modules is currently limited in a number of ways. The first limitation is the availability of detailed binding information, as attained primarily through structural studies and peptide-based approaches such as phage display [<xref ref-type="bibr" rid="pcbi-0030182-b044">44</xref>] and random peptide libraries [<xref ref-type="bibr" rid="pcbi-0030182-b045">45</xref>]. 
In addition, several studies have concluded that the repertoire of protein structures in the Protein Data Bank is significantly biased in that <italic>trans</italic>-membrane and disordered domains are underrepresented due to limitations in structure determination [<xref ref-type="bibr" rid="pcbi-0030182-b046">46</xref>,<xref ref-type="bibr" rid="pcbi-0030182-b047">47</xref>]. Consequently, D-MIST analysis that depends on structural representation of protein interactions is similarly biased. The existing detailed examples of interactions are therefore sparse and noncomprehensive, with only a small subset of all possible domains represented. The second limitation is that the derived motifs do not represent the entire repertoire of all possible domain-binding sequences, even for those domains where structural data exist. The third limitation arises from the statistical framework of the Gibbs sampling method that requires a sufficient number of proteins to sample from in order to converge towards a meaningful PSSM. We restricted the analysis to domains with five or more putative interactors, thereby excluding domains that are infrequently found in our set of protein interactions. Fourth, some domains are not amenable to this type of analysis due to the diverse nature of their binding motifs that lack sequence conservation [<xref ref-type="bibr" rid="pcbi-0030182-b029">29</xref>]. Last, many interactions are governed by posttranslational modifications or precise physiological states, which may also hamper the accuracy of D-MIST predictions. Despite the above limitations, we have shown that novel protein interactions can be predicted strictly from primary sequence information. D-MIST not only predicts interactions between proteins but also provides sequence level predictions about the binding sites that can be verified experimentally. 
Predicting protein interactions without the need for additional information or prior experiments is particularly valuable when studying uncharacterized proteins and for predicting interactions in poorly studied organisms where typically only sequence information and predicted open reading frames are available. The sole dependence on sequence information allows for interaction prediction in other organisms without further modifications to the method or input datasets. With the advent of structural genomics initiatives [<xref ref-type="bibr" rid="pcbi-0030182-b048">48</xref>], the power of the D-MIST approach will certainly increase.</p></sec><sec id="s4"><title>Methods</title><sec id="s4a"><title>Extracting motifs.</title><p>The domain-binding motifs were extracted from BIND protein interaction records that were generated from 10,064 structures [<xref ref-type="bibr" rid="pcbi-0030182-b028">28</xref>]. Interactions were filtered for crystal-packing artifacts using the PQS server [<xref ref-type="bibr" rid="pcbi-0030182-b049">49</xref>], and all the interactions are available as a subset of the BIND database. Domain annotation was assigned to the protein structures using our in-house adaptation of CDD [<xref ref-type="bibr" rid="pcbi-0030182-b050">50</xref>] with an e-value cutoff of 10 × 10<sup>−6</sup> and then converted to InterPro identifiers [<xref ref-type="bibr" rid="pcbi-0030182-b051">51</xref>]. Binding motifs are defined as polypeptide segments of five residues or longer in which the amino acid side chains are &lt;5 Å from the interacting domain's side chains on the opposing protein. Two motif residues that are in direct contact with the interacting domain can be separated by a maximum of two noncontacting residues. 
For example, the first motifs in <xref ref-type="fig" rid="pcbi-0030182-g001">Figure 1</xref>A contain a tyrosine and an arginine that are within 5 Å from the side chains of the RhoGAP domain separated by a distal residue, marked by X, that is not within contact range with the RhoGAP domain.</p></sec><sec id="s4b"><title>Learning the binding modules.</title><p>A total of 87,894 nonredundant protein interactions were collected from 204 species from four database sources: BIND [<xref ref-type="bibr" rid="pcbi-0030182-b052">52</xref>], DIP [<xref ref-type="bibr" rid="pcbi-0030182-b053">53</xref>], Mint [<xref ref-type="bibr" rid="pcbi-0030182-b054">54</xref>], and IntAct [<xref ref-type="bibr" rid="pcbi-0030182-b055">55</xref>]. We excluded all interactions that were derived from 3-D studies, high-throughput protein complex identification studies [<xref ref-type="bibr" rid="pcbi-0030182-b030">30</xref>,<xref ref-type="bibr" rid="pcbi-0030182-b031">31</xref>], or interactions inferred from synthetic lethal experiments. The interactions were indexed in a relational database by domain annotation such that a single query can provide the full list of proteins that interact with a domain of interest (<xref ref-type="fig" rid="pcbi-0030182-g001">Figure 1</xref>B). We used Gibbs sampling [<xref ref-type="bibr" rid="pcbi-0030182-b032">32</xref>] seeded with sequence motifs identified in the structural studies to compute a PSSM using the subset of pairwise protein interactions that contain the domain to which the motif was bound in the 3-D structure. The length of the structural motifs was used to approximate the length of the PSSMs. The frequency of residue <italic>j</italic> at position <italic>i</italic> in the PSSM (the <italic>i,j</italic> entry in the matrix) is computed as follows:
					<disp-formula id="pcbi-0030182-e001"><graphic mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.0030182.e001" xlink:type="simple"/><!-- <mml:math display='block'><mml:mrow><mml:msub><mml:mi>q</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mo>,</mml:mo><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>&equals;</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mi>c</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mo>,</mml:mo><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>&plus;</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:mi>N</mml:mi><mml:mo>&plus;</mml:mo><mml:mi>B</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:math> --></disp-formula>where <italic>c<sub>i,j</sub></italic> is the observed count of residue <italic>j</italic> at position <italic>i</italic> in the sampled proteins, <italic>b<sub>j</sub></italic> is the pseudocount for residue <italic>j</italic>, <italic>N</italic> is the number of sequences sampled, and <italic>B</italic> is the total number of pseudocounts for all residues. By increasing the pseudocount term (<italic>b<sub>j</sub></italic>) for specific positions in the PSSM, the sampling algorithm is biased to favour positions where the residue at position <italic>i</italic> in the sampled protein is similar to the residue at position <italic>i</italic> of the structural motif. We set the pseudocounts to equal 62% of the residue counts in the sampled proteins.
				</p></sec><sec id="s4c"><title>Predicting new interactions.</title><p>Two proteins were predicted to interact if one protein had a domain and a second protein matched one or more of the binding profiles for that domain (<xref ref-type="fig" rid="pcbi-0030182-g001">Figure 1</xref>C). We attempted to predict interactions between all yeast proteins by searching for domain-binding profiles as described in [<xref ref-type="bibr" rid="pcbi-0030182-b056">56</xref>] using PSSMs with a score cutoff &gt;10.0 (as scored by the Gibbs sampler) and a cutoff &gt;0.20 for the match between the PSSM and the protein. Potential interactors among the yeast proteome were identified for 703 domain-containing proteins with derived binding profiles. In total, 18,459 interactions were predicted between 2,313 proteins based on the presence of a domain and its binding profile in the interacting pair.</p></sec><sec id="s4d"><title>Experimental verification.</title><p>Recombination-based cloning, culture growth, and protein complex isolation were performed essentially as described [<xref ref-type="bibr" rid="pcbi-0030182-b031">31</xref>] with minor modifications. Each uncharacterized open reading frame was tagged at the 3′-end with the FLAG-tag epitope using the Gateway recombination-based cloning system (Invitrogen, <ext-link ext-link-type="uri" xlink:href="http://www.invitrogen.com" xlink:type="simple">http://www.invitrogen.com</ext-link>). Bait complexes were immunopurified on anti-FLAG M2 antibody resin, resolved by denaturing gel electrophoresis, and visualized by colloidal Coomassie stain. Protein identification by automated liquid chromatography tandem mass spectrometry on a Finnigan LCQ DECA ion trap (Thermo Finnigan, <ext-link ext-link-type="uri" xlink:href="http://www.thermo.com" xlink:type="simple">http://www.thermo.com</ext-link>) mass spectrometer was as described previously [<xref ref-type="bibr" rid="pcbi-0030182-b031">31</xref>]. 
Predicted protein interactions were also confirmed by IP-western [<xref ref-type="bibr" rid="pcbi-0030182-b031">31</xref>] using interaction partners tagged either as C-terminal HA or Myc<sub>3</sub> epitope fusions and detection with 12CA5 anti-HA or 9E10 anti-Myc monoclonal antibodies, respectively (<xref ref-type="supplementary-material" rid="pcbi-0030182-sg002">Figure S2</xref>).</p></sec><sec id="s4e"><title>Overlap with literature.</title><p>The predicted interactions were compared to a new set of curated yeast interactions collected from more than 50,000 abstracts and publications [<xref ref-type="bibr" rid="pcbi-0030182-b033">33</xref>] (available at <ext-link ext-link-type="uri" xlink:href="http://www.thebiogrid.org" xlink:type="simple">www.thebiogrid.org</ext-link>). The probability of the observed overlap between the predicted interactions and the literature-curated interactions is approximated by a Poisson distribution. A random variable <italic>Y</italic> has a Poisson distribution if
					<disp-formula id="pcbi-0030182-e002"><graphic mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.0030182.e002" xlink:type="simple"/><!-- <mml:math display='block'><mml:mrow><mml:mi>P</mml:mi><mml:mo stretchy='false'>(</mml:mo><mml:mi>y</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:mo>&equals;</mml:mo><mml:mfrac><mml:mrow><mml:msup><mml:mi>e</mml:mi><mml:mrow><mml:mo>&minus;</mml:mo><mml:mi>&lambda;</mml:mi></mml:mrow></mml:msup><mml:msup><mml:mi>&lambda;</mml:mi><mml:mi>y</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mi>y</mml:mi><mml:mo>!</mml:mo></mml:mrow></mml:mfrac></mml:mrow></mml:math> --></disp-formula>where <italic>λ</italic> = <italic>Np</italic>, <italic>N</italic> is the sample size, and <italic>p</italic> is the probability of a single event; i.e., the probability of selecting a true interaction by random chance. In the current analysis, <italic>N</italic> is the number of predicted interactions (18,459), <italic>y</italic> is the number of literature-validated predictions (609), and <italic>p</italic> is the probability of predicting a correct interaction by random chance for the 703 proteins for which interactions were predicted. The value of <italic>p</italic> is approximated as the frequency of true interactions among all possible protein pairs that were considered. Since there is no known complete set of interactions for any reference organism, we cautiously assume an upper bound of 100 physiological interactions per bait protein. This number is likely an order of magnitude larger than the true value. Potential interactors for the 703 proteins containing domains with derived binding profiles were identified by scanning the entire yeast proteome (∼6,000 proteins) for proteins that matched the domains' binding profiles. Hence, the total number of protein pairs that were considered (i.e., the entire search space) is 703 × 6,000. 
The value of <italic>p</italic> is then <inline-formula id="pcbi-0030182-ex001"><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pcbi.0030182.ex001" xlink:type="simple"/></inline-formula>. Given these parameters, <italic>P</italic> (<italic>y</italic> ≥ 609) under a Poisson distribution is 1.0 × 10<sup>−13</sup>. A similar calculation using a hypergeometric distribution (sampling without replacement) yields a <italic>p</italic>-value of 1.0 × 10<sup>−8</sup>.
				</p></sec></sec><sec id="s5"><title>Supporting Information</title><supplementary-material id="pcbi-0030182-sd001" mimetype="application/zip" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0030182.sd001" xlink:type="simple"><label>Dataset S1</label><caption><title>Cytoscape Session File Containing the Validated and Predicted Protein Interactions</title><p>A Cytoscape session file containing the complete set of predicted interactions as well as the networks in <xref ref-type="fig" rid="pcbi-0030182-g002">Figures 2</xref>, <xref ref-type="fig" rid="pcbi-0030182-g003">3</xref>, <xref ref-type="supplementary-material" rid="pcbi-0030182-sg001">S1</xref>, and <xref ref-type="supplementary-material" rid="pcbi-0030182-sg002">S2</xref>. The networks can be viewed using the Cytoscape network visualization tool freely available at <ext-link ext-link-type="uri" xlink:href="http://www.cytoscape.org" xlink:type="simple">http://www.cytoscape.org</ext-link>.</p><p>(2.0 MB ZIP)</p></caption></supplementary-material><supplementary-material id="pcbi-0030182-sg001" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0030182.sg001" xlink:type="simple"><label>Figure S1</label><caption><title>The Overlap between the Predicted Interaction Network and a Comprehensive Set of Literature-Curated Interactions [<xref ref-type="bibr" rid="pcbi-0030182-b033">33</xref>]</title><p>The predicted interactions were compared to a new and exhaustive set of curated interactions extracted from the literature that includes physical interactions from both high-throughput and directed studies as well as genetic interactions. The overlap contains 609 interactions that represent ∼3% of the predicted interactions. 
Proteins are coloured according to Gene Ontology biological process annotation.</p><p>(519 KB PDF)</p></caption></supplementary-material><supplementary-material id="pcbi-0030182-sg002" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0030182.sg002" xlink:type="simple"><label>Figure S2</label><caption><title>IP-Western Results for the Novel Interactions Predicted by D-MIST</title><p>Bait proteins were purified using FLAG antibodies, and their interacting proteins were detected by antibodies specific to C-terminal HA or Myc<sub>3</sub> epitopes.</p><p>(325 KB PDF)</p></caption></supplementary-material><supplementary-material id="pcbi-0030182-se001" mimetype="text/plain" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0030182.sd002" xlink:type="simple"><label>Text S1</label><caption><title>The Domain-Binding Profiles Derived by D-MIST</title><p>Each domain-binding profile is specified as a list of sequence motifs. The sequence motifs are used as input to a PSSM search program [<xref ref-type="bibr" rid="pcbi-0030182-b056">56</xref>]. 
Source code available at <ext-link ext-link-type="uri" xlink:href="http://www.people.fas.harvard.edu/~junliu/index1.html#Computational_Biology" xlink:type="simple">http://www.people.fas.harvard.edu/~junliu/index1.html#Computational_Biology</ext-link>.</p><p>(2.7 MB TXT)</p></caption></supplementary-material></sec></body><back><ack><p>We thank Mai Vo, Brett Larsen, Pavel Metalnikov, and Howard Feldman for technical assistance.</p></ack><glossary><title>Abbreviations</title><def-list><def-item><term>D-MIST</term><def><p>domain–motif interactions from structural topology</p></def></def-item><def-item><term>IP-MS</term><def><p>immunoprecipitation followed by mass spectrometry</p></def></def-item><def-item><term>IP-western</term><def><p>immunoprecipitation followed by Western blotting</p></def></def-item><def-item><term>PSSM</term><def><p>position-specific scoring matrix</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="pcbi-0030182-b001"><label>1</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Gavin</surname><given-names>AC</given-names></name><name name-style="western"><surname>Aloy</surname><given-names>P</given-names></name><name name-style="western"><surname>Grandi</surname><given-names>P</given-names></name><name name-style="western"><surname>Krause</surname><given-names>R</given-names></name><name name-style="western"><surname>Boesche</surname><given-names>M</given-names></name><etal/></person-group>
					<year>2006</year>
					<article-title>Proteome survey reveals modularity of the yeast cell machinery.</article-title>
					<source>Nature</source>
					<volume>440</volume>
					<fpage>631</fpage>
					<lpage>636</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b002"><label>2</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Jones</surname><given-names>RB</given-names></name><name name-style="western"><surname>Gordus</surname><given-names>A</given-names></name><name name-style="western"><surname>Krall</surname><given-names>JA</given-names></name><name name-style="western"><surname>MacBeath</surname><given-names>G</given-names></name></person-group>
					<year>2006</year>
					<article-title>A quantitative protein interaction network for the ErbB receptors using protein microarrays.</article-title>
					<source>Nature</source>
					<volume>439</volume>
					<fpage>168</fpage>
					<lpage>174</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b003"><label>3</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Ptacek</surname><given-names>J</given-names></name><name name-style="western"><surname>Devgan</surname><given-names>G</given-names></name><name name-style="western"><surname>Michaud</surname><given-names>G</given-names></name><name name-style="western"><surname>Zhu</surname><given-names>H</given-names></name><name name-style="western"><surname>Zhu</surname><given-names>X</given-names></name><etal/></person-group>
					<year>2005</year>
					<article-title>Global analysis of protein phosphorylation in yeast.</article-title>
					<source>Nature</source>
					<volume>438</volume>
					<fpage>679</fpage>
					<lpage>684</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b004"><label>4</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Rual</surname><given-names>JF</given-names></name><name name-style="western"><surname>Venkatesan</surname><given-names>K</given-names></name><name name-style="western"><surname>Hao</surname><given-names>T</given-names></name><name name-style="western"><surname>Hirozane-Kishikawa</surname><given-names>T</given-names></name><name name-style="western"><surname>Dricot</surname><given-names>A</given-names></name><etal/></person-group>
					<year>2005</year>
					<article-title>Towards a proteome-scale map of the human protein–protein interaction network.</article-title>
					<source>Nature</source>
					<volume>437</volume>
					<fpage>1173</fpage>
					<lpage>1178</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b005"><label>5</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Stelzl</surname><given-names>U</given-names></name><name name-style="western"><surname>Worm</surname><given-names>U</given-names></name><name name-style="western"><surname>Lalowski</surname><given-names>M</given-names></name><name name-style="western"><surname>Haenig</surname><given-names>C</given-names></name><name name-style="western"><surname>Brembeck</surname><given-names>FH</given-names></name><etal/></person-group>
					<year>2005</year>
					<article-title>A human protein–protein interaction network: A resource for annotating the proteome.</article-title>
					<source>Cell</source>
					<volume>122</volume>
					<fpage>957</fpage>
					<lpage>968</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b006"><label>6</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Uetz</surname><given-names>P</given-names></name><name name-style="western"><surname>Dong</surname><given-names>YA</given-names></name><name name-style="western"><surname>Zeretzke</surname><given-names>C</given-names></name><name name-style="western"><surname>Atzler</surname><given-names>C</given-names></name><name name-style="western"><surname>Baiker</surname><given-names>A</given-names></name><etal/></person-group>
					<year>2006</year>
					<article-title>Herpesviral protein networks and their interaction with the human proteome.</article-title>
					<source>Science</source>
					<volume>311</volume>
					<fpage>239</fpage>
					<lpage>242</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b007"><label>7</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Shoemaker</surname><given-names>BA</given-names></name><name name-style="western"><surname>Panchenko</surname><given-names>AR</given-names></name></person-group>
					<year>2007</year>
					<article-title>Deciphering protein–protein interactions. Part I. Experimental techniques and databases.</article-title>
					<source>PLoS Comput Biol</source>
					<volume>3</volume>
					<elocation-id>e42</elocation-id>
				</element-citation></ref><ref id="pcbi-0030182-b008"><label>8</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Pawson</surname><given-names>T</given-names></name><name name-style="western"><surname>Nash</surname><given-names>P</given-names></name></person-group>
					<year>2003</year>
					<article-title>Assembly of cell regulatory systems through protein interaction domains.</article-title>
					<source>Science</source>
					<volume>300</volume>
					<fpage>445</fpage>
					<lpage>452</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b009"><label>9</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Dueber</surname><given-names>JE</given-names></name><name name-style="western"><surname>Yeh</surname><given-names>BJ</given-names></name><name name-style="western"><surname>Bhattacharyya</surname><given-names>RP</given-names></name><name name-style="western"><surname>Lim</surname><given-names>WA</given-names></name></person-group>
					<year>2004</year>
					<article-title>Rewiring cell signaling: The logic and plasticity of eukaryotic protein circuitry.</article-title>
					<source>Curr Opin Struct Biol</source>
					<volume>14</volume>
					<fpage>690</fpage>
					<lpage>699</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b010"><label>10</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Scott</surname><given-names>JD</given-names></name><name name-style="western"><surname>Pawson</surname><given-names>T</given-names></name></person-group>
					<year>2000</year>
					<article-title>Cell communication: The inside story.</article-title>
					<source>Sci Am</source>
					<volume>282</volume>
					<fpage>72</fpage>
					<lpage>79</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b011"><label>11</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Deng</surname><given-names>M</given-names></name><name name-style="western"><surname>Mehta</surname><given-names>S</given-names></name><name name-style="western"><surname>Sun</surname><given-names>F</given-names></name><name name-style="western"><surname>Chen</surname><given-names>T</given-names></name></person-group>
					<year>2002</year>
					<article-title>Inferring domain–domain interactions from protein–protein interactions.</article-title>
					<source>Genome Res</source>
					<volume>12</volume>
					<fpage>1540</fpage>
					<lpage>1548</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b012"><label>12</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Ng</surname><given-names>SK</given-names></name><name name-style="western"><surname>Zhang</surname><given-names>Z</given-names></name><name name-style="western"><surname>Tan</surname><given-names>SH</given-names></name><name name-style="western"><surname>Lin</surname><given-names>K</given-names></name></person-group>
					<year>2003</year>
					<article-title>InterDom: A database of putative interacting protein domains for validating predicted protein interactions and complexes.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>31</volume>
					<fpage>251</fpage>
					<lpage>254</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b013"><label>13</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Riley</surname><given-names>R</given-names></name><name name-style="western"><surname>Lee</surname><given-names>C</given-names></name><name name-style="western"><surname>Sabatti</surname><given-names>C</given-names></name><name name-style="western"><surname>Eisenberg</surname><given-names>D</given-names></name></person-group>
					<year>2005</year>
					<article-title>Inferring protein domain interactions from databases of interacting proteins.</article-title>
					<source>Genome Biol</source>
					<volume>6</volume>
					<fpage>R89</fpage>
				</element-citation></ref><ref id="pcbi-0030182-b014"><label>14</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Sprinzak</surname><given-names>E</given-names></name><name name-style="western"><surname>Margalit</surname><given-names>H</given-names></name></person-group>
					<year>2001</year>
					<article-title>Correlated sequence-signatures as markers of protein–protein interaction.</article-title>
					<source>J Mol Biol</source>
					<volume>311</volume>
					<fpage>681</fpage>
					<lpage>692</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b015"><label>15</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Y</given-names></name><name name-style="western"><surname>Liu</surname><given-names>N</given-names></name><name name-style="western"><surname>Zhao</surname><given-names>H</given-names></name></person-group>
					<year>2005</year>
					<article-title>Inferring protein–protein interactions through high-throughput interaction data from diverse organisms.</article-title>
					<source>Bioinformatics</source>
					<volume>21</volume>
					<fpage>3279</fpage>
					<lpage>3285</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b016"><label>16</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Guimaraes</surname><given-names>KS</given-names></name><name name-style="western"><surname>Jothi</surname><given-names>R</given-names></name><name name-style="western"><surname>Zotenko</surname><given-names>E</given-names></name><name name-style="western"><surname>Przytycka</surname><given-names>TM</given-names></name></person-group>
					<year>2006</year>
					<article-title>Predicting domain–domain interactions using a parsimony approach.</article-title>
					<source>Genome Biol</source>
					<volume>7</volume>
					<fpage>R104</fpage>
				</element-citation></ref><ref id="pcbi-0030182-b017"><label>17</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Aloy</surname><given-names>P</given-names></name><name name-style="western"><surname>Bottcher</surname><given-names>B</given-names></name><name name-style="western"><surname>Ceulemans</surname><given-names>H</given-names></name><name name-style="western"><surname>Leutwein</surname><given-names>C</given-names></name><name name-style="western"><surname>Mellwig</surname><given-names>C</given-names></name><etal/></person-group>
					<year>2004</year>
					<article-title>Structure-based assembly of protein complexes in yeast.</article-title>
					<source>Science</source>
					<volume>303</volume>
					<fpage>2026</fpage>
					<lpage>2029</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b018"><label>18</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Lu</surname><given-names>L</given-names></name><name name-style="western"><surname>Arakaki</surname><given-names>AK</given-names></name><name name-style="western"><surname>Lu</surname><given-names>H</given-names></name><name name-style="western"><surname>Skolnick</surname><given-names>J</given-names></name></person-group>
					<year>2003</year>
					<article-title>Multimeric threading-based prediction of protein–protein interactions on a genomic scale: Application to the <named-content content-type="genus-species" xlink:type="simple">Saccharomyces cerevisiae</named-content> proteome.</article-title>
					<source>Genome Res</source>
					<volume>13</volume>
					<fpage>1146</fpage>
					<lpage>1154</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b019"><label>19</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Jansen</surname><given-names>R</given-names></name><name name-style="western"><surname>Yu</surname><given-names>H</given-names></name><name name-style="western"><surname>Greenbaum</surname><given-names>D</given-names></name><name name-style="western"><surname>Kluger</surname><given-names>Y</given-names></name><name name-style="western"><surname>Krogan</surname><given-names>NJ</given-names></name><etal/></person-group>
					<year>2003</year>
					<article-title>A Bayesian networks approach for predicting protein–protein interactions from genomic data.</article-title>
					<source>Science</source>
					<volume>302</volume>
					<fpage>449</fpage>
					<lpage>453</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b020"><label>20</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Rhodes</surname><given-names>DR</given-names></name><name name-style="western"><surname>Tomlins</surname><given-names>SA</given-names></name><name name-style="western"><surname>Varambally</surname><given-names>S</given-names></name><name name-style="western"><surname>Mahavisno</surname><given-names>V</given-names></name><name name-style="western"><surname>Barrette</surname><given-names>T</given-names></name><etal/></person-group>
					<year>2005</year>
					<article-title>Probabilistic model of the human protein–protein interaction network.</article-title>
					<source>Nat Biotechnol</source>
					<volume>23</volume>
					<fpage>951</fpage>
					<lpage>959</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b021"><label>21</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Sharan</surname><given-names>R</given-names></name><name name-style="western"><surname>Suthram</surname><given-names>S</given-names></name><name name-style="western"><surname>Kelley</surname><given-names>RM</given-names></name><name name-style="western"><surname>Kuhn</surname><given-names>T</given-names></name><name name-style="western"><surname>McCuine</surname><given-names>S</given-names></name><etal/></person-group>
					<year>2005</year>
					<article-title>Conserved patterns of protein interaction in multiple species.</article-title>
					<source>Proc Natl Acad Sci U S A</source>
					<volume>102</volume>
					<fpage>1974</fpage>
					<lpage>1979</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b022"><label>22</label><element-citation publication-type="other" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>H</given-names></name><name name-style="western"><surname>Li</surname><given-names>J</given-names></name><name name-style="western"><surname>Tan</surname><given-names>SH</given-names></name><name name-style="western"><surname>Ng</surname><given-names>SK</given-names></name></person-group>
					<year>2004</year>
					<article-title>Discovery of binding motif pairs from protein complex structural data and protein interaction sequence data.</article-title>
					<source>Pac Symp Biocomput</source>
					<fpage>312</fpage>
					<lpage>323</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b023"><label>23</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Neduva</surname><given-names>V</given-names></name><name name-style="western"><surname>Linding</surname><given-names>R</given-names></name><name name-style="western"><surname>Su-Angrand</surname><given-names>I</given-names></name><name name-style="western"><surname>Stark</surname><given-names>A</given-names></name><name name-style="western"><surname>de Masi</surname><given-names>F</given-names></name><etal/></person-group>
					<year>2005</year>
					<article-title>Systematic discovery of new recognition peptides mediating protein interaction networks.</article-title>
					<source>PLoS Biol</source>
					<volume>3</volume>
					<elocation-id>e405</elocation-id>
				</element-citation></ref><ref id="pcbi-0030182-b024"><label>24</label><element-citation publication-type="other" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>H</given-names></name><name name-style="western"><surname>Segal</surname><given-names>E</given-names></name><name name-style="western"><surname>Ben-Hur</surname><given-names>A</given-names></name><name name-style="western"><surname>Koller</surname><given-names>D</given-names></name><name name-style="western"><surname>Brutlag</surname><given-names>D</given-names></name></person-group>
					<year>2005</year>
					<article-title>Identifying protein–protein interaction sites on a genome-wide scale.</article-title>
					<comment>In</comment>
					<person-group person-group-type="editor"><name name-style="western"><surname>Saul</surname><given-names>LK</given-names></name><name name-style="western"><surname>Weiss</surname><given-names>Y</given-names></name><name name-style="western"><surname>Bottou</surname><given-names>L</given-names></name></person-group>
					<source>Proceedings of the Conference Advances in Neural Information Processing Systems (NIPS)</source>
					<conf-date>13–18 December, 2004;</conf-date>
					<conf-loc>Vancouver, Canada.</conf-loc>
					<publisher-loc>Cambridge, Massachusetts, United States</publisher-loc>
					<fpage>1465</fpage>
					<lpage>1472</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b025"><label>25</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Shen</surname><given-names>J</given-names></name><name name-style="western"><surname>Zhang</surname><given-names>J</given-names></name><name name-style="western"><surname>Luo</surname><given-names>X</given-names></name><name name-style="western"><surname>Zhu</surname><given-names>W</given-names></name><name name-style="western"><surname>Yu</surname><given-names>K</given-names></name><etal/></person-group>
					<year>2007</year>
					<article-title>Predicting protein–protein interactions based only on sequences information.</article-title>
					<source>Proc Natl Acad Sci U S A</source>
					<volume>104</volume>
					<fpage>4337</fpage>
					<lpage>4341</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b026"><label>26</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Hou</surname><given-names>T</given-names></name><name name-style="western"><surname>Chen</surname><given-names>K</given-names></name><name name-style="western"><surname>McLaughlin</surname><given-names>WA</given-names></name><name name-style="western"><surname>Lu</surname><given-names>B</given-names></name><name name-style="western"><surname>Wang</surname><given-names>W</given-names></name></person-group>
					<year>2006</year>
					<article-title>Computational analysis and prediction of the binding motif and protein interacting partners of the Abl SH3 domain.</article-title>
					<source>PLoS Comput Biol</source>
					<volume>2</volume>
					<elocation-id>e1</elocation-id>
				</element-citation></ref><ref id="pcbi-0030182-b027"><label>27</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Reiss</surname><given-names>DJ</given-names></name><name name-style="western"><surname>Schwikowski</surname><given-names>B</given-names></name></person-group>
					<year>2004</year>
					<article-title>Predicting protein–peptide interactions via a network-based motif sampler.</article-title>
					<source>Bioinformatics</source>
					<volume>20</volume>
					<issue>(Supplement 1)</issue>
					<fpage>i274</fpage>
					<lpage>i282</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b028"><label>28</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Salama</surname><given-names>JJ</given-names></name><name name-style="western"><surname>Donaldson</surname><given-names>I</given-names></name><name name-style="western"><surname>Hogue</surname><given-names>CW</given-names></name></person-group>
					<year>2001</year>
					<article-title>Automatic annotation of BIND molecular interactions from three-dimensional structures.</article-title>
					<source>Biopolymers</source>
					<volume>61</volume>
					<fpage>111</fpage>
					<lpage>120</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b029"><label>29</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>DeLano</surname><given-names>WL</given-names></name><name name-style="western"><surname>Ultsch</surname><given-names>MH</given-names></name><name name-style="western"><surname>de Vos</surname><given-names>AM</given-names></name><name name-style="western"><surname>Wells</surname><given-names>JA</given-names></name></person-group>
					<year>2000</year>
					<article-title>Convergent solutions to binding at a protein–protein interface.</article-title>
					<source>Science</source>
					<volume>287</volume>
					<fpage>1279</fpage>
					<lpage>1283</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b030"><label>30</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Gavin</surname><given-names>AC</given-names></name><name name-style="western"><surname>Bosche</surname><given-names>M</given-names></name><name name-style="western"><surname>Krause</surname><given-names>R</given-names></name><name name-style="western"><surname>Grandi</surname><given-names>P</given-names></name><name name-style="western"><surname>Marzioch</surname><given-names>M</given-names></name><etal/></person-group>
					<year>2002</year>
					<article-title>Functional organization of the yeast proteome by systematic analysis of protein complexes.</article-title>
					<source>Nature</source>
					<volume>415</volume>
					<fpage>141</fpage>
					<lpage>147</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b031"><label>31</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Ho</surname><given-names>Y</given-names></name><name name-style="western"><surname>Gruhler</surname><given-names>A</given-names></name><name name-style="western"><surname>Heilbut</surname><given-names>A</given-names></name><name name-style="western"><surname>Bader</surname><given-names>GD</given-names></name><name name-style="western"><surname>Moore</surname><given-names>L</given-names></name><etal/></person-group>
					<year>2002</year>
					<article-title>Systematic identification of protein complexes in <named-content content-type="genus-species" xlink:type="simple">Saccharomyces cerevisiae</named-content> by mass spectrometry.</article-title>
					<source>Nature</source>
					<volume>415</volume>
					<fpage>180</fpage>
					<lpage>183</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b032"><label>32</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Thompson</surname><given-names>W</given-names></name><name name-style="western"><surname>Rouchka</surname><given-names>EC</given-names></name><name name-style="western"><surname>Lawrence</surname><given-names>CE</given-names></name></person-group>
					<year>2003</year>
					<article-title>Gibbs recursive sampler: Finding transcription factor binding sites.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>31</volume>
					<fpage>3580</fpage>
					<lpage>3585</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b033"><label>33</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Reguly</surname><given-names>T</given-names></name><name name-style="western"><surname>Breitkreutz</surname><given-names>A</given-names></name><name name-style="western"><surname>Boucher</surname><given-names>L</given-names></name><name name-style="western"><surname>Breitkreutz</surname><given-names>BJ</given-names></name><name name-style="western"><surname>Hon</surname><given-names>GC</given-names></name><etal/></person-group>
					<year>2006</year>
					<article-title>Comprehensive curation and analysis of global interaction networks in <named-content content-type="genus-species" xlink:type="simple">Saccharomyces cerevisiae</named-content>.</article-title>
					<source>J Biol</source>
					<volume>5</volume>
					<fpage>11</fpage>
				</element-citation></ref><ref id="pcbi-0030182-b034"><label>34</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Hernando</surname><given-names>Y</given-names></name><name name-style="western"><surname>Carter</surname><given-names>AT</given-names></name><name name-style="western"><surname>Parr</surname><given-names>A</given-names></name><name name-style="western"><surname>Hove-Jensen</surname><given-names>B</given-names></name><name name-style="western"><surname>Schweizer</surname><given-names>M</given-names></name></person-group>
					<year>1999</year>
					<article-title>Genetic analysis and enzyme activity suggest the existence of more than one minimal functional unit capable of synthesizing phosphoribosyl pyrophosphate in <named-content content-type="genus-species" xlink:type="simple">Saccharomyces cerevisiae</named-content>.</article-title>
					<source>J Biol Chem</source>
					<volume>274</volume>
					<fpage>12480</fpage>
					<lpage>12487</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b035"><label>35</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Larroy</surname><given-names>C</given-names></name><name name-style="western"><surname>Pares</surname><given-names>X</given-names></name><name name-style="western"><surname>Biosca</surname><given-names>JA</given-names></name></person-group>
					<year>2002</year>
					<article-title>Characterization of a <named-content content-type="genus-species" xlink:type="simple">Saccharomyces cerevisiae</named-content> NADP(H)–dependent alcohol dehydrogenase (ADHVII), a member of the cinnamyl alcohol dehydrogenase family.</article-title>
					<source>Eur J Biochem</source>
					<volume>269</volume>
					<fpage>5738</fpage>
					<lpage>5745</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b036"><label>36</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Krogan</surname><given-names>NJ</given-names></name><name name-style="western"><surname>Keogh</surname><given-names>MC</given-names></name><name name-style="western"><surname>Datta</surname><given-names>N</given-names></name><name name-style="western"><surname>Sawa</surname><given-names>C</given-names></name><name name-style="western"><surname>Ryan</surname><given-names>OW</given-names></name><etal/></person-group>
					<year>2003</year>
					<article-title>A Snf2 family ATPase complex required for recruitment of the histone H2A variant Htz1.</article-title>
					<source>Mol Cell</source>
					<volume>12</volume>
					<fpage>1565</fpage>
					<lpage>1576</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b037"><label>37</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Fan</surname><given-names>CY</given-names></name><name name-style="western"><surname>Lee</surname><given-names>S</given-names></name><name name-style="western"><surname>Cyr</surname><given-names>DM</given-names></name></person-group>
					<year>2003</year>
					<article-title>Mechanisms for regulation of Hsp70 function by Hsp40.</article-title>
					<source>Cell Stress Chaperones</source>
					<volume>8</volume>
					<fpage>309</fpage>
					<lpage>316</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b038"><label>38</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Cramer</surname><given-names>P</given-names></name></person-group>
					<year>2002</year>
					<article-title>Multisubunit RNA polymerases.</article-title>
					<source>Curr Opin Struct Biol</source>
					<volume>12</volume>
					<fpage>89</fpage>
					<lpage>97</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b039"><label>39</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Lalo</surname><given-names>D</given-names></name><name name-style="western"><surname>Carles</surname><given-names>C</given-names></name><name name-style="western"><surname>Sentenac</surname><given-names>A</given-names></name><name name-style="western"><surname>Thuriaux</surname><given-names>P</given-names></name></person-group>
					<year>1993</year>
					<article-title>Interactions between three common subunits of yeast RNA polymerases I and III.</article-title>
					<source>Proc Natl Acad Sci U S A</source>
					<volume>90</volume>
					<fpage>5524</fpage>
					<lpage>5528</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b040"><label>40</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Visintin</surname><given-names>R</given-names></name><name name-style="western"><surname>Craig</surname><given-names>K</given-names></name><name name-style="western"><surname>Hwang</surname><given-names>ES</given-names></name><name name-style="western"><surname>Prinz</surname><given-names>S</given-names></name><name name-style="western"><surname>Tyers</surname><given-names>M</given-names></name><etal/></person-group>
					<year>1998</year>
					<article-title>The phosphatase Cdc14 triggers mitotic exit by reversal of Cdk-dependent phosphorylation.</article-title>
					<source>Mol Cell</source>
					<volume>2</volume>
					<fpage>709</fpage>
					<lpage>718</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b041"><label>41</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Nelson</surname><given-names>B</given-names></name><name name-style="western"><surname>Kurischko</surname><given-names>C</given-names></name><name name-style="western"><surname>Horecka</surname><given-names>J</given-names></name><name name-style="western"><surname>Mody</surname><given-names>M</given-names></name><name name-style="western"><surname>Nair</surname><given-names>P</given-names></name><etal/></person-group>
					<year>2003</year>
					<article-title>RAM: A conserved signaling network that regulates Ace2p transcriptional activity and polarized morphogenesis.</article-title>
					<source>Mol Biol Cell</source>
					<volume>14</volume>
					<fpage>3782</fpage>
					<lpage>3803</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b042"><label>42</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Bidlingmaier</surname><given-names>S</given-names></name><name name-style="western"><surname>Weiss</surname><given-names>EL</given-names></name><name name-style="western"><surname>Seidel</surname><given-names>C</given-names></name><name name-style="western"><surname>Drubin</surname><given-names>DG</given-names></name><name name-style="western"><surname>Snyder</surname><given-names>M</given-names></name></person-group>
					<year>2001</year>
					<article-title>The Cbk1p pathway is important for polarized cell growth and cell separation in <named-content content-type="genus-species" xlink:type="simple">Saccharomyces cerevisiae</named-content>.</article-title>
					<source>Mol Cell Biol</source>
					<volume>21</volume>
					<fpage>2449</fpage>
					<lpage>2462</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b043"><label>43</label><element-citation publication-type="other" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Brenner</surname><given-names>S</given-names></name></person-group>
					<year>2002</year>
					<article-title>Life sentences: Ontology recapitulates philology.</article-title>
					<source>Genome Biol</source>
					<volume>3</volume>
					<comment>COMMENT1006. doi:<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1186/gb-2002-3-4-comment1006" xlink:type="simple">10.1186/gb-2002-3-4-comment1006</ext-link></comment>
				</element-citation></ref><ref id="pcbi-0030182-b044"><label>44</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Tong</surname><given-names>AH</given-names></name><name name-style="western"><surname>Drees</surname><given-names>B</given-names></name><name name-style="western"><surname>Nardelli</surname><given-names>G</given-names></name><name name-style="western"><surname>Bader</surname><given-names>GD</given-names></name><name name-style="western"><surname>Brannetti</surname><given-names>B</given-names></name><etal/></person-group>
					<year>2002</year>
					<article-title>A combined experimental and computational strategy to define protein interaction networks for peptide recognition modules.</article-title>
					<source>Science</source>
					<volume>295</volume>
					<fpage>321</fpage>
					<lpage>324</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b045"><label>45</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Yaffe</surname><given-names>MB</given-names></name><name name-style="western"><surname>Cantley</surname><given-names>LC</given-names></name></person-group>
					<year>2000</year>
					<article-title>Mapping specificity determinants for protein–protein association using protein fusions and random peptide libraries.</article-title>
					<source>Methods Enzymol</source>
					<volume>328</volume>
					<fpage>157</fpage>
					<lpage>170</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b046"><label>46</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>J</given-names></name><name name-style="western"><surname>Rost</surname><given-names>B</given-names></name></person-group>
					<year>2002</year>
					<article-title>Target space for structural genomics revisited.</article-title>
					<source>Bioinformatics</source>
					<volume>18</volume>
					<fpage>922</fpage>
					<lpage>933</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b047"><label>47</label><element-citation publication-type="other" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Peng</surname><given-names>K</given-names></name><name name-style="western"><surname>Obradovic</surname><given-names>Z</given-names></name><name name-style="western"><surname>Vucetic</surname><given-names>S</given-names></name></person-group>
					<year>2004</year>
					<article-title>Exploring bias in the Protein Data Bank using contrast classifiers.</article-title>
					<source>Pac Symp Biocomput</source>
					<fpage>435</fpage>
					<lpage>446</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b048"><label>48</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Chandonia</surname><given-names>JM</given-names></name><name name-style="western"><surname>Brenner</surname><given-names>SE</given-names></name></person-group>
					<year>2006</year>
					<article-title>The impact of structural genomics: Expectations and outcomes.</article-title>
					<source>Science</source>
					<volume>311</volume>
					<fpage>347</fpage>
					<lpage>351</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b049"><label>49</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Henrick</surname><given-names>K</given-names></name><name name-style="western"><surname>Thornton</surname><given-names>JM</given-names></name></person-group>
					<year>1998</year>
					<article-title>PQS: A protein quaternary structure file server.</article-title>
					<source>Trends Biochem Sci</source>
					<volume>23</volume>
					<fpage>358</fpage>
					<lpage>361</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b050"><label>50</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Marchler-Bauer</surname><given-names>A</given-names></name><name name-style="western"><surname>Anderson</surname><given-names>JB</given-names></name><name name-style="western"><surname>DeWeese-Scott</surname><given-names>C</given-names></name><name name-style="western"><surname>Fedorova</surname><given-names>ND</given-names></name><name name-style="western"><surname>Geer</surname><given-names>LY</given-names></name><etal/></person-group>
					<year>2003</year>
					<article-title>CDD: A curated Entrez database of conserved domain alignments.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>31</volume>
					<fpage>383</fpage>
					<lpage>387</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b051"><label>51</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Mulder</surname><given-names>NJ</given-names></name><name name-style="western"><surname>Apweiler</surname><given-names>R</given-names></name><name name-style="western"><surname>Attwood</surname><given-names>TK</given-names></name><name name-style="western"><surname>Bairoch</surname><given-names>A</given-names></name><name name-style="western"><surname>Barrell</surname><given-names>D</given-names></name><etal/></person-group>
					<year>2003</year>
					<article-title>The InterPro Database, 2003 brings increased coverage and new features.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>31</volume>
					<fpage>315</fpage>
					<lpage>318</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b052"><label>52</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Alfarano</surname><given-names>C</given-names></name><name name-style="western"><surname>Andrade</surname><given-names>CE</given-names></name><name name-style="western"><surname>Anthony</surname><given-names>K</given-names></name><name name-style="western"><surname>Bahroos</surname><given-names>N</given-names></name><name name-style="western"><surname>Bajec</surname><given-names>M</given-names></name><etal/></person-group>
					<year>2005</year>
					<article-title>The Biomolecular Interaction Network Database and related tools 2005 update.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>33</volume>
					<fpage>D418</fpage>
					<lpage>D424</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b053"><label>53</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Salwinski</surname><given-names>L</given-names></name><name name-style="western"><surname>Miller</surname><given-names>CS</given-names></name><name name-style="western"><surname>Smith</surname><given-names>AJ</given-names></name><name name-style="western"><surname>Pettit</surname><given-names>FK</given-names></name><name name-style="western"><surname>Bowie</surname><given-names>JU</given-names></name><etal/></person-group>
					<year>2004</year>
					<article-title>The Database of Interacting Proteins: 2004 update.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>32</volume>
					<fpage>D449</fpage>
					<lpage>D451</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b054"><label>54</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Zanzoni</surname><given-names>A</given-names></name><name name-style="western"><surname>Montecchi-Palazzi</surname><given-names>L</given-names></name><name name-style="western"><surname>Quondam</surname><given-names>M</given-names></name><name name-style="western"><surname>Ausiello</surname><given-names>G</given-names></name><name name-style="western"><surname>Helmer-Citterich</surname><given-names>M</given-names></name><etal/></person-group>
					<year>2002</year>
					<article-title>MINT: A Molecular INTeraction database.</article-title>
					<source>FEBS Lett</source>
					<volume>513</volume>
					<fpage>135</fpage>
					<lpage>140</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b055"><label>55</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Hermjakob</surname><given-names>H</given-names></name><name name-style="western"><surname>Montecchi-Palazzi</surname><given-names>L</given-names></name><name name-style="western"><surname>Lewington</surname><given-names>C</given-names></name><name name-style="western"><surname>Mudali</surname><given-names>S</given-names></name><name name-style="western"><surname>Kerrien</surname><given-names>S</given-names></name><etal/></person-group>
					<year>2004</year>
					<article-title>IntAct: An open source molecular interaction database.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>32</volume>
					<fpage>D452</fpage>
					<lpage>D455</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b056"><label>56</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Neuwald</surname><given-names>AF</given-names></name><name name-style="western"><surname>Liu</surname><given-names>JS</given-names></name><name name-style="western"><surname>Lawrence</surname><given-names>CE</given-names></name></person-group>
					<year>1995</year>
					<article-title>Gibbs motif sampling: Detection of bacterial outer membrane protein repeats.</article-title>
					<source>Protein Sci</source>
					<volume>4</volume>
					<fpage>1618</fpage>
					<lpage>1632</lpage>
				</element-citation></ref><ref id="pcbi-0030182-b057"><label>57</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Schneider</surname><given-names>TD</given-names></name><name name-style="western"><surname>Stephens</surname><given-names>RM</given-names></name></person-group>
					<year>1990</year>
					<article-title>Sequence logos: A new way to display consensus sequences.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>18</volume>
					<fpage>6097</fpage>
					<lpage>6100</lpage>
				</element-citation></ref></ref-list></back></article>