<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1471-2164-9-629</ui>
   <ji>1471-2164</ji>
   <fm>
      <dochead>Research article</dochead>
      <bibl>
         <title>
            <p>An evolutionary and structural characterization of mammalian protein complex organization</p>
         </title>
         <aug>
            <au id="A1">
               <snm>Wong</snm>
               <fnm>Philip</fnm>
               <insr iid="I1"/>
               <email>philip.wong@helmholtz-muenchen.de</email>
            </au>
            <au id="A2" ce="yes">
               <snm>Althammer</snm>
               <fnm>Sonja</fnm>
               <insr iid="I1"/>
               <email>sonjalthammer@yahoo.com</email>
            </au>
            <au id="A3" ce="yes">
               <snm>Hildebrand</snm>
               <fnm>Andrea</fnm>
               <insr iid="I1"/>
               <email>andrea.hildebrand@gmail.com</email>
            </au>
            <au id="A4" ce="yes">
               <snm>Kirschner</snm>
               <fnm>Andreas</fnm>
               <insr iid="I2"/>
               <email>a.kirschner@wzw.tum.de</email>
            </au>
            <au id="A5" ce="yes">
               <snm>Pagel</snm>
               <fnm>Philipp</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>p.pagel@helmholtz-muenchen.de</email>
            </au>
            <au id="A6">
               <snm>Geissler</snm>
               <fnm>Bernd</fnm>
               <insr iid="I2"/>
               <email>insight@web.de</email>
            </au>
            <au id="A7">
               <snm>Smialowski</snm>
               <fnm>Pawel</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>pawel@wzw.tum.de</email>
            </au>
            <au id="A8">
               <snm>Bl&#246;chl</snm>
               <fnm>Florian</fnm>
               <insr iid="I1"/>
               <email>florian.bloechl@helmholtz-muenchen.de</email>
            </au>
            <au id="A9">
               <snm>Oesterheld</snm>
               <fnm>Matthias</fnm>
               <insr iid="I1"/>
               <email>oesterh@yahoo.de</email>
            </au>
            <au id="A10">
               <snm>Schmidt</snm>
               <fnm>Thorsten</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>t.schmidt@wzw.tum.de</email>
            </au>
            <au id="A11">
               <snm>Strack</snm>
               <fnm>Normann</fnm>
               <insr iid="I1"/>
               <email>norman.strack@helmholtz-muenchen.de</email>
            </au>
            <au id="A12">
               <snm>Theis</snm>
               <mi>J</mi>
               <fnm>Fabian</fnm>
               <insr iid="I1"/>
               <insr iid="I3"/>
               <email>fabian.theis@helmholtz-muenchen.de</email>
            </au>
            <au id="A13">
               <snm>Ruepp</snm>
               <fnm>Andreas</fnm>
               <insr iid="I1"/>
               <email>andreas.ruepp@helmholtz-muenchen.de</email>
            </au>
            <au id="A14" ca="yes">
               <snm>Frishman</snm>
               <fnm>Dmitrij</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>d.frishman@wzw.tum.de</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Helmholtz Center Munich &#8211; German Research Center for Environmental Health (GmbH), Institute of Bioinformatics and Systems Biology, Ingolst&#228;dter Landstra&#223;e 1 D-85764 Neuherberg, Germany</p>
            </ins>
            <ins id="I2">
               <p>Department of Genome Oriented Bioinformatics, Technische Universit&#228;t M&#252;nchen, Wissenschaftzentrum Weihenstephan, 85350 Freising, Germany</p>
            </ins>
            <ins id="I3">
               <p>Max-Planck-Institute for Dynamics and Self-Organization, Bunsenstrasse 10, 37073 G&#246;ttingen, Germany</p>
            </ins>
         </insg>
         <source>BMC Genomics</source>
         <issn>1471-2164</issn>
         <pubdate>2008</pubdate>
         <volume>9</volume>
         <issue>1</issue>
         <fpage>629</fpage>
         <url>http://www.biomedcentral.com/1471-2164/9/629</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">19108706</pubid>
               <pubid idtype="doi">10.1186/1471-2164-9-629</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>17</day>
               <month>7</month>
               <year>2008</year>
            </date>
         </rec>
         <acc>
            <date>
               <day>23</day>
               <month>12</month>
               <year>2008</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>23</day>
               <month>12</month>
               <year>2008</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2008</year>
         <collab>Wong et al; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>We have recently released a comprehensive, manually curated database of mammalian protein complexes called CORUM. Combining CORUM with other resources, we assembled a dataset of over 2700 mammalian complexes. The availability of a rich information resource allows us to search for organizational properties concerning these complexes.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>As the complexity of a protein complex in terms of the number of unique subunits increases, we observed that the number of such complexes and the mean non-synonymous to synonymous substitution ratio of associated genes tend to decrease. Similarly, as the number of different complexes a given protein participates in increases, the number of such proteins and the substitution ratio of the associated gene also tends to decrease. These observations provide evidence relating natural selection and the organization of mammalian complexes. We also observed greater homogeneity in terms of predicted protein isoelectric points, secondary structure and substitution ratio in annotated versus randomly generated complexes. A large proportion of the protein content and interactions in the complexes could be predicted from known binary protein-protein and domain-domain interactions. In particular, we found that large proteins interact preferentially with much smaller proteins.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>We observed similar trends in yeast and other data. Our results support the existence of conserved relations associated with the mammalian protein complexes.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>Knowledge of constraints governing systems provides a means to predict events and mechanisms that cause their breakdown. It may also allow one to speculate how such systems might have evolved. One class of biological systems that have captured much interest involves protein-protein interactions and protein complexes. Protein complexes are groups of two or more proteins that physically interact. Such interaction serves to spatially join, modify or create novel functional capability from component proteins. Once in a complex, proteins can achieve greater structural stabilization and protection from proteases, which result in significantly longer half-lives <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B2">2</abbr></abbrgrp>. A breakdown in complex assembly has been associated with a number of diseases <abbrgrp><abbr bid="B3">3</abbr><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr></abbrgrp>.</p>
         <p>What forces have shaped the formation of complexes and what is their effect? The formation of quaternary structure is associated with greater constraint in the evolution of proteins <abbrgrp><abbr bid="B6">6</abbr><abbr bid="B7">7</abbr><abbr bid="B8">8</abbr></abbrgrp>. Recently, a large collection of manually annotated mammalian complexes has become available in the CORUM database <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>. The combination of data from this resource and complexes derived from HPRD <abbrgrp><abbr bid="B10">10</abbr></abbrgrp> and BIND <abbrgrp><abbr bid="B11">11</abbr></abbrgrp> allows for one of the largest investigations of complex-specific protein constraints in mammalian species to date.</p>
         <p>Recently, complexes have been investigated in the context of intrinsic disorder <abbrgrp><abbr bid="B12">12</abbr></abbrgrp> and aggregation propensity of the subunits <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>. In this study, we focus on two characteristics of complexes: the complexity of a complex as represented by the number of unique proteins in a complex and the number of complexes a particular protein participates in. The number of protein subunits that bind together fluctuates in the context of different conditions. Complexes extracted from cells can be viewed as snapshot samples of proteins that have come together with adequate stability to be isolated. We subsequently derive 'complex participation' for individual proteins by counting the number of complexes that they belong to, in our large combined collection of protein complex samples.</p>
         <p>Although these characteristics of complexes are dynamic, their relation to properties of component proteins derived in their isolated state can be studied. By deriving these relations, we hope to gain insight into certain constraints governing the organization of complexes. Here, we find evidence that protein length, predicted secondary structure and isoelectric point, as well as the nonsynonymous/synonymous substitution ratio of genes are associated with our measures of complex complexity and participation.</p>
         <p>Available data on protein-protein interactions have been used extensively to predict complexes <abbrgrp><abbr bid="B14">14</abbr><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr><abbr bid="B21">21</abbr><abbr bid="B22">22</abbr><abbr bid="B23">23</abbr><abbr bid="B24">24</abbr><abbr bid="B25">25</abbr></abbrgrp>. A strong discriminator between interacting and non-interacting protein pairs appears to be the presence of domains known to interact <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>. We assess the utility of known binary protein-protein and domain-domain interactions in predicting the composition and interactions in the mammalian complexes that we have collected.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <sec>
            <st>
               <p>Complex and Interaction data</p>
            </st>
            <p>1732 experimentally verified protein complexes annotated at MIPS <abbrgrp><abbr bid="B27">27</abbr></abbrgrp> and stored in the CORUM database <abbrgrp><abbr bid="B9">9</abbr></abbrgrp> were combined with 631 complexes retrieved from HPRD <abbrgrp><abbr bid="B10">10</abbr></abbrgrp> and 538 complexes from BIND <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>. After removal of redundancy, there were 2706 different complexes containing 4543 different proteins from human, mouse, rat, dog, rabbit, cow, pig and other mammals. Of these 2706 unique complexes, 665 are subcomplexes of other complexes in the data. A more detailed description of the complexes appears in the additional files [see Additional file <supplr sid="S1">1</supplr>].</p>
            <suppl id="S1">
               <title>
                  <p>Additional File 1</p>
               </title>
               <text>
                  <p><b>Description of the protein complex data.</b> A detailed description of annotated and random complex data used.</p>
               </text>
               <file name="1471-2164-9-629-S1.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>The focus of this study was on mammalian complexes but we also analyzed the MIPS yeast complexes stored in CYGD <abbrgrp><abbr bid="B28">28</abbr></abbrgrp>. We use a set of 1142 unique yeast complexes consisting of 2755 proteins. A much larger set of yeast complexes consisting of 5370 proteins in 2025 complexes was produced by merging the MIPS yeast complexes with the 893 complexes predicted by Friedel et al. <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. We will refer to this set of complexes as the 'extended yeast complex set'. Possible estimates of the completeness of the human and yeast complex data appear in the additional files [see Additional file <supplr sid="S1">1</supplr>].</p>
            <p>We assembled 94906 pairwise eukaryotic protein-protein interactions from BIND, DIP <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>, HPRD, MINT <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>, Mpact <abbrgrp><abbr bid="B31">31</abbr></abbrgrp> and MPPI <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>. 29074 of those interactions were between different proteins from human, mouse or rat and were used in this study. We also retrieved 127514 binary protein interactions by over 36500 proteins from IntAct <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>. We will refer to interaction data from IntAct in the text specifically with the word 'IntAct' to distinguish from the interaction set we collected.</p>
            <p>We refer as domain-domain interactions in the text as those derived from known 3D structures of proteins, obtained from the iPfam <abbrgrp><abbr bid="B34">34</abbr></abbrgrp> and 3did <abbrgrp><abbr bid="B35">35</abbr></abbrgrp> database. There are 3654 such interactions between protein domains in total. Pfam domains of protein sequences were taken from Uniprot <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>. We assume that peptide chains in PDB structures with C-beta atoms within 8 Angstroms of each other interact.</p>
            <p>We generated random complexes using two different random models to evaluate significance of trends associated with non-stochastic protein complex organization. For the random model in the main text (Model 1), we generated the same number of random complexes as found in annotated complexes by picking the same number of proteins as found in each of the annotated complexes from a pool of all proteins collected from these complexes. We picked proteins randomly with replacement throughout the process of random complex generation to simulate neutrality of protein reuse in the complexes. A second random model (Model 2) of the complexes which uses the complex complexity and participation preserving rewiring method, first introduced by Maslov and Sneppen <abbrgrp><abbr bid="B37">37</abbr></abbrgrp> was also tested [see Additional file <supplr sid="S1">1</supplr>]. In certain parts of this paper, we used sets of randomly generated complexes (each set containing the same number of complexes as found in the annotated complexes) in Monte-Carlo simulations (denoted MC-test) to derive p-values for significance statements. P-values of events were estimated by the fraction of random simulations supporting the null hypothesis.</p>
         </sec>
         <sec>
            <st>
               <p>Computed features of genes and proteins</p>
            </st>
            <p>Secondary structure was predicted with PSIPRED <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. Our conclusions did not change when we repeated our experiments using SSPRO <abbrgrp><abbr bid="B39">39</abbr></abbrgrp>. The performance of PSIPRED in terms of secondary structure content prediction is benchmarked [see Additional file <supplr sid="S2">2</supplr>]. We measured human protein evolutionary rates by non-synonymous to synonymous substitution (<it>dN/dS</it>) ratios computed from coding sequences of ortholog pairs from Ensembl <abbrgrp><abbr bid="B40">40</abbr></abbrgrp>. Yeast (<it>S. cerevisiae</it>) gene <it>dN/dS </it>ratios were computed using orthologs <abbrgrp><abbr bid="B41">41</abbr></abbrgrp> from <it>S. mikatae </it>by PAL2NAL <abbrgrp><abbr bid="B42">42</abbr></abbrgrp> with default parameters and Codeml from the PAML package <abbrgrp><abbr bid="B43">43</abbr></abbrgrp>. The smallest <it>dN/dS </it>ratio was recorded for each gene when more than one potential ortholog was identified (our conclusions did not change if we chose the larger one). The values of <it>dN/dS </it>depend on the calculation methodology but they should be comparable within the same species pairs chosen. Note that only <it>dN/dS </it>ratios less than 1 (computed from human-mouse orthologs) were associated with the annotated human complexes. The mean <it>dN/dS </it>ratio of individual genes encoding a given protein complex was taken as a measure of selection associated with the protein complex. We focused on a measure of evolutionary rate reflecting more on changes in protein sequence. We considered evolution at synonymous sites <abbrgrp><abbr bid="B44">44</abbr><abbr bid="B45">45</abbr></abbrgrp> to be neutral.</p>
            <suppl id="S2">
               <title>
                  <p>Additional File 2</p>
               </title>
               <text>
                  <p><b>Benchmark of PSIPRED.</b> A benchmark of PSIPRED's ability to predict secondary structure content from protein sequences is provided.</p>
               </text>
               <file name="1471-2164-9-629-S2.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>We refer to "pI" in the text as values obtained from BioPerl-based <abbrgrp><abbr bid="B46">46</abbr></abbrgrp> isoelectric point prediction on protein sequences. Essential genes for <it>S. cerevisiae </it>were taken from CYGD <abbrgrp><abbr bid="B28">28</abbr></abbrgrp>. Essential genes for human were gathered by merging those from <abbrgrp><abbr bid="B47">47</abbr></abbrgrp> and Table S6 of <abbrgrp><abbr bid="B48">48</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Statistics of trends in 2-D plots</p>
            </st>
            <p>We assessed trends concerning 2-dimensional protein complex data by first applying standard linear regression to see if there is a noticeable slope different from a horizontal line (observed when the y values do not depend on the x values). We considered a given trend to be significantly associated with non-stochastic protein complex organization if the p-value reported by the t-test on the slope of the regression line (the null hypothesis being a slope = 0) was less than the maximum value observed when 1000 sets of random human or yeast complexes were generated. For example, when random complexes were generated from entire sets of annotated complexes, p-values associated with plots between mean <it>dN/dS </it>values and complex complexity for these random complexes were always above 0.003; so we set this value as a threshold of significance for such trends. However, the use of the t-test by itself is potentially inadequate because it could be significantly affected by biases in our snap-shot protein complex samples. So in addition, we repeated the same plots using sets of complexes likely to have different biases. These include the MIPS yeast complexes, the extended yeast complex set, sets of complexes where subcomplexes were removed and sets of complexes in different subcellular compartments. Unless otherwise stated, only those trends in which all assessments (from the regression line analysis to the analysis with other complex datasets) are considered significant are reported. Analysis was aided by the PROMPT tool <abbrgrp><abbr bid="B49">49</abbr></abbrgrp>.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Results and discussion</p>
         </st>
         <sec>
            <st>
               <p>Complex Complexity and Participation</p>
            </st>
            <p>We first examined the distribution of complex complexity, the number of unique proteins in a complex. Amongst all mammalian complexes collected, the number of unique proteins ranges from one for homo-oligomers to 142 (U2-type spliceosome [CORUM:351]). When the number of unique proteins increases past 4, complexes become increasingly rare following a power law-like distribution (Figure <figr fid="F1">1A</figr>). When we considered yeast complexes, we saw similar trends [see Additional file <supplr sid="S3">3</supplr>].</p>
            <suppl id="S3">
               <title>
                  <p>Additional File 3</p>
               </title>
               <text>
                  <p><b>Yeast complex complexity and participation distributions.</b> The distribution of yeast complex complexity and participation approximately follows a power- law.</p>
               </text>
               <file name="1471-2164-9-629-S3.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Composition of mammalian complexes</p>
               </caption>
               <text>
                  <p><b>Composition of mammalian complexes</b>. A) The number of complexes (y-axis) with a particular number of unique proteins (x-axis) is plotted. B) The number of proteins (y-axis) participating in a particular number of complexes (x-axis) is plotted.</p>
               </text>
               <graphic file="1471-2164-9-629-1"/>
            </fig>
            <p>Not all proteins are exclusive to a single complex. Having defined complex participation as the number of complexes that a particular protein is found in, we find that it also follows a power law-like distribution (Figure <figr fid="F1">1B</figr>, [Additional file <supplr sid="S3">3</supplr>]). Some of the proteins currently with the highest complex participation include human integrin beta-1 [Uniprot:P05556], histone deacetylase 1 [Uniprot:Q13547] and RING-box protein 1 [Uniprot:P62877] which were annotated to be in 54, 39 and 24 complexes, respectively so far.</p>
            <p>The decrease in the number of complexes as the number of subunits increase might be a reflection of the increased difficulty in assembling and thus evolving larger beneficial complexes. Although this trend seems to follow a power law, as commonly reported for biological networks <abbrgrp><abbr bid="B50">50</abbr></abbrgrp>, we could not ascertain if this truly is the case. Similarly, we could not ascertain whether complex participation follows a power law. Our observed complex complexity and participation distributions may be the result of our complexes being samples of mammalian proteins <abbrgrp><abbr bid="B51">51</abbr><abbr bid="B52">52</abbr></abbrgrp> derived under a variety of conditions [Additional file <supplr sid="S1">1</supplr>]. The number of unique proteins in yeast complexes was also observed to follow a similar-shaped distribution and an exponential model of the data has been proposed <abbrgrp><abbr bid="B53">53</abbr><abbr bid="B54">54</abbr></abbrgrp>. In both mammalian and yeast complexes, most proteins belong to few complexes, thus supporting the idea of modularity <abbrgrp><abbr bid="B55">55</abbr></abbrgrp> between complexes in the context of the protein-protein interaction network that have been examined.</p>
         </sec>
         <sec>
            <st>
               <p>The length of proteins in complexes</p>
            </st>
            <p>One of the simplest protein properties to study is the length of the protein in terms of the number of amino acids. The distribution of human protein lengths is skewed towards smaller values and subsequently when we sample uniformly from this distribution to generate random complexes, the distribution of the protein lengths remains skewed (Figure <figr fid="F2">2A</figr>). The mean length of proteins in this distribution is ~500 amino acids (Figure <figr fid="F2">2A</figr>).</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Protein length in human complexes</p>
               </caption>
               <text>
                  <p><b>Protein length in human complexes</b>. A) Length distribution of proteins in human complexes generated randomly from the entire known human proteome. Mean lengths of proteins versus the number of unique subunits in: B) model 1 random complexes generated from the entire proteome C) annotated human complexes D) model 1 random human complexes generated from data we collected.</p>
               </text>
               <graphic file="1471-2164-9-629-2"/>
            </fig>
            <p>By picking proteins with replacement from the distribution of proteins in Figure <figr fid="F2">2A</figr>, we generated random complexes and plotted the complexity of the complexes in terms of the number of unique subunits against the mean length of these subunits (Figure <figr fid="F2">2B</figr>). As complex complexity increases the upper bound for mean lengths of proteins drops (before 20 unique proteins) and levels out at ~510 amino acids for more complex complexes. Because the mean length of proteins in the human proteome which we sample from is ~500 amino acids, as one adds more random proteins to complexes, the mean length of proteins in the complexes tends to stabilize near 500 amino acids. This observation was similarly made in annotated human complexes (Figure <figr fid="F2">2C</figr>) and random complexes generated from this annotated data (Figure <figr fid="F2">2D</figr>). A similar asymptotic bound is thus formed in all our plots. For example, mean lengths of 2000 amino acids were absent in complexes of more than 20 subunits in both the random and the complexes that we have collected. Like for the random human complexes, the mean protein length distribution for the real human complexes (Figure <figr fid="F2">2C</figr>) was also skewed towards smaller protein lengths. Similar plots were observed for all mammalian complexes that we collected and Model 2 random complexes [Additional file <supplr sid="S4">4</supplr>]. These results suggest that the mean protein length in complexes reflects to an observable degree the length distribution of proteins encoded in the proteome (Figure <figr fid="F2">2A</figr>). Similar observations were made when the median length of proteins was studied in the context of complex complexity [Additional file <supplr sid="S5">5</supplr>].</p>
            <suppl id="S4">
               <title>
                  <p>Additional File 4</p>
               </title>
               <text>
                  <p><b>Mammalian complex complexity and protein length. </b>The mean length of proteins in available mammalian complexes is examined with respect to complex complexity.</p>
               </text>
               <file name="1471-2164-9-629-S4.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S5">
               <title>
                  <p>Additional File 5</p>
               </title>
               <text>
                  <p><b>Median length of proteins in annotated human complexes.</b> The median length of proteins in human complexes is examined with respect to complex complexity.</p>
               </text>
               <file name="1471-2164-9-629-S5.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>In contrast to randomly generated complexes, the complexes that we have collected had much more variable mean lengths, especially for complexes with large numbers of subunits. We observe this as an increased scattering of points on the right side of the plot (Figure <figr fid="F2">2C</figr>). This phenomenon was similarly observed in yeast complexes [Additional file <supplr sid="S6">6</supplr>]. In particular, when complex complexity increases past 20 different subunits, complexes with mean protein lengths below 250 amino acids are rarely generated randomly (Random Model 1: P &lt; 10<sup>-6</sup>) but are present in annotated mammalian and yeast complexes. For example, the 81 subunits of the human ribosomal complex [CORUM:306] have a mean length of 169 amino acids and the 37 subunits of the mouse mitochondrial NADH dehydrogenase complex [CORUM:381] have a mean length of 234 amino acids.</p>
            <suppl id="S6">
               <title>
                  <p>Additional File 6</p>
               </title>
               <text>
                  <p><b>Yeast complex complexity and protein length.</b> The mean length of proteins in available yeast complexes is examined with respect to complex complexity.</p>
               </text>
               <file name="1471-2164-9-629-S6.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>Although the complexes analyzed are samples of what is in cells, it is a large set that has been manually annotated. Assuming that the plots in Figure <figr fid="F2">2</figr> capture length constraint bounds, they can provide rules of thumb for spot-checking errors in newly isolated complexes. For example, if an isolated human complex of 10 subunits had a mean subunit length of 2000 amino acids, our plots suggest that large numbers of additional missing subunits of length 2000 or more are unlikely. If such a complex did exist, then it would be striking given both the annotated complex data (Figure <figr fid="F2">2C</figr>) and data generated from random complexes (Figure <figr fid="F2">2B</figr>, Figure <figr fid="F2">2D</figr>; [Additional file <supplr sid="S4">4</supplr>]). Unusual property distributions associated with complexes provide initial suggestions of errors in the composition of the complexes or unusual constraints associated with these complexes. For example, the average length of a large sample of human mitochondrial proteins appears to be much smaller than the average length of all human proteins (means &#177; standard deviation/medians are: ~320 &#177; 304/235aa vs. ~500 &#177; 551/364aa, respectively; MW, KS-test (Mann-Whitney, Kolmogorov-Smirnov tests): P &lt; 10<sup>-57</sup>) in the Eukaryotic Subcellular Localization Database <abbrgrp><abbr bid="B56">56</abbr></abbrgrp> [Additional file <supplr sid="S7">7</supplr>]. Similar results were obtained when we used the reference set from MitoP2 <abbrgrp><abbr bid="B57">57</abbr></abbrgrp> as a source of mitochondrial proteins. Despite large amounts of protein turnover since the mitochondria prokaryotic origin <abbrgrp><abbr bid="B58">58</abbr></abbrgrp>, most (> 97%) human mitochondrial proteins have lengths less than 1000 amino acids. These results suggest unusual size constraints associated with mitochondrial proteins. Mitochondria-related functions, the need for proteins to import into the mitochondria <abbrgrp><abbr bid="B59">59</abbr></abbrgrp>, the presence of reactive oxygen species which can impose difficulties for protein folding <abbrgrp><abbr bid="B60">60</abbr></abbrgrp> are possible reasons which may have helped limit the incorporation of very large proteins into mitochondria. The scarcity of large proteins in the mitochondria, in turn, will likely limit mean protein lengths of its complexes. Although many (300/1962 = 15%) human complexes in our data have mean protein lengths over 1000 amino acids (Figure <figr fid="F2">2C</figr>), none of the 28 mitochondrial human complexes we annotated so far exceed this limit. If mean protein lengths in complexes reflect protein length distributions, we expect hetero-oligomeric mitochondria human complexes with mean protein lengths over 1000 amino acids to be extremely rare.</p>
            <suppl id="S7">
               <title>
                  <p>Additional File 7</p>
               </title>
               <text>
                  <p><b>Length distribution of human mitochondrial proteins.</b> The length distribution of human mitochondrial proteins is plotted.</p>
               </text>
               <file name="1471-2164-9-629-S7.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>The relative lack of complexes with many (>20) different large proteins (> 1500aa) in both mammals and yeast suggests that evolving such complexes is also extremely difficult. Smaller subunits may be easier to fold, transport <abbrgrp><abbr bid="B61">61</abbr></abbrgrp>, require less conformation sampling <abbrgrp><abbr bid="B2">2</abbr></abbrgrp> and undergo smaller entropic loss [<abbrgrp><abbr bid="B62">62</abbr></abbrgrp> &#8211; Supplement] during complex assembly. These factors may have contributed to the absence of highly complex complexes with many large proteins in our data.</p>
         </sec>
         <sec>
            <st>
               <p>Natural selection and complexes</p>
            </st>
            <p>To understand observations from a more evolutionary point of view, we analyzed non-synonymous to synonymous substitution ratios (<it>dN/dS</it>) derived from human coding sequences and their alignments with orthologs from mouse (Figure <figr fid="F3">3</figr>). One way of comparing selection on coding sequences associated with different complexes is by their mean <it>dN/dS </it>ratios derived from the same species pairs.</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Complexes and selection</p>
               </caption>
               <text>
                  <p><b>Complexes and selection</b>. <it>dN/dS </it>distribution of genes associated with A) all human proteins and B) proteins in the human complex data. D) The mean <it>dN/dS </it>ratio for human-mouse orthologs is plotted against the number of unique proteins in the complex. Complexes with more unique proteins have a significantly smaller mean <it>dN/dS </it>ratios than those with less unique proteins (t-test: P &lt; 3.1 &#215; 10<sup>-7</sup>). F) The <it>dN/dS </it>ratio for human-mouse orthologs is plotted against the number of complexes they participate in. Proteins participating in more complexes have significantly lower <it>dN/dS </it>ratios than those with less complex participation (t-test: P &lt; 7.4 &#215; 10<sup>-9</sup>). C, E) Both trends are rarely observed for model 1 random complexes.</p>
               </text>
               <graphic file="1471-2164-9-629-3"/>
            </fig>
            <p>For example, proteins from the human MBD1-MCAF complex [CORUM:2759] are encoded by two genes with a mean <it>dN/dS </it>ratio of 0.37, computed from mouse orthologs. The sequences coding for this complex seem to be under much less selective constraint than ones coding the eIF3 complex [CORUM:742] which is associated with a mean <it>dN/dS </it>ratio of 0.04 (Stdv. = 0.03, median = 0.02).</p>
            <p>It has been noted previously that easily alignable eukaryotic mRNAs are over-represented for multi-subunit complexes <abbrgrp><abbr bid="B63">63</abbr></abbrgrp> due to increased sequence conservation. In terms of trends, we find that as the complexity of the complex increases, the mean <it>dN/dS </it>ratio of human genes of associated constituent proteins tends to decrease suggesting that complex complexity negatively correlates with purifying selective pressure on genes (Figure <figr fid="F3">3D</figr>). The trend is not extremely strong but such a trend was not observed with random complexes (Figure <figr fid="F3">3C</figr>; [Additional file <supplr sid="S8">8</supplr>]). In particular, complexes with more than 15 proteins and mean <it>dN/dS </it>ratios below 0.07 are absent in our random complex set. For example, the 20 genes from the PA700 proteosome regulator complex [CORUM:32] have a mean <it>dN/dS </it>ratio of 0.03 but such complexes are not likely generated randomly (Random model 1: P &lt; 0.05). A contributing reason can be derived by examining the distribution of <it>dN/dS </it>ratios. The distribution of human-mouse <it>dN/dS </it>ratios is skewed towards small values considering all known human genes with over 40% of the values &lt; 0.1 (Figure <figr fid="F3">3A</figr>). The distribution of <it>dN/dS </it>ratios associated with our sample of annotated complexes (Figure <figr fid="F3">3B</figr>) is likewise skewed with 60% of the values &lt; 0.1. In both cases, the mean <it>dN/dS </it>ratio is close to ~0.1. As more randomly-selected proteins are added to form random complexes, the mean <it>dN/dS </it>ratio for genes associated with the complexes tends to stabilize also at 0.1. Thus, highly complex complexes with mean <it>dN/dS </it>ratios substantially below 0.1 are rarely generated randomly.</p>
            <suppl id="S8">
               <title>
                  <p>Additional File 8</p>
               </title>
               <text>
                  <p><b>Random complexes and dN/dS (Human-Mouse Orthologs).</b> dN/dS ratios of genes associated with model 2 random complexes are examined with respect to complex complexity and participation.</p>
               </text>
               <file name="1471-2164-9-629-S8.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>Knowing that many proteins belong to more than one complex, we also asked how this fact was related to selective pressure. We find that as the number of complexes a protein participates in increases, the <it>dN/dS </it>ratio of corresponding genes also tends to decrease (Figure <figr fid="F3">3F</figr>), suggesting that complex participation also correlates negatively with the <it>dN/dS </it>ratio. This trend is not observed when complexes were generated randomly by picking proteins with replacement (Figure <figr fid="F3">3E</figr>). From such randomly generated complexes, proteins participating in more than 10 complexes rarely occur, but they are clearly present in our annotated data. Binned average plots of Figures <figr fid="F3">3D</figr> and <figr fid="F3">3F</figr> appear in the additional files [see Additional file <supplr sid="S9">9</supplr>].</p>
            <suppl id="S9">
               <title>
                  <p>Additional File 9</p>
               </title>
               <text>
                  <p><b>Binned Plots for Figures 3D and 3F</b>.<figr fid="F3">3</figr></p>
               </text>
               <file name="1471-2164-9-629-S9.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>Because such results could potentially be sensitive to the ortholog pairs compared, the quality of the gene models, and peculiarities of human/mouse evolution, we also repeated such analyses using a variety of other mammals [see Additional file <supplr sid="S10">10</supplr>]. For human-dog, human-chimp and human-rat orthologs, we observed similar trends although in the closely related human-chimp case in which complex complexity was plotted against mean <it>dN/dS</it>, the trend was not statistically significant. We also had similar observations with yeast complexes using <it>S. cerevisiae </it>&#8211; <it>S. mikatae</it>, <it>S. cerevisiae </it>&#8211; <it>S. paradoxus </it>orthologs. We did not observe such trends from <it>dN/dS </it>ratios derived from the more distant pairing of <it>S. cerevisiae </it>&#8211; <it>S. castellii </it>orthologs (data not shown). For both mammalian and yeast complexes, the trends appear to be conserved using <it>dN/dS </it>ratios generated from a variety of ortholog-pairs with some exceptions.</p>
            <suppl id="S10">
               <title>
                  <p>Additional File 10</p>
               </title>
               <text>
                  <p><b>Protein complexes and dN/dS based on orthologs from a variety of species.</b> dN/dS ratios of genes based on human-dog, human-chimp, human-rat, S. cerevisiae-S. mikatae and S. cerevisiae-S. paradoxus orthologs are examined with respect to complex complexity and participation.</p>
               </text>
               <file name="1471-2164-9-629-S10.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>Related to <it>dN/dS </it>ratios is the gene conservation of orthologs of the proteins in complexes. Compared to <it>dN/dS </it>ratios, statistically significant differences in gene conservation are even more difficult to detect in closely related genomes. However, over large evolutionary distances we noticed that highly complex complexes tend to have conserved their subunits. For example, between yeast and human, yeast complexes with more than 60 subunits had more than 80% of their subunits also encoded in human. This was not observed in random complexes [Additional file <supplr sid="S11">11</supplr>]. Yeast complex proteins conserved in human also participated in a significantly higher number of complexes than those without a human ortholog (mean &#177; standard deviation/median complex participation of 8.0 &#177; 6.8/6.0 vs. 4.2 &#177; 4.3/3.0; MW, KS-test: P &lt; 10<sup>-70</sup>). A significant difference in complex participation was not observed for model 1 randomly generated complexes. These results concerning <it>dN/dS </it>ratios and gene conservation portrays similar relationships between gene evolution, complex complexity and participation at different time and constraint scales.</p>
            <suppl id="S11">
               <title>
                  <p>Additional File 11</p>
               </title>
               <text>
                  <p><b>Complexes and gene conservation.</b> The fraction of orthologs conserved in yeast and human complexes is examined against complex complexity.</p>
               </text>
               <file name="1471-2164-9-629-S11.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>Because our conclusions are based on a limited sample of complexes, we sought for extra datasets of protein complexes. The combination of the annotated MIPS yeast complexes with those that were predicted <abbrgrp><abbr bid="B25">25</abbr></abbrgrp> allowed us to test our hypotheses on a large set of complexes covering 5370 (88%) of the proteins encoded in the yeast proteome. We continued to observe a significant negative correlation between mean <it>dN/dS </it>with complex complexity and <it>dN/dS </it>with complex participation using such an extended complex dataset [Additional file <supplr sid="S12">12</supplr>].</p>
            <suppl id="S12">
               <title>
                  <p>Additional File 12</p>
               </title>
               <text>
                  <p><b>Extension and subsets of the protein complex data.</b> Extended yeast complexes, complexes with subcomplexes removed, nuclear and non-nuclear complexes are examined with respect to complex complexity and participation.</p>
               </text>
               <file name="1471-2164-9-629-S12.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>Often in a cell, complexes exist along side their subcomplexes. In our data, subcomplexes of complexes are present. If we repeated our analysis with subcomplexes removed, we still observed a significant negative correlation between mean <it>dN/dS </it>with complex complexity and <it>dN/dS </it>with complex participation [Additional file <supplr sid="S12">12</supplr>]. Similar trends were also observed when we considered nuclear localized and non-localized complexes separately [Additional file <supplr sid="S12">12</supplr>].</p>
            <p>As complexes are assembled or disassembled, the mean <it>dN/dS </it>ratio should fluctuate as proteins are added or subtracted from the complex. Nevertheless, there also seems to be an asymptotic bound for mean <it>dN/dS </it>ratios as complex complexity increases and <it>dN/dS </it>ratios as complex participation increases. The conserved trends we observe may be a reflection of these bounds. We find that genes associated with our human complexes which are considered essential (see Methods) tend to have lower <it>dN/dS </it>ratios (computed by human-mouse orthologs) and encode proteins that participate in more complexes (MW, KS-test: P &lt; 0.01) compared with all genes in the human complexes. We see the same significant trend for yeast (<it>dN/dS </it>ratios computed with <it>S. cerevisiae </it>&#8211; <it>S. paradoxus </it>orthologs). These results suggest that for proteins participating in increasing number of complexes, lower <it>dN/dS </it>ratios tend to be associated with purifying selection to maintain organism fitness. Essential <it>S. cerevisiae </it>complex proteins tend to be found in complexes with more unique subunits (MW, KS-test: P &lt; 0.05) compared to other proteins in the yeast complex data. However, such a trend was not observed for human possibly because a significant number of proteins which contribute to complex complexity are not known to be essential. We conclude that there is strong evidence of non-random association between <it>dN/dS </it>ratios of genes and complexes of their protein products.</p>
            <p>The finding that the number of protein-protein interactions positively correlates with the level of conservation of orthologs between species <abbrgrp><abbr bid="B64">64</abbr><abbr bid="B65">65</abbr></abbrgrp> is similar to our finding that highly complex complexes tend to conserve their orthologs. Previously, increased gene conservation has been correlated with lower evolutionary rate <abbrgrp><abbr bid="B66">66</abbr></abbrgrp>. We have found that highly complex complexes tend to conserve their orthologs and have lower <it>dN/dS </it>ratios, in agreement with these results.</p>
            <p>In summary, we observed that the mean <it>dN/dS </it>ratios of proteins in the collected complexes tend to decrease with increasing complex complexity. There seem to be at least two major phenomena associated with this observation:</p>
            <p>1) The skewed distribution of <it>dN/dS </it>ratios amongst genes as depicted in Figure <figr fid="F3">3B</figr>. In particular, as complex complexity increases, the mean <it>dN/dS </it>ratios of proteins in complexes tend to stabilize towards the mean of this skewed distribution.</p>
            <p>2) increased selective pressure on proteins involved in the organization and function of more complex complexes</p>
            <p>The median of the mouse <it>dN/dS </it>values (Figure <figr fid="F3">3B</figr>) is 0.08 which is less than the mean of 0.1. When we plotted Figure <figr fid="F3">3D</figr> and related supplements using median <it>dN/dS </it>values instead of the mean, we also found the median <it>dN/dS </it>decreased significantly with increasing number of unique subunits. Such a trend was consistently found when human-mouse, human-dog, human-rat, <it>S. cerevisiae </it>&#8211; <it>S. paradoxus </it>and <it>S. cerevisiae </it>&#8211; <it>S. mikatae dN/dS </it>median values were used (for all plots, t-test: P &lt; 7.1 &#215; 10<sup>-7</sup>; selected plots are shown in the additional files [Additional file <supplr sid="S13">13</supplr>]).</p>
            <suppl id="S13">
               <title>
                  <p>Additional File 13</p>
               </title>
               <text>
                  <p><b>Analysis of protein complex data using the median.</b> Analysis of protein complex data with respect to mean dN/dS ratios and sequence length is compared with analysis using the median.</p>
               </text>
               <file name="1471-2164-9-629-S13.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>Thus, for the complex data available, we observed that both the mean and median <it>dN/dS </it>ratios of genes negatively correlates with the complex complexity.</p>
         </sec>
         <sec>
            <st>
               <p>Homogeneity of Protein and Gene Properties</p>
            </st>
            <p>Next, we examined similarities between proteins within mammalian protein complexes (Table <tblr tid="T1">1</tblr>). Although not necessarily similar to physiological pI, our predicted pI values reflect sequence properties which may be of some utility. We ask whether subunits in complexes tend to have greater homogeneity than expected in terms of predicted pI values. Considering complexes of 3 or more unique proteins, we found that the standard deviations in protein pI are significantly lower in the annotated complexes compared to those in model 1 random complexes. Thus, the pI of a protein can be a feature which may be useful in predicting whether the protein belongs to a particular complex or not. The need for subunits to co-localize <abbrgrp><abbr bid="B67">67</abbr></abbrgrp> and the presence of highly sequence similar paralogs in complexes <abbrgrp><abbr bid="B68">68</abbr></abbrgrp> should be contributing factors to our observation of lower than expected pI deviation between complex proteins.</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Homogeneity of protein properties in mammalian complexes of 3 or more proteins.</p>
               </caption>
               <tblbdy cols="4">
                  <r>
                     <c ca="center">
                        <p>Protein Complex Data</p>
                     </c>
                     <c ca="center">
                        <p>Property</p>
                     </c>
                     <c ca="center">
                        <p>Mean Stdev. Annotated</p>
                     </c>
                     <c ca="center">
                        <p>Mean Stdev. Random</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>All mammalian</p>
                     </c>
                     <c ca="center">
                        <p>pI</p>
                     </c>
                     <c ca="center">
                        <p>1.5 &#177; 0.7 (1.5)</p>
                     </c>
                     <c ca="center">
                        <p>1.8 &#177; 0.7 (1.8)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>All mammalian</p>
                     </c>
                     <c ca="center">
                        <p>% Helix</p>
                     </c>
                     <c ca="center">
                        <p>14.4 &#177; 7.8 (13.5)</p>
                     </c>
                     <c ca="center">
                        <p>18.6 &#177; 7.5 (18.6)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>All mammalian</p>
                     </c>
                     <c ca="center">
                        <p>% Sheet</p>
                     </c>
                     <c ca="center">
                        <p>9.5 &#177; 5.9 (8.7)</p>
                     </c>
                     <c ca="center">
                        <p>10.9 &#177; 5.4 (10.3)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>All mammalian</p>
                     </c>
                     <c ca="center">
                        <p>% Coil</p>
                     </c>
                     <c ca="center">
                        <p>10.3 &#177; 5.0 (9.8)</p>
                     </c>
                     <c ca="center">
                        <p>13.3 &#177; 5.6 (13)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>Human (against mouse)</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>dN/dS</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0.07 &#177; 0.05 (0.06)</p>
                     </c>
                     <c ca="center">
                        <p>0.09 &#177; 0.06 (0.08)</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>The standard deviations of protein property values for each annotated complex are significantly smaller than ones for model 1 random complexes (MC-test using 1000 complexes generated randomly with replacement: P &lt; 0.001). The means &#177; standard deviation of these standard deviations for each property are shown in the last two columns along with median values (in parentheses).</p>
               </tblfn>
            </tbl>
            <p>The common presence of paralogs in complexes and the correlation between secondary structure and localization <abbrgrp><abbr bid="B69">69</abbr></abbrgrp> also contributes to explaining why we observed significantly lower than expected deviations of secondary structure content (percent helix, sheet and coil) in proteins belonging to the annotated complexes versus those in random complexes.</p>
            <p>Similar to protein properties, we also found that the <it>dN/dS </it>ratio of genes associated with annotated human complexes are significantly more homogeneous compared with those from randomly generated complexes. Some examples of complexes with very low deviation of <it>dN/dS </it>values include Ubiquitin E3 ligase [CORUM:386] and the MKK4-ARRB2-ASK1 complex [CORUM:1297] with a standard deviation of 0.0007 and 0.001, respectively. The complex with the highest observed <it>dN/dS </it>deviation of 0.34 is the DNA ligase IV-XRCC4-XLF complex [CORUM:359]. Significant differences between random and annotated complexes were also observed when the <it>dN/dS </it>ratio was computed with dog, rat, or chimp orthologs (data not shown). These observations agree with previous results providing evidence that yeast proteins belonging to the same functional module tend to have more similar evolutionary rates than those belonging to different modules <abbrgrp><abbr bid="B70">70</abbr></abbrgrp>. We observed similar results when we examined yeast complexes [Additional file <supplr sid="S14">14</supplr>] and when we generated model 2 random mammalian and yeast complexes (data not shown).</p>
            <suppl id="S14">
               <title>
                  <p>Additional File 14</p>
               </title>
               <text>
                  <p><b>Homogeneity of Protein Properties in Yeast Complexes.</b> Deviation in pI, secondary structure and evolutionary rate between proteins in annotated yeast complexes are compared to those in random complexes.</p>
               </text>
               <file name="1471-2164-9-629-S14.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>To conclude, we suggest that pI, secondary structure and <it>dN/dS </it>ratios can be used to help predict the probability that a protein belongs to a particular complex. We did not observe a significant difference in standard deviations of protein length between proteins belonging to annotated versus Model 1 random mammalian complexes. It may still prove useful for the separation between real and erroneous complexes when combined with other properties.</p>
         </sec>
         <sec>
            <st>
               <p>Comparison with pairwise protein interactions</p>
            </st>
            <p>The overlap between binary protein-protein and predicted domain-domain interactions with proteins in our complexes was assessed (Figure <figr fid="F4">4</figr>). On average, 57%, 46% and 71% of the proteins found in the complexes (of 3 or more proteins) can be explained by known binary protein-protein, predicted domain-domain or either type of interactions (see Methods), respectively. The entire annotated protein complement of 24%, 10%, and 29% of these complexes can be explained by binary, domain-domain or either type of interactions, respectively. In addition we find that 14% of binary protein-protein interactions can be explained by domain-domain interactions which is in the range of 4&#8211;19% identified by Schuster-Bockler &amp; Bateman <abbrgrp><abbr bid="B71">71</abbr></abbrgrp>.</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Coverage by binary domain and protein interactions</p>
               </caption>
               <text>
                  <p><b>Coverage by binary domain and protein interactions</b>. Coverage is indicated by values in the Venn diagrams. Example: A) Protein content coverage. 71% of the proteins in our complexes with 3 or more unique proteins can be explained by either domain-domain or binary protein interactions. The full protein content of 29% of these complexes can be explained by either interaction-type. 14% of binary ppi can be explained by predicted domain-domain interactions. B) Interaction coverage. 5% of IntAct binary interactions could be explained from predicted domain-domain interactions. 77% of solved protein-protein contacts in our complexes of known structure with 3 or more unique proteins can be explained by either domain-domain or binary protein interactions. All solved contacts in 52% of these complexes can likewise be explained by these interactions.</p>
               </text>
               <graphic file="1471-2164-9-629-4"/>
            </fig>
            <p>192 PDB structures are available for our complexes (103 of which consist of at least 3 different proteins). A large proportion of these structures are solved with protein fragments rather than the full-length proteins. Many of the interactions between peptides in these structures (see Methods) are supported by binary protein-protein interactions. The IntAct interaction set (excluding interactions derived only from NMR or X-ray diffraction) covered on average ~40% of detected interactions in a given complex containing PDB structure. Interactions in 34 (18%) PDB structures were fully explained by these IntAct binary interactions. A similar coverage (Figure <figr fid="F4">4B</figr>: 45% mean interaction coverage; 13% of complexes with all interactions fully explained) is provided by these IntAct binary interactions even if we consider only complexes with 3 or more distinct interacting peptides. In contrast, on average 53% of interactions in complexes with 3 or more distinct interacting proteins are explained by predicted domain-domain interactions. Predicted domain-domain interactions explain all interactions in about 25% of such complexes. Our results suggest that known protein-protein and domain-domain interactions can aid substantially in predicting interactions in our complex data. Many of these binary and domain-domain interaction defined protein pairs may be subcomplex precursors of the mammalian complexes which form during the course of assembly. Some of these subcomplex precursors might be functional complexes in current mammalian and ancestral organisms <abbrgrp><abbr bid="B62">62</abbr></abbrgrp>.</p>
            <p>Considering binary protein-protein interaction pairs in IntAct, those found in our complexes, and those derived from contacts in PDB structures associated with our mammalian complexes, we found that larger proteins tend to have larger length differences with their interacting partners (Figure <figr fid="F5">5</figr>, [Additional file <supplr sid="S15">15</supplr>]). For example, a large protein of length 5000 amino acids was more likely to be found interacting with a protein of ~1000 amino acids (a 4000 amino acid difference) rather than another protein of 5000 amino acids. However, a protein of length 300 amino acids often was found interacting with another protein of similar size. A number of reasons can explain this observation. First, the length distribution of the proteins is skewed such that relatively long proteins tend to be rare (Figure <figr fid="F2">2A</figr>). Second, on average shorter genes appear to be more abundantly expressed <abbrgrp><abbr bid="B72">72</abbr><abbr bid="B73">73</abbr></abbrgrp> than longer genes. Thus, relatively large proteins may have a greater chance to encounter shorter proteins rather than longer proteins. The observation that many complex complexes tend to be composed of proteins with a shorter mean length may also be related to this phenomenon since the evolution of large complexes may depend on how often and easy it is to bring together undamaged components. The relatively low <it>dN/dS </it>ratios of genes from highly complex complexes may also be associated with this phenomenon (Figure <figr fid="F3">3D</figr>). Interestingly, similar observations (fitting even better to the straight line) were made with random protein-protein interactions (generated by picking proteins in each interaction pair randomly with replacement) from the IntAct data (Figure <figr fid="F5">5B</figr>). The relative low abundance of relatively large proteins in both the real and random interaction data can explain the trends in Figure <figr fid="F5">5A&#8211;C</figr>. The differences between real (Figure <figr fid="F5">5A, C</figr>) and random (Figure <figr fid="F5">5B</figr>) plots might be attributed to historical, selective constraints or experimental error on certain protein-protein interactions. Binned plots of Figure <figr fid="F5">5A</figr> are found in [Additional file <supplr sid="S15">15</supplr>].</p>
            <suppl id="S15">
               <title>
                  <p>Additional File 15</p>
               </title>
               <text>
                  <p><b>Length difference of interacting proteins.</b> Large proteins tend to interact with much smaller partners.</p>
               </text>
               <file name="1471-2164-9-629-S15.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <fig id="F5">
               <title>
                  <p>Figure 5</p>
               </title>
               <caption>
                  <p>Large proteins tend to interact with relatively smaller partners</p>
               </caption>
               <text>
                  <p><b>Large proteins tend to interact with relatively smaller partners</b>. For each protein pair of different proteins, the length of the larger protein (protein1) is plotted on the x-axis. A,B,C) The difference in length with its partner (protein2) is plotted on y-axis. Larger proteins tend to have a larger length difference with their partners compared to proteins of smaller size. We see this trend amongst A) IntAct binary protein-protein interactions and B) Random binary interactions generated from the IntAct data C) binary interactions mapped onto all collected mammalian complexes. For all plots A-C, the trends are significant (t-test: P &lt; 0.001).</p>
               </text>
               <graphic file="1471-2164-9-629-5"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Explaining evolutionary rate</p>
            </st>
            <p>In this work, we have hinted at various explanations such as the ease of complex assembly to reason why more complex complexity and participation negatively correlates with our measures of evolutionary rate. We believe that these explanations are contributing factors but clearly a systems approach <abbrgrp><abbr bid="B74">74</abbr></abbrgrp> is warranted. The ability of a protein to change sequence is related to the mutability of its encoding gene, its subsequent expression, the consequences of errors in the gene's products which is related to the magnitude of expression and finally the degradation of those products. Fitness effects for the individual and the population under historical environmental constraints needs to be taken into account to completely understand why certain sequences have been transmitted for millions of years of evolution. A challenge is to uncover which factors are more important than others in explaining evolutionary rate <abbrgrp><abbr bid="B75">75</abbr><abbr bid="B76">76</abbr><abbr bid="B77">77</abbr></abbrgrp>. Factors associated with proteins early in their expression such as transcription and translation <abbrgrp><abbr bid="B78">78</abbr></abbrgrp> error rate or more general factors such as protein abundance would affect the evolutionary rate of all proteins. However, factors which are related to later events in a protein's life cycle such as functional molecular interactions will likely explain evolutionary rate differently for different types of proteins. For example, transcription factors which bind DNA will have sequences constrained by the need to bind DNA. Such constraints would be absent for those proteins that do not bind DNA. If shorter proteins are more abundantly expressed, and more complex complexes tend to contain smaller proteins, higher expression of smaller proteins in more complex complexes could help explain our observations of lower dN/dS ratios. While expression appears to be important, the functional and non-functional <abbrgrp><abbr bid="B79">79</abbr></abbrgrp> interactions of the protein and its precursors with other proteins <abbrgrp><abbr bid="B7">7</abbr><abbr bid="B80">80</abbr></abbrgrp> or molecules most likely play a major role in defining the protein's relation to organism fitness. It can be very challenging relating evolutionary rate to these different factors, especially when some of these factors are measured with substantial noise or are unknown <abbrgrp><abbr bid="B81">81</abbr><abbr bid="B82">82</abbr></abbrgrp>. While the processes leading up to complex assembly can help explain protein evolutionary rate, there may be factors not directly related to complex formation yet to be fully accounted for. Some progress has been made in teasing apart contributions to evolutionary rate <abbrgrp><abbr bid="B83">83</abbr></abbrgrp>.</p>
            <p>Part of the reason why deriving mechanisms explaining evolutionary rate has captured so much interest is because such data is readily available from comparative genomics. However, without knowing mechanisms explaining evolutionary rate values, its significance and the utility of associated information becomes limited. In particular, its relation to protein function and disease needs to be worked out. By combining other information such as those derived from complexes, one might gain a deeper insight. For example, just knowing whether a protein complex contains a certain number of proteins or whether a protein belongs to a certain number of complexes may significantly help us predict its relation to certain fitness effects and future diseases, given information on its evolutionary rate. It has also been observed by many that proteins related to genetic diseases in OMIM <abbrgrp><abbr bid="B84">84</abbr></abbrgrp> tend to be relatively long <abbrgrp><abbr bid="B85">85</abbr><abbr bid="B86">86</abbr></abbrgrp> and it might be interesting to work out how this relates to specific sequences and structural features in the complexes.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>In conclusion, we have found relations and trends between the <it>dN/dS </it>ratio, primary sequence properties, secondary structure, complex complexity, participation and localization using large samples of protein complexes derived under certain distributions of conditions. There is a large evolutionary distance between yeast and mammals. Protein complexes and their subunits are not necessarily conserved between distant species <abbrgrp><abbr bid="B87">87</abbr></abbrgrp>. The different environments which mammals and yeast occupy may have produced different evolutionary pressure on the protein complexes. Despite these differences, many of our observations appear to be conserved for the mammalian and yeast complex data that we have. We suggest that our observations have been significantly influenced by constraints during the evolution of the complexes. Because of these constraints, numerical boundaries were discovered when we related properties such as protein length to complex complexity. Proteins at these property value boundaries are interesting because they are exceptional and possibly point to unusual pressures or homeostatic adaptations that allow for their presence in cells. For example, by studying highly complex protein complexes composed of very large proteins, one might uncover new mechanisms that allow for their assembly and the assembly of later evolved proteins. We also observed that random phenomena (as in neutral drift) from skewed origins can appear highly stable when averaged over large numbers (Ex. Figure <figr fid="F2">2B, D</figr>; Figure <figr fid="F5">5B</figr>). Compared to randomly generated phenomena, biologically-derived characteristics can appear less structured despite these circumstances (Ex. Figure <figr fid="F2">2C</figr>, Figure <figr fid="F5">5A</figr>). Our focus in this study is mainly on information about the presence of certain protein complexes. Once data on the abundance, stoichiometry and dynamics of mammalian protein and protein complexes become available on a large scale, one can obtain other views.</p>
      </sec>
      <sec>
         <st>
            <p>Competing interests</p>
         </st>
         <p>The authors declare that they have no competing interests.</p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>AH, SA, PW, MO organized the complex data. AK provided secondary structure predictions. NS and PP provided the protein interaction data. PS provided PDB contact data. PW, SA, AH, BG, PP, FB performed analysis. PS, AR, AK, TS, PP, FT, DF supervised the research process and manuscript preparation. All authors read and approved the final manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>The work was funded by the BioSapiens Network of Excellence (grant number LHSG-CT-2003-503265). We thank John Parsch for comments, Gabi Kastenmueller for help with BioRS, Brigitte Waegele for the complex data, Michael Telgkamp for figure preparation, Alexei Antonov and Werner Mewes for insightful discussion and emails. We also thank the anonymous reviewers.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Controlling oligomerization of pharmaceutical proteins</p>
            </title>
            <aug>
               <au>
                  <snm>Schein</snm>
                  <fnm>CH</fnm>
               </au>
            </aug>
            <source>Pharm Acta Helv</source>
            <pubdate>1994</pubdate>
            <volume>69</volume>
            <fpage>119</fpage>
            <lpage>126</lpage>
            <xrefbib>
               <pubid idtype="pmpid">7846082</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>Protein oligomerization: how and why</p>
            </title>
            <aug>
               <au>
                  <snm>Ali</snm>
                  <fnm>MH</fnm>
               </au>
               <au>
                  <snm>Imperiali</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Bioorg Med Chem</source>
            <pubdate>2005</pubdate>
            <volume>13</volume>
            <fpage>5013</fpage>
            <lpage>5020</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15993087</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Parkinson's disease brain mitochondrial complex I has oxidatively damaged subunits and is functionally impaired and misassembled</p>
            </title>
            <aug>
               <au>
                  <snm>Keeney</snm>
                  <fnm>PM</fnm>
               </au>
               <au>
                  <snm>Xie</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Capaldi</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Bennett</snm>
                  <fnm>JP</fnm>
                  <suf>Jr</suf>
               </au>
            </aug>
            <source>J Neurosci</source>
            <pubdate>2006</pubdate>
            <volume>26</volume>
            <fpage>5256</fpage>
            <lpage>5264</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">16687518</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>FOXP3 is a homo-oligomer and a component of a supramolecular regulatory complex disabled in the human XLAAD/IPEX autoimmune disease</p>
            </title>
            <aug>
               <au>
                  <snm>Li</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Samanta</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Song</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Iacono</snm>
                  <fnm>KT</fnm>
               </au>
               <au>
                  <snm>Brennan</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Chatila</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Roncador</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Banham</snm>
                  <fnm>AH</fnm>
               </au>
               <au>
                  <snm>Riley</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Shen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Saouaf</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Greene</snm>
                  <fnm>MI</fnm>
               </au>
            </aug>
            <source>Int Immunol</source>
            <pubdate>2007</pubdate>
            <volume>19</volume>
            <fpage>825</fpage>
            <lpage>835</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17586580</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Structure analysis of BMP-2 type I receptor complexes reveals a mechanism of receptor inactivation in juvenile polyposis syndrome</p>
            </title>
            <aug>
               <au>
                  <snm>Kotzsch</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Nickel</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Seher</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Heinecke</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>van Geersdaele</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Herrmann</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Sebald</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Mueller</snm>
                  <fnm>TD</fnm>
               </au>
            </aug>
            <source>J Biol Chem</source>
            <pubdate>2007</pubdate>
            <volume>283</volume>
            <fpage>5876</fpage>
            <lpage>5887</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18160401</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Modularity and evolutionary constraint on proteins</p>
            </title>
            <aug>
               <au>
                  <snm>Fraser</snm>
                  <fnm>HB</fnm>
               </au>
            </aug>
            <source>Nat Genet</source>
            <pubdate>2005</pubdate>
            <volume>37</volume>
            <fpage>351</fpage>
            <lpage>352</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15750592</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Relating three-dimensional structures to protein networks provides evolutionary insights</p>
            </title>
            <aug>
               <au>
                  <snm>Kim</snm>
                  <fnm>PM</fnm>
               </au>
               <au>
                  <snm>Lu</snm>
                  <fnm>LJ</fnm>
               </au>
               <au>
                  <snm>Xia</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Gerstein</snm>
                  <fnm>MB</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2006</pubdate>
            <volume>314</volume>
            <fpage>1938</fpage>
            <lpage>1941</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17185604</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Quaternary structure constraints on evolutionary sequence divergence</p>
            </title>
            <aug>
               <au>
                  <snm>Fornasari</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Parisi</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Echave</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2007</pubdate>
            <volume>24</volume>
            <fpage>349</fpage>
            <lpage>351</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17124181</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>CORUM: the comprehensive resource of mammalian protein complexes</p>
            </title>
            <aug>
               <au>
                  <snm>Ruepp</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Brauner</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Dunger-Kaltenbach</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Frishman</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Montrone</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Stransky</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Waegele</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Schmidt</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Noubibou Doudieu</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Stuempflen</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Mewes</snm>
                  <fnm>HW</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2008</pubdate>
            <volume>36</volume>
            <fpage>D646</fpage>
            <lpage>D650</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2238909</pubid>
                  <pubid idtype="pmpid" link="fulltext">17965090</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>Human protein reference database&#8211;2006 update</p>
            </title>
            <aug>
               <au>
                  <snm>Mishra</snm>
                  <fnm>GR</fnm>
               </au>
               <au>
                  <snm>Suresh</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kumaran</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Kannabiran</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Suresh</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Bala</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Shivakumar</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Anuradha</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Reddy</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Raghavan</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>Menon</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Hanumanthu</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Gupta</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Upendran</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Gupta</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Mahesh</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Jacob</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Mathew</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Chatterjee</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Arun</snm>
                  <fnm>KS</fnm>
               </au>
               <au>
                  <snm>Sharma</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Chandrika</snm>
                  <fnm>KN</fnm>
               </au>
               <au>
                  <snm>Deshpande</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Palvankar</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Raghavnath</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Krishnakanth</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Karathia</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Rekha</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Nayak</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Vishnupriya</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Kumar</snm>
                  <fnm>HG</fnm>
               </au>
               <au>
                  <snm>Nagini</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kumar</snm>
                  <fnm>GS</fnm>
               </au>
               <au>
                  <snm>Jose</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Deepthi</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Mohan</snm>
                  <fnm>SS</fnm>
               </au>
               <au>
                  <snm>Gandhi</snm>
                  <fnm>TK</fnm>
               </au>
               <au>
                  <snm>Harsha</snm>
                  <fnm>HC</fnm>
               </au>
               <au>
                  <snm>Deshpande</snm>
                  <fnm>KS</fnm>
               </au>
               <au>
                  <snm>Sarker</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Prasad</snm>
                  <fnm>TS</fnm>
               </au>
               <au>
                  <snm>Pandey</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2006</pubdate>
            <volume>34</volume>
            <fpage>D411</fpage>
            <lpage>414</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1347503</pubid>
                  <pubid idtype="pmpid" link="fulltext">16381900</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>The Biomolecular Interaction Network Database and related tools 2005 update</p>
            </title>
            <aug>
               <au>
                  <snm>Alfarano</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Andrade</snm>
                  <fnm>CE</fnm>
               </au>
               <au>
                  <snm>Anthony</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Bahroos</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Bajec</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Bantoft</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Betel</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Bobechko</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Boutilier</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Burgess</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Buzadzija</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Cavero</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>D'Abreo</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Donaldson</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Dorairajoo</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Dumontier</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Dumontier</snm>
                  <fnm>MR</fnm>
               </au>
               <au>
                  <snm>Earles</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Farrall</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Feldman</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Garderman</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Gong</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Gonzaga</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Grytsan</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Gryz</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Gu</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Haldorsen</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Halupa</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Haw</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Hrvojic</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Hurrell</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Isserlin</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Jack</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Juma</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Khan</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Kon</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Konopinsky</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Le</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Ling</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Magidin</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Moniakis</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Montojo</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Moore</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Muskat</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Ng</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Paraiso</snm>
                  <fnm>JP</fnm>
               </au>
               <au>
                  <snm>Parker</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Pintilie</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Pirone</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Salama</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Sgro</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Shan</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Shu</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Siew</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Skinner</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Snyder</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Stasiuk</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Strumpf</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Tuekam</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Tao</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Willis</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Wolting</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wong</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Wrong</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Xin</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Yao</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Yates</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Pawson</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Ouellette</snm>
                  <fnm>BF</fnm>
               </au>
               <au>
                  <snm>Hogue</snm>
                  <fnm>CW</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2005</pubdate>
            <volume>33</volume>
            <fpage>D418</fpage>
            <lpage>D424</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">540005</pubid>
                  <pubid idtype="pmpid" link="fulltext">15608229</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Structural disorder promotes assembly of protein complexes</p>
            </title>
            <aug>
               <au>
                  <snm>Hegyi</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Schad</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Tompa</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>BMC Struct Biol</source>
            <pubdate>2007</pubdate>
            <volume>7</volume>
            <fpage>65</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2194777</pubid>
                  <pubid idtype="pmpid" link="fulltext">17922903</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Natural selection against protein aggregation on self-interacting and essential proteins in yeast, fly and worm</p>
            </title>
            <aug>
               <au>
                  <snm>Chen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Dokholyan</snm>
                  <fnm>NV</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2008</pubdate>
            <volume>25</volume>
            <issue>8</issue>
            <fpage>1530</fpage>
            <lpage>1533</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18503047</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>An automated method for finding molecular complexes in large protein interaction networks</p>
            </title>
            <aug>
               <au>
                  <snm>Bader</snm>
                  <fnm>GD</fnm>
               </au>
               <au>
                  <snm>Hogue</snm>
                  <fnm>CW</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2003</pubdate>
            <volume>4</volume>
            <fpage>2</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">149346</pubid>
                  <pubid idtype="pmpid" link="fulltext">12525261</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Predicting co-complexed protein pairs using genomic and proteomic data integration</p>
            </title>
            <aug>
               <au>
                  <snm>Zhang</snm>
                  <fnm>LV</fnm>
               </au>
               <au>
                  <snm>Wong</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>King</snm>
                  <fnm>OD</fnm>
               </au>
               <au>
                  <snm>Roth</snm>
                  <fnm>FP</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2004</pubdate>
            <volume>5</volume>
            <fpage>38</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">419405</pubid>
                  <pubid idtype="pmpid" link="fulltext">15090078</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Protein complex prediction via cost-based clustering</p>
            </title>
            <aug>
               <au>
                  <snm>King</snm>
                  <fnm>AD</fnm>
               </au>
               <au>
                  <snm>Przulj</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Jurisica</snm>
                  <fnm>I</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2004</pubdate>
            <volume>20</volume>
            <fpage>3013</fpage>
            <lpage>3020</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15180928</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Development and implementation of an algorithm for detection of protein complexes in large interaction networks</p>
            </title>
            <aug>
               <au>
                  <snm>Altaf-Ul-Amin</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Shinbo</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Mihara</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Kurokawa</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Kanaya</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <fpage>207</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1473204</pubid>
                  <pubid idtype="pmpid" link="fulltext">16613608</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Using indirect protein interactions for the prediction of Gene Ontology functions</p>
            </title>
            <aug>
               <au>
                  <snm>Chua</snm>
                  <fnm>HN</fnm>
               </au>
               <au>
                  <snm>Sung</snm>
                  <fnm>WK</fnm>
               </au>
               <au>
                  <snm>Wong</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <issue>Suppl 4</issue>
            <fpage>S8</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1892087</pubid>
                  <pubid idtype="pmpid" link="fulltext">17570151</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Discovering protein complexes in dense reliable neighborhoods of protein interaction networks</p>
            </title>
            <aug>
               <au>
                  <snm>Li</snm>
                  <fnm>XL</fnm>
               </au>
               <au>
                  <snm>Foo</snm>
                  <fnm>CS</fnm>
               </au>
               <au>
                  <snm>Ng</snm>
                  <fnm>SK</fnm>
               </au>
            </aug>
            <source>Comput Syst Bioinformatics Conf</source>
            <pubdate>2007</pubdate>
            <volume>6</volume>
            <fpage>157</fpage>
            <lpage>168</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17951821</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Identification of conserved protein complexes based on a model of protein network evolution</p>
            </title>
            <aug>
               <au>
                  <snm>Hirsh</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Sharan</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2007</pubdate>
            <volume>23</volume>
            <fpage>e170</fpage>
            <lpage>176</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17237088</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>A human phenome-interactome network of protein complexes implicated in genetic disorders</p>
            </title>
            <aug>
               <au>
                  <snm>Lage</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Karlberg</snm>
                  <fnm>EO</fnm>
               </au>
               <au>
                  <snm>Storling</snm>
                  <fnm>ZM</fnm>
               </au>
               <au>
                  <snm>Olason</snm>
                  <fnm>PI</fnm>
               </au>
               <au>
                  <snm>Pedersen</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Rigina</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Hinsby</snm>
                  <fnm>AM</fnm>
               </au>
               <au>
                  <snm>Tumer</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Pociot</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Tommerup</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Moreau</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Brunak</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Nat Biotechnol</source>
            <pubdate>2007</pubdate>
            <volume>25</volume>
            <fpage>309</fpage>
            <lpage>316</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17344885</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Using protein complexes to predict phenotypic effects of gene mutation</p>
            </title>
            <aug>
               <au>
                  <snm>Fraser</snm>
                  <fnm>HB</fnm>
               </au>
               <au>
                  <snm>Plotkin</snm>
                  <fnm>JB</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <fpage>R252</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2258176</pubid>
                  <pubid idtype="pmpid" link="fulltext">18042286</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>From pull-down data to protein interaction networks and complexes with biological relevance</p>
            </title>
            <aug>
               <au>
                  <snm>Zhang</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>BH</fnm>
               </au>
               <au>
                  <snm>Karpinets</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Samatova</snm>
                  <fnm>NF</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2008</pubdate>
            <volume>24</volume>
            <fpage>979</fpage>
            <lpage>986</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18304937</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Predicting co-complexed protein pairs from heterogeneous data</p>
            </title>
            <aug>
               <au>
                  <snm>Qiu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Noble</snm>
                  <fnm>WS</fnm>
               </au>
            </aug>
            <source>PLoS Comput Biol</source>
            <pubdate>2008</pubdate>
            <volume>4</volume>
            <fpage>e1000054</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2275314</pubid>
                  <pubid idtype="pmpid" link="fulltext">18421371</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>Bootstrapping the Interactome: Unsupervised Identification of Protein Complexes in Yeast</p>
            </title>
            <aug>
               <au>
                  <snm>Friedel</snm>
                  <fnm>CC</fnm>
               </au>
               <au>
                  <snm>Krumsiek</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zimmer</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>RECOMB</source>
            <pubdate>2008</pubdate>
            <volume>4955</volume>
            <fpage>3</fpage>
            <lpage>16</lpage>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Characterization and prediction of protein-protein interactions within and between complexes</p>
            </title>
            <aug>
               <au>
                  <snm>Sprinzak</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Altuvia</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Margalit</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2006</pubdate>
            <volume>103</volume>
            <fpage>14718</fpage>
            <lpage>14723</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1595418</pubid>
                  <pubid idtype="pmpid" link="fulltext">17003128</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>MIPS: analysis and annotation of proteins from whole genomes in 2005</p>
            </title>
            <aug>
               <au>
                  <snm>Mewes</snm>
                  <fnm>HW</fnm>
               </au>
               <au>
                  <snm>Frishman</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Mayer</snm>
                  <fnm>KF</fnm>
               </au>
               <au>
                  <snm>Munsterkotter</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Noubibou</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Pagel</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Rattei</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Oesterheld</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Ruepp</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Stumpflen</snm>
                  <fnm>V</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2006</pubdate>
            <volume>34</volume>
            <fpage>D169</fpage>
            <lpage>D172</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1347510</pubid>
                  <pubid idtype="pmpid" link="fulltext">16381839</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>CYGD: the Comprehensive Yeast Genome Database</p>
            </title>
            <aug>
               <au>
                  <snm>G&#252;ldener</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>M&#252;nsterk&#246;tter</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kastenm&#252;ller</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Strack</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>van Helden</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lemer</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Richelles</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wodak</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Garc&#237;a-Mart&#237;nez</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>P&#233;rez-Ort&#237;n</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Michael</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Kaps</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Talla</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Dujon</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Andr&#233;</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Souciet</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>De Montigny</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Bon</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Gaillardin</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Mewes</snm>
                  <fnm>HW</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2005</pubdate>
            <volume>33</volume>
            <fpage>D364</fpage>
            <lpage>D368</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">540007</pubid>
                  <pubid idtype="pmpid" link="fulltext">15608217</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>The Database of Interacting Proteins: 2004 update</p>
            </title>
            <aug>
               <au>
                  <snm>Salwinski</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>CS</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>AJ</fnm>
               </au>
               <au>
                  <snm>Pettit</snm>
                  <fnm>FK</fnm>
               </au>
               <au>
                  <snm>Bowie</snm>
                  <fnm>JU</fnm>
               </au>
               <au>
                  <snm>Eisenberg</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2004</pubdate>
            <volume>32</volume>
            <fpage>D449</fpage>
            <lpage>D451</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">308820</pubid>
                  <pubid idtype="pmpid" link="fulltext">14681454</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>MINT: the Molecular INTeraction database</p>
            </title>
            <aug>
               <au>
                  <snm>Chatraryamontri</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Ceol</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Palazzi</snm>
                  <fnm>LM</fnm>
               </au>
               <au>
                  <snm>Nardelli</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Schneider</snm>
                  <fnm>MV</fnm>
               </au>
               <au>
                  <snm>Castagnoli</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Cesareni</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2007</pubdate>
            <volume>35</volume>
            <fpage>D572</fpage>
            <lpage>D574</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1751541</pubid>
                  <pubid idtype="pmpid" link="fulltext">17135203</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>MPact: the MIPS protein interaction resource on yeast</p>
            </title>
            <aug>
               <au>
                  <snm>G&#252;ldener</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>M&#252;nsterk&#246;tter</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Oesterheld</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Pagel</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Ruepp</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mewes</snm>
                  <fnm>HW</fnm>
               </au>
               <au>
                  <snm>St&#252;mpflen</snm>
                  <fnm>V</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2006</pubdate>
            <volume>34</volume>
            <fpage>D436</fpage>
            <lpage>D441</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1347366</pubid>
                  <pubid idtype="pmpid" link="fulltext">16381906</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>The MIPS mammalian protein-protein interaction database</p>
            </title>
            <aug>
               <au>
                  <snm>Pagel</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Kovac</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Oesterheld</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Brauner</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Dunger-Kaltenbach</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Frishman</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Montrone</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Mark</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Stuempflen</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Mewes</snm>
                  <fnm>HW</fnm>
               </au>
               <au>
                  <snm>Ruepp</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Frishman</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2005</pubdate>
            <volume>21</volume>
            <fpage>832</fpage>
            <lpage>834</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15531608</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>IntAct&#8211;open source resource for molecular interaction data</p>
            </title>
            <aug>
               <au>
                  <snm>Kerrien</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Alam-Faruque</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Aranda</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Bancarz</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Bridge</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Derow</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Dimmer</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Feuermann</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Friedrichsen</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Huntley</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Kohler</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Khadake</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Leroy</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Liban</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lieftink</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Montecchi-Palazzi</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Orchard</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Risse</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Robbe</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Roechert</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Thorneycroft</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Apweiler</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Hermjakob</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2007</pubdate>
            <volume>35</volume>
            <fpage>D561</fpage>
            <lpage>D565</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1751531</pubid>
                  <pubid idtype="pmpid" link="fulltext">17145710</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p>iPfam: visualization of protein-protein interactions in PDB at domain and amino acid resolutions</p>
            </title>
            <aug>
               <au>
                  <snm>Finn</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Marshall</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Bateman</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2005</pubdate>
            <volume>21</volume>
            <fpage>410</fpage>
            <lpage>412</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15353450</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>3did: interacting protein domains of known three-dimensional structure</p>
            </title>
            <aug>
               <au>
                  <snm>Stein</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Russell</snm>
                  <fnm>RB</fnm>
               </au>
               <au>
                  <snm>Aloy</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2005</pubdate>
            <volume>33</volume>
            <fpage>D413</fpage>
            <lpage>D417</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">539991</pubid>
                  <pubid idtype="pmpid" link="fulltext">15608228</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>The Universal Protein Resource (UniProt)</p>
            </title>
            <aug>
               <au>
                  <cnm>The Uniprot Consortium</cnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2007</pubdate>
            <volume>35</volume>
            <fpage>D193</fpage>
            <lpage>D197</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1669721</pubid>
                  <pubid idtype="pmpid" link="fulltext">17142230</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Specificity and stability in topology of protein networks</p>
            </title>
            <aug>
               <au>
                  <snm>Maslov</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Sneppen</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2002</pubdate>
            <volume>296</volume>
            <fpage>910</fpage>
            <lpage>913</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11988575</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>Protein secondary structure prediction based on position-specific scoring matrices</p>
            </title>
            <aug>
               <au>
                  <snm>Jones</snm>
                  <fnm>DT</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>1999</pubdate>
            <volume>292</volume>
            <fpage>195</fpage>
            <lpage>202</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10493868</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>Improving the prediction of protein secondary structure in three and eight classes using recurrent neural networks and profiles</p>
            </title>
            <aug>
               <au>
                  <snm>Pollastri</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Przybylski</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Rost</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Baldi</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Proteins</source>
            <pubdate>2002</pubdate>
            <volume>47</volume>
            <fpage>228</fpage>
            <lpage>235</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11933069</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B40">
            <title>
               <p>Ensembl 2007</p>
            </title>
            <aug>
               <au>
                  <snm>Hubbard</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Aken</snm>
                  <fnm>BL</fnm>
               </au>
               <au>
                  <snm>Beal</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Ballester</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Caccamo</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Clarke</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Coates</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Cunningham</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Cutts</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Down</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Dyer</snm>
                  <fnm>SC</fnm>
               </au>
               <au>
                  <snm>Fitzgerald</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Fernandez-Banet</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Graf</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Haider</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Hammond</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Herrero</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Holland</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Howe</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Howe</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Johnson</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Kahari</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Keefe</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Kokocinski</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Kulesha</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Lawson</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Longden</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Melsopp</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Megy</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Meidl</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Ouverdin</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Parker</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Prlic</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Rice</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Rios</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Schuster</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Sealy</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Severin</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Slater</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Smedley</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Spudich</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Trevanion</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Vilella</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Vogel</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Wood</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Cox</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Curwen</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Durbin</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Fernandez-Suarez</snm>
                  <fnm>XM</fnm>
               </au>
               <au>
                  <snm>Flicek</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Kasprzyk</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Proctor</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Searle</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ureta-Vidal</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Birney</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2007</pubdate>
            <volume>35</volume>
            <fpage>D610</fpage>
            <lpage>D617</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1761443</pubid>
                  <pubid idtype="pmpid" link="fulltext">17148474</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>Natural history and evolutionary principles of gene duplication in fungi</p>
            </title>
            <aug>
               <au>
                  <snm>Wapinski</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Pfeffer</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Friedman</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Regev</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2007</pubdate>
            <volume>449</volume>
            <fpage>54</fpage>
            <lpage>61</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17805289</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B42">
            <title>
               <p>PAL2NAL: robust conversion of protein sequence alignments into the corresponding codon alignments</p>
            </title>
            <aug>
               <au>
                  <snm>Suyama</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Torrents</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Bork</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2006</pubdate>
            <volume>34</volume>
            <fpage>W609</fpage>
            <lpage>W612</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1538804</pubid>
                  <pubid idtype="pmpid" link="fulltext">16845082</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B43">
            <title>
               <p>PAML 4: phylogenetic analysis by maximum likelihood</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>Z</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2007</pubdate>
            <volume>24</volume>
            <issue>8</issue>
            <fpage>1586</fpage>
            <lpage>1591</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17483113</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B44">
            <title>
               <p>Adjusting for selection on synonymous sites in estimates of evolutionary distance</p>
            </title>
            <aug>
               <au>
                  <snm>Hirsh</snm>
                  <fnm>AE</fnm>
               </au>
               <au>
                  <snm>Fraser</snm>
                  <fnm>HB</fnm>
               </au>
               <au>
                  <snm>Wall</snm>
                  <fnm>DP</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2005</pubdate>
            <volume>22</volume>
            <fpage>174</fpage>
            <lpage>177</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15371530</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>Widespread positive selection in synonymous sites of mammalian genes</p>
            </title>
            <aug>
               <au>
                  <snm>Resch</snm>
                  <fnm>AM</fnm>
               </au>
               <au>
                  <snm>Carmel</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Mari&#241;o-Ram&#237;rez</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Ogurtsov</snm>
                  <fnm>AY</fnm>
               </au>
               <au>
                  <snm>Shabalina</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Rogozin</snm>
                  <fnm>IB</fnm>
               </au>
               <au>
                  <snm>Koonin</snm>
                  <fnm>EV</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2007</pubdate>
            <volume>24</volume>
            <fpage>1821</fpage>
            <lpage>1831</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2632937</pubid>
                  <pubid idtype="pmpid" link="fulltext">17522087</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B46">
            <title>
               <p>An Introduction to BioPerl</p>
            </title>
            <aug>
               <au>
                  <snm>Stajich</snm>
                  <fnm>JE</fnm>
               </au>
            </aug>
            <source>Methods Mol Biol</source>
            <pubdate>2007</pubdate>
            <volume>406</volume>
            <fpage>535</fpage>
            <lpage>48</lpage>
            <xrefbib>
               <pubid idtype="pmpid">18287711</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B47">
            <title>
               <p>Null mutations in human and mouse orthologs frequently result in different phenotypes</p>
            </title>
            <aug>
               <au>
                  <snm>Liao</snm>
                  <fnm>BY</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2008</pubdate>
            <volume>105</volume>
            <fpage>6987</fpage>
            <lpage>6992</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2383943</pubid>
                  <pubid idtype="pmpid" link="fulltext">18458337</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B48">
            <title>
               <p>Profiling essential genes in human mammary cells by multiplex RNAi screening</p>
            </title>
            <aug>
               <au>
                  <snm>Silva</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Marran</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Parker</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Silva</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Golding</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Schlabach</snm>
                  <fnm>MR</fnm>
               </au>
               <au>
                  <snm>Elledge</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Hannon</snm>
                  <fnm>GJ</fnm>
               </au>
               <au>
                  <snm>Chang</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2008</pubdate>
            <volume>319</volume>
            <fpage>617</fpage>
            <lpage>620</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18239125</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B49">
            <title>
               <p>PROMPT: a protein mapping and comparison tool</p>
            </title>
            <aug>
               <au>
                  <snm>Schmidt</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Frishman</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <fpage>331</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1569443</pubid>
                  <pubid idtype="pmpid" link="fulltext">16817977</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B50">
            <title>
               <p>Network biology: understanding the cell's functional organization</p>
            </title>
            <aug>
               <au>
                  <snm>Barabasi</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Oltvai</snm>
                  <fnm>ZN</fnm>
               </au>
            </aug>
            <source>Nat Rev Genet</source>
            <pubdate>2004</pubdate>
            <volume>5</volume>
            <fpage>101</fpage>
            <lpage>113</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">14735121</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B51">
            <title>
               <p>Subnets of scale-free networks are not scale-free: sampling properties of networks</p>
            </title>
            <aug>
               <au>
                  <snm>Stumpf</snm>
                  <fnm>MP</fnm>
               </au>
               <au>
                  <snm>Wiuf</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>May</snm>
                  <fnm>RM</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2005</pubdate>
            <volume>102</volume>
            <fpage>4221</fpage>
            <lpage>4224</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">555505</pubid>
                  <pubid idtype="pmpid" link="fulltext">15767579</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B52">
            <title>
               <p>Effect of sampling on topology predictions of protein-protein interaction networks</p>
            </title>
            <aug>
               <au>
                  <snm>Han</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Dupuy</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Bertin</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Cusick</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Vidal</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Nat Biotechnol</source>
            <pubdate>2005</pubdate>
            <volume>23</volume>
            <fpage>839</fpage>
            <lpage>844</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16003372</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B53">
            <title>
               <p>Physical and functional modularity of the protein network in yeast</p>
            </title>
            <aug>
               <au>
                  <snm>Wilhelm</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Nasheuer</snm>
                  <fnm>HP</fnm>
               </au>
               <au>
                  <snm>Huang</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Mol Cell Proteomics</source>
            <pubdate>2003</pubdate>
            <volume>2</volume>
            <fpage>292</fpage>
            <lpage>298</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16247890</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B54">
            <title>
               <p>Dynamic simulation of protein complex formation on a genomic scale</p>
            </title>
            <aug>
               <au>
                  <snm>Beyer</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Wilhelm</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2005</pubdate>
            <volume>21</volume>
            <fpage>1610</fpage>
            <lpage>1616</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15598828</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B55">
            <title>
               <p>The road to modularity</p>
            </title>
            <aug>
               <au>
                  <snm>Wagner</snm>
                  <fnm>GP</fnm>
               </au>
               <au>
                  <snm>Pavlicev</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Cheverud</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Nat Rev Genet</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <fpage>921</fpage>
            <lpage>931</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18007649</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B56">
            <title>
               <p>eSLDB: eukaryotic subcellular localization database</p>
            </title>
            <aug>
               <au>
                  <snm>Pierleoni</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Martelli</snm>
                  <fnm>PL</fnm>
               </au>
               <au>
                  <snm>Fariselli</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Casadio</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2007</pubdate>
            <volume>35</volume>
            <fpage>D208</fpage>
            <lpage>212</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1669738</pubid>
                  <pubid idtype="pmpid" link="fulltext">17108361</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B57">
            <title>
               <p>MitoP2: An Integrative Tool for the Analysis of the Mitochondrial Proteome</p>
            </title>
            <aug>
               <au>
                  <snm>Elstner</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Andreoli</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Ahting</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Tetko</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Klopstock</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Meitinger</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Prokisch</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Mol Biotechnol</source>
            <pubdate>2008</pubdate>
            <volume>40</volume>
            <fpage>306</fpage>
            <lpage>315</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18780189</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B58">
            <title>
               <p>From endosymbiont to host-controlled organelle: the hijacking of mitochondrial protein synthesis and metabolism</p>
            </title>
            <aug>
               <au>
                  <snm>Gabald&#243;n</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Huynen</snm>
                  <fnm>MA</fnm>
               </au>
            </aug>
            <source>PLoS Comput Biol</source>
            <pubdate>2007</pubdate>
            <volume>3</volume>
            <fpage>e219</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2062474</pubid>
                  <pubid idtype="pmpid" link="fulltext">17983265</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B59">
            <title>
               <p>Multiple pathways for sorting mitochondrial precursor proteins</p>
            </title>
            <aug>
               <au>
                  <snm>Bolender</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Sickmann</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Wagner</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Meisinger</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Pfanner</snm>
                  <fnm>N</fnm>
               </au>
            </aug>
            <source>EMBO Rep</source>
            <pubdate>2008</pubdate>
            <volume>9</volume>
            <fpage>42</fpage>
            <lpage>9</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2246611</pubid>
                  <pubid idtype="pmpid" link="fulltext">18174896</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B60">
            <title>
               <p>Mitochondrial protein quality control: Implications in ageing</p>
            </title>
            <aug>
               <au>
                  <snm>Friguet</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Bulteau</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Petropoulos</snm>
                  <fnm>I</fnm>
               </au>
            </aug>
            <source>Biotechnol J</source>
            <pubdate>2008</pubdate>
            <volume>3</volume>
            <fpage>757</fpage>
            <lpage>764</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18446870</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B61">
            <title>
               <p>Estimation of diffusion coefficients of proteins</p>
            </title>
            <aug>
               <au>
                  <snm>Young</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Carroad</snm>
                  <fnm>PAL</fnm>
               </au>
               <au>
                  <snm>Bell</snm>
                  <fnm>RL</fnm>
               </au>
            </aug>
            <source>Biotechnology and Bioengineering</source>
            <pubdate>1980</pubdate>
            <volume>22</volume>
            <fpage>947</fpage>
            <lpage>955</lpage>
         </bibl>
         <bibl id="B62">
            <title>
               <p>Assembly reflects evolution of protein complexes</p>
            </title>
            <aug>
               <au>
                  <snm>Levy</snm>
                  <fnm>ED</fnm>
               </au>
               <au>
                  <snm>Erba</snm>
                  <fnm>EB</fnm>
               </au>
               <au>
                  <snm>Robinson</snm>
                  <fnm>CV</fnm>
               </au>
               <au>
                  <snm>Teichmann</snm>
                  <fnm>SA</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2008</pubdate>
            <volume>453</volume>
            <fpage>1262</fpage>
            <lpage>1265</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18563089</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B63">
            <title>
               <p>OCPAT: an online codon-preserved alignment tool for evolutionary genomic analysis of protein coding sequences</p>
            </title>
            <aug>
               <au>
                  <snm>Liu</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Uddin</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Islam</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Goodman</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Grossman</snm>
                  <fnm>LI</fnm>
               </au>
               <au>
                  <snm>Romero</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Wildman</snm>
                  <fnm>DE</fnm>
               </au>
            </aug>
            <source>Source Code Biol Med</source>
            <pubdate>2007</pubdate>
            <volume>2</volume>
            <fpage>5</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2093931</pubid>
                  <pubid idtype="pmpid" link="fulltext">17877817</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B64">
            <title>
               <p>Conservation of protein-protein interactions &#8211; lessons from ascomycota</p>
            </title>
            <aug>
               <au>
                  <snm>Pagel</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Mewes</snm>
                  <fnm>HW</fnm>
               </au>
               <au>
                  <snm>Frishman</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2004</pubdate>
            <volume>20</volume>
            <fpage>72</fpage>
            <lpage>76</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">14746987</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B65">
            <title>
               <p>Unequal evolutionary conservation of human protein interactions in interologous networks</p>
            </title>
            <aug>
               <au>
                  <snm>Brown</snm>
                  <fnm>KR</fnm>
               </au>
               <au>
                  <snm>Jurisica</snm>
                  <fnm>I</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <fpage>R95</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1929159</pubid>
                  <pubid idtype="pmpid" link="fulltext">17535438</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B66">
            <title>
               <p>Accelerated evolutionary rate may be responsible for the emergence of lineage-specific genes in ascomycota</p>
            </title>
            <aug>
               <au>
                  <snm>Cai</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Woo</snm>
                  <fnm>PC</fnm>
               </au>
               <au>
                  <snm>Lau</snm>
                  <fnm>SK</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>DK</fnm>
               </au>
               <au>
                  <snm>Yuen</snm>
                  <fnm>KY</fnm>
               </au>
            </aug>
            <source>J Mol Evol</source>
            <pubdate>2006</pubdate>
            <volume>63</volume>
            <fpage>1</fpage>
            <lpage>11</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16755356</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B67">
            <title>
               <p>Whole proteome pI values correlate with subcellular localizations of proteins for organisms within the three domains of life</p>
            </title>
            <aug>
               <au>
                  <snm>Schwartz</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Ting</snm>
                  <fnm>CS</fnm>
               </au>
               <au>
                  <snm>King</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2001</pubdate>
            <volume>11</volume>
            <fpage>703</fpage>
            <lpage>709</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11337469</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B68">
            <title>
               <p>Evolution of protein complexes by duplication of homomeric interactions</p>
            </title>
            <aug>
               <au>
                  <snm>Pereira-Leal</snm>
                  <fnm>JB</fnm>
               </au>
               <au>
                  <snm>Levy</snm>
                  <fnm>ED</fnm>
               </au>
               <au>
                  <snm>Kamp</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Teichmann</snm>
                  <fnm>SA</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <fpage>R51</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1895999</pubid>
                  <pubid idtype="pmpid" link="fulltext">17411433</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B69">
            <title>
               <p>Protein subcellular localization prediction based on compartment-specific features and structure conservation</p>
            </title>
            <aug>
               <au>
                  <snm>Su</snm>
                  <fnm>EC</fnm>
               </au>
               <au>
                  <snm>Chiu</snm>
                  <fnm>HS</fnm>
               </au>
               <au>
                  <snm>Lo</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Hwang</snm>
                  <fnm>JK</fnm>
               </au>
               <au>
                  <snm>Sung</snm>
                  <fnm>TY</fnm>
               </au>
               <au>
                  <snm>Hsu</snm>
                  <fnm>WL</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <fpage>330</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2040162</pubid>
                  <pubid idtype="pmpid" link="fulltext">17825110</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B70">
            <title>
               <p>The coordinated evolution of yeast proteins is constrained by functional modularity</p>
            </title>
            <aug>
               <au>
                  <snm>Chen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Dokholyan</snm>
                  <fnm>NV</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2006</pubdate>
            <volume>22</volume>
            <fpage>416</fpage>
            <lpage>419</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16797778</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B71">
            <title>
               <p>Reuse of structural domain-domain interactions in protein networks</p>
            </title>
            <aug>
               <au>
                  <snm>Schuster-Bockler</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Bateman</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <fpage>259</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1940023</pubid>
                  <pubid idtype="pmpid" link="fulltext">17640363</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B72">
            <title>
               <p>The signature of selection mediated by expression on human genes</p>
            </title>
            <aug>
               <au>
                  <snm>Urrutia</snm>
                  <fnm>AO</fnm>
               </au>
               <au>
                  <snm>Hurst</snm>
                  <fnm>LD</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2003</pubdate>
            <volume>13</volume>
            <fpage>2260</fpage>
            <lpage>2264</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">403694</pubid>
                  <pubid idtype="pmpid" link="fulltext">12975314</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B73">
            <title>
               <p>Selection for the miniaturization of highly expressed genes</p>
            </title>
            <aug>
               <au>
                  <snm>Li</snm>
                  <fnm>SW</fnm>
               </au>
               <au>
                  <snm>Feng</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Niu</snm>
                  <fnm>DK</fnm>
               </au>
            </aug>
            <source>Biochem Biophys Res Commun</source>
            <pubdate>2007</pubdate>
            <volume>360</volume>
            <fpage>586</fpage>
            <lpage>592</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17610841</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B74">
            <title>
               <p>Evolutionary systems biology: links between gene evolution and function</p>
            </title>
            <aug>
               <au>
                  <snm>Koonin</snm>
                  <fnm>EV</fnm>
               </au>
               <au>
                  <snm>Wolf</snm>
                  <fnm>YI</fnm>
               </au>
            </aug>
            <source>Curr Opin Biotechnol</source>
            <pubdate>2006</pubdate>
            <volume>17</volume>
            <fpage>481</fpage>
            <lpage>487</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16962765</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B75">
            <title>
               <p>The causes of protein evolutionary rate variation</p>
            </title>
            <aug>
               <au>
                  <snm>McInerney</snm>
                  <fnm>JO</fnm>
               </au>
            </aug>
            <source>Trends Ecol Evol</source>
            <pubdate>2006</pubdate>
            <volume>21</volume>
            <fpage>230</fpage>
            <lpage>232</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16697908</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B76">
            <title>
               <p>An integrated view of protein evolution</p>
            </title>
            <aug>
               <au>
                  <snm>P&#225;l</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Papp</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Lercher</snm>
                  <fnm>MJ</fnm>
               </au>
            </aug>
            <source>Nature Rev Genet</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <issue>5</issue>
            <fpage>337</fpage>
            <lpage>348</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pubmed">16619049</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B77">
            <title>
               <p>The quest for the universals of protein evolution</p>
            </title>
            <aug>
               <au>
                  <snm>Rocha</snm>
                  <fnm>EP</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2006</pubdate>
            <volume>22</volume>
            <fpage>412</fpage>
            <lpage>416</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16808987</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B78">
            <title>
               <p>Mistranslation-induced protein misfolding as a dominant constraint on coding-sequence evolution</p>
            </title>
            <aug>
               <au>
                  <snm>Drummond</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Wilke</snm>
                  <fnm>CO</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>2008</pubdate>
            <volume>134</volume>
            <fpage>341</fpage>
            <lpage>352</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18662548</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B79">
            <title>
               <p>Constraints imposed by non-functional protein-protein interactions on gene expression and proteome size</p>
            </title>
            <aug>
               <au>
                  <snm>Zhang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Maslov</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Shakhnovich</snm>
                  <fnm>EI</fnm>
               </au>
            </aug>
            <source>Mol Syst Biol</source>
            <pubdate>2008</pubdate>
            <volume>4</volume>
            <fpage>210</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2538908</pubid>
                  <pubid idtype="pmpid" link="fulltext">18682700</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B80">
            <title>
               <p>Evolutionary rate in the protein interaction network</p>
            </title>
            <aug>
               <au>
                  <snm>Fraser</snm>
                  <fnm>HB</fnm>
               </au>
               <au>
                  <snm>Hirsh</snm>
                  <fnm>AE</fnm>
               </au>
               <au>
                  <snm>Steinmetz</snm>
                  <fnm>LM</fnm>
               </au>
               <au>
                  <snm>Scharfe</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Feldman</snm>
                  <fnm>MW</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2002</pubdate>
            <volume>296</volume>
            <fpage>750</fpage>
            <lpage>752</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11976460</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B81">
            <title>
               <p>Assessing the determinants of evolutionary rates in the presence of noise</p>
            </title>
            <aug>
               <au>
                  <snm>Plotkin</snm>
                  <fnm>JB</fnm>
               </au>
               <au>
                  <snm>Fraser</snm>
                  <fnm>HB</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2007</pubdate>
            <volume>24</volume>
            <fpage>1113</fpage>
            <lpage>1121</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17347158</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B82">
            <title>
               <p>Understanding relationship between sequence and functional evolution in yeast proteins</p>
            </title>
            <aug>
               <au>
                  <snm>Kim</snm>
                  <fnm>SH</fnm>
               </au>
               <au>
                  <snm>Yi</snm>
                  <fnm>SV</fnm>
               </au>
            </aug>
            <source>Genetica</source>
            <pubdate>2007</pubdate>
            <volume>131</volume>
            <fpage>151</fpage>
            <lpage>156</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17160620</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B83">
            <title>
               <p>Comparable contributions of structural-functional constraints and expression level to the rate of protein sequence evolution</p>
            </title>
            <aug>
               <au>
                  <snm>Wolf</snm>
                  <fnm>MY</fnm>
               </au>
               <au>
                  <snm>Wolf</snm>
                  <fnm>YI</fnm>
               </au>
               <au>
                  <snm>Koonin</snm>
                  <fnm>EV</fnm>
               </au>
            </aug>
            <source>Biol Direct</source>
            <pubdate>2008</pubdate>
            <volume>3</volume>
            <fpage>40</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2572155</pubid>
                  <pubid idtype="pmpid" link="fulltext">18840284</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B84">
            <title>
               <p>Online Mendelian Inheritance in Man (OMIM), a knowledgebase of human genes and genetic disorders</p>
            </title>
            <aug>
               <au>
                  <snm>Hamosh</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Scott</snm>
                  <fnm>AF</fnm>
               </au>
               <au>
                  <snm>Amberger</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Bocchini</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>McKusick</snm>
                  <fnm>VA</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2005</pubdate>
            <volume>33</volume>
            <fpage>D514</fpage>
            <lpage>D517</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">539987</pubid>
                  <pubid idtype="pmpid" link="fulltext">15608251</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B85">
            <title>
               <p>Are splicing mutations the most frequent cause of hereditary disease?</p>
            </title>
            <aug>
               <au>
                  <snm>L&#243;pez-Bigas</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Audit</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Ouzounis</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Parra</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Guig&#243;</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>FEBS Lett</source>
            <pubdate>2005</pubdate>
            <volume>579</volume>
            <fpage>1900</fpage>
            <lpage>1903</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15792793</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B86">
            <title>
               <p>Designability, aggregation propensity and duplication of disease-associated proteins</p>
            </title>
            <aug>
               <au>
                  <snm>Wong</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Fritz</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Frishman</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Protein Eng Des Sel</source>
            <pubdate>2005</pubdate>
            <volume>18</volume>
            <fpage>503</fpage>
            <lpage>508</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16155116</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B87">
            <title>
               <p>Protein-protein interactions more conserved within species than across species</p>
            </title>
            <aug>
               <au>
                  <snm>Mika</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Rost</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>PLoS Comput Biol</source>
            <pubdate>2006</pubdate>
            <volume>2</volume>
            <fpage>e79</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1513270</pubid>
                  <pubid idtype="pmpid" link="fulltext">16854211</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>
