<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1471-2164-8-51</ui>
   <ji>1471-2164</ji>
   <fm>
      <dochead>Research article</dochead>
      <bibl>
         <title>
            <p>A genomic survey of the fish parasite <it>Spironucleus salmonicida </it>indicates genomic plasticity among diplomonads and significant lateral gene transfer in eukaryote genome evolution</p>
         </title>
         <aug>
            <au id="A1" ca="yes">
               <snm>Andersson</snm>
               <mi>O</mi>
               <fnm>Jan</fnm>
               <insr iid="I1"/>
               <email>jan.andersson@icm.uu.se</email>
            </au>
            <au id="A2">
               <snm>Sj&#246;gren</snm>
               <mi>M</mi>
               <fnm>&#197;sa</fnm>
               <insr iid="I2"/>
               <insr iid="I6"/>
               <email>asa.sjogren@mikrob.slu.se</email>
            </au>
            <au id="A3">
               <snm>Horner</snm>
               <mi>S</mi>
               <fnm>David</fnm>
               <insr iid="I3"/>
               <insr iid="I7"/>
               <email>david.horner@unimi.it</email>
            </au>
            <au id="A4">
               <snm>Murphy</snm>
               <mi>A</mi>
               <fnm>Colleen</fnm>
               <insr iid="I4"/>
               <email>colleen.murphy@nrc-cnrc.gc.ca</email>
            </au>
            <au id="A5">
               <snm>Dyal</snm>
               <mi>L</mi>
               <fnm>Patricia</fnm>
               <insr iid="I3"/>
               <email>pd@nhm.ac.uk</email>
            </au>
            <au id="A6">
               <snm>Sv&#228;rd</snm>
               <mi>G</mi>
               <fnm>Staffan</fnm>
               <insr iid="I1"/>
               <email>staffan.svard@icm.uu.se</email>
            </au>
            <au id="A7">
               <snm>Logsdon</snm>
               <mi>M</mi>
               <fnm>John</fnm>
               <suf>Jr</suf>
               <insr iid="I5"/>
               <email>john-logsdon@uiowa.edu</email>
            </au>
            <au id="A8">
               <snm>Ragan</snm>
               <mi>A</mi>
               <fnm>Mark</fnm>
               <insr iid="I4"/>
               <insr iid="I8"/>
               <email>m.ragan@imb.uq.edu.au</email>
            </au>
            <au id="A9">
               <snm>Hirt</snm>
               <mi>P</mi>
               <fnm>Robert</fnm>
               <insr iid="I3"/>
               <insr iid="I9"/>
               <email>r.p.hirt@ncl.ac.uk</email>
            </au>
            <au id="A10">
               <snm>Roger</snm>
               <mi>J</mi>
               <fnm>Andrew</fnm>
               <insr iid="I2"/>
               <email>andrew.roger@dal.ca</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Institute of Cell and Molecular Biology, Uppsala University, Biomedical Center, Uppsala, Sweden</p>
            </ins>
            <ins id="I2">
               <p>The Canadian Institute for Advanced Research, Program in Evolutionary Biology, Department of Biochemistry and Molecular Biology, Dalhousie University, Halifax, Nova Scotia, Canada</p>
            </ins>
            <ins id="I3">
               <p>Department of Zoology, The Natural History Museum, London, UK</p>
            </ins>
            <ins id="I4">
               <p>Institute for Marine Biosciences, National Research Council of Canada, Halifax, Nova Scotia, Canada</p>
            </ins>
            <ins id="I5">
               <p>Roy J. Carver Center for Comparative Genomics, Department of Biological Sciences, University of Iowa, Iowa City, USA</p>
            </ins>
            <ins id="I6">
               <p>Department of Microbiology, Swedish University of Agricultural Sciences, Uppsala, Sweden</p>
            </ins>
            <ins id="I7">
               <p>Dipartimento di Scienze Biomolecolare e Biotecnologie, University of Milan, Milan, Italy</p>
            </ins>
            <ins id="I8">
               <p>ARC Centre in Bioinformatics, and Institute for Molecular Bioscience, The University of Queensland, Brisbane, Australia</p>
            </ins>
            <ins id="I9">
               <p>School of Biology, The Devonshire building, The University of Newcastle upon Tyne, UK</p>
            </ins>
         </insg>
         <source>BMC Genomics</source>
         <issn>1471-2164</issn>
         <pubdate>2007</pubdate>
         <volume>8</volume>
         <issue>1</issue>
         <fpage>51</fpage>
         <url>http://www.biomedcentral.com/1471-2164/8/51</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">17298675</pubid>
               <pubid idtype="doi">10.1186/1471-2164-8-51</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>22</day>
               <month>9</month>
               <year>2006</year>
            </date>
         </rec>
         <acc>
            <date>
               <day>14</day>
               <month>2</month>
               <year>2007</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>14</day>
               <month>2</month>
               <year>2007</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2007</year>
         <collab>Andersson et al; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>Comparative genomic studies of the mitochondrion-lacking protist group Diplomonadida (diplomonads) has been lacking, although <it>Giardia lamblia </it>has been intensively studied. We have performed a sequence survey project resulting in 2341 expressed sequence tags (EST) corresponding to 853 unique clones, 5275 genome survey sequences (GSS), and eleven finished contigs from the diplomonad fish parasite <it>Spironucleus salmonicida </it>(previously described as <it>S. barkhanus</it>).</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>The analyses revealed a compact genome with few, if any, introns and very short 3' untranslated regions. Strikingly different patterns of codon usage were observed in genes corresponding to frequently sampled ESTs versus genes poorly sampled, indicating that translational selection is influencing the codon usage of highly expressed genes. Rigorous phylogenomic analyses identified 84 genes &#8211; mostly encoding metabolic proteins &#8211; that have been acquired by diplomonads or their relatively close ancestors via lateral gene transfer (LGT). Although most acquisitions were from prokaryotes, more than a dozen represent likely transfers of genes between eukaryotic lineages. Many genes that provide novel insights into the genetic basis of the biology and pathogenicity of this parasitic protist were identified including 149 that putatively encode variant-surface cysteine-rich proteins which are candidate virulence factors. A number of genomic properties that distinguish <it>S. salmonicida </it>from its human parasitic relative <it>G. lamblia </it>were identified such as nineteen putative lineage-specific gene acquisitions, distinct mutational biases and codon usage and distinct polyadenylation signals.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>Our results highlight the power of comparative genomic studies to yield insights into the biology of parasitic protists and the evolution of their genomes, and suggest that genetic exchange between distantly-related protist lineages may be occurring at an appreciable rate in eukaryote genome evolution.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="bmc" subtype="user_supplied_xml" id="endnote"/>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>Diplomonads are a diverse group of small mitochondrion-lacking diplokaryotic flagellates found in anaerobic or micro-aerophilic environments <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. Most research on diplomonads has focused on <it>Giardia lamblia </it>(syn. <it>Giardia intestinalis</it>, <it>Giardia duodenalis</it>), which is a major cause of water-borne enteric disease in humans in both industrialised and developing countries <abbrgrp><abbr bid="B2">2</abbr></abbrgrp>. However, there are important variations in lifestyles among diplomonads; although many are endocommensals or parasites associated with animals, there are also several free-living species, mainly within the genera <it>Trepomonas </it>and <it>Hexamita</it>, that are found in aquatic environments rich in organic matter and deficient in oxygen <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. Most members of the genus <it>Spironucleus </it>are parasites, typically of fish but also of birds and mice; several <it>Spironucleus </it>species have been shown to cause disease in their hosts <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>, although essentially nothing is known about the virulence mechanisms of <it>Spironucleus </it>species. <it>Spironucleus salmonicida</it>, the focus of this study, can cause systemic and organ infections in cultivated salmon, posing a significant problem for the aquaculture industry <abbrgrp><abbr bid="B3">3</abbr><abbr bid="B4">4</abbr></abbrgrp>. This isolate was previously known as <it>Spironucleus barkhanus </it><abbrgrp><abbr bid="B5">5</abbr></abbrgrp>, but pathogenic isolates of this species were recently redescribed as <it>S. salmonicida </it>to distinguish them from morphologically identical, but genetically distinct, fish commensal isolates of <it>S. barkhanus </it><abbrgrp><abbr bid="B6">6</abbr></abbrgrp>.</p>
         <p>Diplomonads were once thought to belong to the earliest-diverging lineage within the eukaryotes <abbrgrp><abbr bid="B7">7</abbr></abbrgrp>. Accordingly, they were described as 'biological fossils', true eukaryotes with many peculiarities (e.g. two nuclei, different genetic code, lack of aerobic mitochondria) that retained some ancestral prokaryotic properties <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr></abbrgrp>. However, advances in molecular phylogenetics and cell biology during the last decade strongly suggest this view is incorrect <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>. The current interpretation of the phylogeny of eukaryotes lends no support for diplomonads as the earliest eukaryotic branch <abbrgrp><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp>. Indeed, a sister-group relationship between diplomonads and parabasalids to the exclusion of other eukaryotic lineages and the root has recently been demonstrated, based both on phylogenetic analysis of concatenated protein-coding sequences <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr><abbr bid="B15">15</abbr></abbrgrp>, and on shared gene acquisitions <abbrgrp><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr></abbrgrp>. Diplomonads and parabasalids are now classified within the eukaryotic supergroup Excavata <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>. Furthermore, diplomonads seem to have all features previously thought to be lacking in "primitive" eukaryotes, including an organelle with mitochondrial ancestry (mitosome) <abbrgrp><abbr bid="B19">19</abbr></abbrgrp> and intron-containing genes <abbrgrp><abbr bid="B20">20</abbr><abbr bid="B21">21</abbr></abbrgrp>, while some prokaryotic properties are probably the result of lateral gene transfers from the prokaryotic realm <abbrgrp><abbr bid="B22">22</abbr></abbrgrp>.</p>
         <p>Recently, enteromonads (monokaryotic protists traditionally regarded as closely related to diplomonads) were surprisingly found to branch robustly with <it>Trepomonas </it>and <it>Hexamita </it>in phylogenetic analyses to the exclusion of <it>Spironucleus </it><abbrgrp><abbr bid="B23">23</abbr></abbrgrp>. These results suggest that the diplokaryotic state of diplomonads arose multiple times independently, or that the monokaryon of enteromonads is a derived feature. Large genetic and biological variation also exists within diplomonads. For example, <it>Spironucleus</it>, <it>Trepomonas </it>and <it>Hexamita</it>, form a monophyletic clade to the exclusion of <it>Giardia </it>in phylogenetic trees <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>, and use an alternative genetic code whereby TAA and TAG, rather than being stop codons, encode glutamine <abbrgrp><abbr bid="B25">25</abbr><abbr bid="B26">26</abbr></abbrgrp>.</p>
         <p>To gain insights into the evolutionary history and genomic architecture of diplomonads in general and <it>Spironucleus </it>in particular, we initiated a genome survey project in <it>S. salmonicida</it>. To maximize gene discovery we obtained expressed sequence tag (EST) and genomic survey sequences (GSS), and completely sequenced eleven contigs. Here, we present analyses of the complete set of sequences obtained in the genome survey project. Although we present data that only partially covers the <it>S. salmonicida </it>genome, these data provide key insights into the genome-level properties of <it>S. salmonicida </it>such as its coding content, base compositional biases, gene content, gene architecture, and patterns of gene acquisitions. From these analyses, we are able to make inferences about the biology of a poorly-understood fish parasite, as well as gain a first glimpse into genome evolution within the enigmatic protist phylum Diplomonadida.</p>
      </sec>
      <sec>
         <st>
            <p>Results and discussion</p>
         </st>
         <sec>
            <st>
               <p>The first sequence data from <it>Spironucleus </it>on the genomic level</p>
            </st>
            <p>This sequence survey of <it>S. salmonicida </it>has been the starting point for several projects regarding different aspects of the genetics and molecular evolution of this diplomonad <abbrgrp><abbr bid="B16">16</abbr><abbr bid="B27">27</abbr><abbr bid="B28">28</abbr><abbr bid="B29">29</abbr><abbr bid="B30">30</abbr><abbr bid="B31">31</abbr><abbr bid="B32">32</abbr><abbr bid="B33">33</abbr></abbrgrp>. Together with a few other studies, these have resulted in about thirty <it>S. salmonicida </it>genes in the public databases. The present analysis of the complete set of 2408 EST and 5275 GSS sequences, combined with a the complete sequence of eleven contigs corresponding to 80 kbp unique sequence (Additional file <supplr sid="S1">1</supplr>), extend this information to include 1738 unique protein coding genes, two ribosomal RNA genes and 20 tRNA genes (Table <tblr tid="T1">1</tblr> and Additional file <supplr sid="S2">2</supplr>). Altogether our sequence data cover more than 2.5 Mbp of the <it>S. salmonicida </it>genome. The only genome size reported from a diplomonad is 12 Mbp for the genome of <it>G. lamblia </it><abbrgrp><abbr bid="B34">34</abbr></abbrgrp>. The genome size of <it>S. salmonicida </it>is unknown, but the degree of sequence overlap between independent clones in our random genomic shotgun library yielded a very rough estimate of approximately 7 Mbp of unique sequence (see Methods for details of the calculation). Interestingly, the observation that 33% of the EST sequences have matches within the GSS sequences suggests a genome size in a similar range, unless the same genes are preferentially cloned in both the EST and GSS sequences. Thus, there are no indications within our sequence survey project that the <it>S. salmonicida </it>genome is larger than the <it>G. lamblia </it>genome. These observations indicate that our obtained sequences potentially represent one third of the complete genome.</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Summary of genes detected in the <it>S. salmonicida </it>genome.</p>
               </caption>
               <tblbdy cols="6">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>EST</p>
                     </c>
                     <c ca="center">
                        <p>GSS</p>
                     </c>
                     <c ca="center">
                        <p>contigs</p>
                     </c>
                     <c ca="center">
                        <p>published</p>
                     </c>
                     <c ca="center">
                        <p>TOTAL</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="6">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cellular processes</p>
                     </c>
                     <c ca="center">
                        <p>26</p>
                     </c>
                     <c ca="center">
                        <p>46</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>74</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Cell communication</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Cell growth and death</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>20</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Cell motility</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Development</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>unclassified</p>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                     <c ca="center">
                        <p>24</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>39</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Environmental information processing</p>
                     </c>
                     <c ca="center">
                        <p>34</p>
                     </c>
                     <c ca="center">
                        <p>53</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>92</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Ligand-receptor interaction</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Membrane transport</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Signal transduction</p>
                     </c>
                     <c ca="center">
                        <p>28</p>
                     </c>
                     <c ca="center">
                        <p>44</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>73</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>unclassified</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Genetic information processing</p>
                     </c>
                     <c ca="center">
                        <p>126</p>
                     </c>
                     <c ca="center">
                        <p>58</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>189</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Folding, sorting and degradation</p>
                     </c>
                     <c ca="center">
                        <p>30</p>
                     </c>
                     <c ca="center">
                        <p>16</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>47</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Replication and repair</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>22</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Transcription</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Translation</p>
                     </c>
                     <c ca="center">
                        <p>82</p>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>96</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>unclassified</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Metabolism</p>
                     </c>
                     <c ca="center">
                        <p>99</p>
                     </c>
                     <c ca="center">
                        <p>110</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>21</p>
                     </c>
                     <c ca="center">
                        <p>236</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Amino acid metabolism</p>
                     </c>
                     <c ca="center">
                        <p>17</p>
                     </c>
                     <c ca="center">
                        <p>16</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>38</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Carbohydrate metabolism</p>
                     </c>
                     <c ca="center">
                        <p>28</p>
                     </c>
                     <c ca="center">
                        <p>29</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>67</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Energy metabolism</p>
                     </c>
                     <c ca="center">
                        <p>18</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>35</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Glycan biosynthesis and metabolism</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Lipid metabolism</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Metabolism of cofactors and vitamins</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Metabolism of other amino acids</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>Nucleotide metabolism</p>
                     </c>
                     <c ca="center">
                        <p>19</p>
                     </c>
                     <c ca="center">
                        <p>38</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>60</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left" indent="1">
                        <p>unclassified</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Conserved hypothetical protein</p>
                     </c>
                     <c ca="center">
                        <p>189</p>
                     </c>
                     <c ca="center">
                        <p>528</p>
                     </c>
                     <c ca="center">
                        <p>15</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>732</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Hypothetical protein</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Ribosomal RNA</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>tRNA</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>20</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>20</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="6">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total</p>
                     </c>
                     <c ca="center">
                        <p>473</p>
                     </c>
                     <c ca="center">
                        <p>817</p>
                     </c>
                     <c ca="center">
                        <p>40</p>
                     </c>
                     <c ca="center">
                        <p>27</p>
                     </c>
                     <c ca="center">
                        <p>1357</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <suppl id="S1">
               <title>
                  <p>Additional file 1</p>
               </title>
               <text>
                  <p>A table showing the characteristics of the finished contigs.</p>
               </text>
               <file name="1471-2164-8-51-S1.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S2">
               <title>
                  <p>Additional file 2</p>
               </title>
               <text>
                  <p>Complete list of gene annotations.</p>
               </text>
               <file name="1471-2164-8-51-S2.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Variable G+C content along the genome</p>
            </st>
            <p>On the whole, the <it>S. salmonicida </it>genome was found to be G+C poor; the average G+C contents were 35.9%, and 39.3% within the 5070 GSSs and the eleven finished sequences, respectively. However, the eleven finished contigs showed large variation in G+C content, with average G+C contents ranging from 24.9% to 58.3% (named Sp1-11, Figure <figr fid="F1">1</figr>). This probably cannot be explained by the presence within each contig of genes with the higher values; the coding content of Sp2 is 96% and its G+C content is only 31%, while the coding content of Sp8 is 75% and its G+C content is 58% (Additional file <supplr sid="S1">1</supplr>). In fact, the G+C content sometimes varies drastically within each contig. For example, the average G+C content in the region between 1&#8211;5 kbp from the 5' end of Sp1 is around 30%, while between 6&#8211;11 kbp its G+C content is almost 70% (Figure <figr fid="F1">1</figr>). Similar sharp shifts in G+C content along the genome are observed in some other contigs (e.g. Sp7, Sp10, and Sp11: Figure <figr fid="F1">1</figr>). These shifts in G+C content do not seem to be correlated with the presence and absence of genes: both G+C rich and poor regions are fairly dense with genes, with the exception of the G+C poor contig Sp4 and the 5' end of Sp9. However, these observations are consistent with the existence of different mutational biases in different regions of the <it>S. salmonicida </it>genome; the G+C contents of both the third synonymous position of protein coding genes and the non-coding regions varies as expected if mutational bias shapes the G+C content <abbrgrp><abbr bid="B35">35</abbr></abbrgrp>, with the GC3 values of genes higher than the average G+C content for genes in G+C rich regions and lower in G+C poor regions (Figure <figr fid="F1">1</figr>). A similar pattern is observed for non-coding regions (Additional file <supplr sid="S1">1</supplr>), and the codon usage analysis indicates large variations of the G+C contents among genes (see below).</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>A plot of G+C content along the eleven finished contigs</p>
               </caption>
               <text>
                  <p><b>A plot of G+C content along the eleven finished contigs</b>. G+C content calculated in 500-bp sliding windows in 50-bp steps along the finished contigs. The marks on the x axis indicate 1 kbp. Black lines, dark grey and light grey lines indicate annotated genes with sequence similarities in the public databases, hypothetical genes with matches in the EST data, and hypothetical genes without matches in the public databases or EST data, respectively. The position of the line on the y axis indicates the GC3<sub>s </sub>value of the gene, an arrow indicates its direction (strand), and the annotated gene function is indicated. Average genomic G+C contents in the GSS clones are indicated by a dotted line. The order of the contigs is arbitrary.</p>
               </text>
               <graphic file="1471-2164-8-51-1"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p><it>S. salmonicida </it>has a compact genome</p>
            </st>
            <p>Analysis of the eleven completely sequenced contigs showed that the coding density varies significantly between contigs (Figure <figr fid="F1">1</figr> and Additional file <supplr sid="S1">1</supplr>). Some parts of the genome appear to be very gene-dense, with short intergenic regions. In fact, six cases of putative overlapping open reading frames (ORFs) were identified, similar to earlier findings in <it>G. lamblia </it><abbrgrp><abbr bid="B36">36</abbr></abbrgrp>. The lengths of the overlapping regions range from 1 to 101 bp; in four cases they are encoded in the same direction, while in the other two cases the 5' regions overlap. Experimental studies are needed to determine which initiation codons actually are used in these putative genes to determine if they are truly overlapping transcribed ORFs that encode functional proteins. Nevertheless, the whole genome does not seem to be packed with genes; no protein coding sequence could be detected in the almost 5-kbp contig Sp4, nor in a long region upstream of the 18S ribosomal RNA gene in Sp9 (Figure <figr fid="F1">1</figr>). In <it>G. lamblia</it>, the genes for ribosomal RNA have been found to be associated with telomeres <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>. However, we were unable to detect any sequence similarity to genes that are associated with telomeres in <it>G. lamblia</it>, or any telomere repeats, in the long region upstream of the rRNA genes in <it>S. salmonicida </it>Sp9.</p>
            <p>The transcription of protein-encoding genes in <it>Giardia </it>is atypical for eukaryotes. The promoters are short; less than 70 bp is needed for efficient expression of most genes, even if they are stage-specific <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. The 5'-UTRs of the transcripts are usually only 1&#8211;10 nt, and the genes lack TATA boxes or other <it>cis</it>-acting promoter elements characteristic of typical eukaryotic promoters; AT-rich sequences around the <it>G. lamblia </it>ATG initiation codons determine the transcriptional start site and are essential and sufficient for promoter activity <abbrgrp><abbr bid="B39">39</abbr></abbrgrp>. The <it>S. salmonicida </it>promoters apparently lack TATA-boxes and other typical eukaryotic promoter motifs (Figure <figr fid="F2">2A</figr>). However, AT-rich stretches are found close to the translational start sites, or in the first 50 bp upstream (Figure <figr fid="F2">2A</figr>) and the intergenic regions are very short (Figure <figr fid="F1">1</figr>). Thus, the <it>S. salmonicida </it>transcriptional machinery appears to resemble the 'atypical' machinery previously characterized in <it>G. lamblia </it><abbrgrp><abbr bid="B39">39</abbr></abbrgrp>.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>5' and 3' untranslated regions in <it>S. salmonicida</it></p>
               </caption>
               <text>
                  <p><b>5' and 3' untranslated regions in <it>S. salmonicida</it></b>. A: 5' regions of full-length genes from the completely sequenced contigs. The initiation codons of nine genes in the contigs (Figure 1) could be precisely identified based on sequence conservation compared to orthologs. The 5' sequences are aligned based on the initiation codons (indicated by a box). B: Sequence logo [107] around the termination codon of 134 <it>Spironucleus </it>cDNA sequences.</p>
               </text>
               <graphic file="1471-2164-8-51-2"/>
            </fig>
            <p>The position of the polyA tail in relation to the termination codon could be mapped in 134 EST clones. The 3' untranslated regions (UTR) of <it>S. salmonicida </it>genes appear to be short; the average distance between the termination codon and the first A in the polyA tail is 13.2 bases and in 122 of the 134 cases the distance is between 9 and 14 nucleotides (Figure <figr fid="F2">2B</figr>). Such very short 3' UTRs have previously been observed in <it>G. lamblia</it>, but this is in stark contrast to most other studied eukaryotes where 3' UTRs have been proposed to play important roles in regulating messenger RNA (mRNA) stability and translation <abbrgrp><abbr bid="B40">40</abbr></abbrgrp>. In <it>G. lamblia</it>, AGTRAAY has been identified as a consensus polyadenylation signal <abbrgrp><abbr bid="B41">41</abbr></abbrgrp>. Our analyses do not identify any strong consensus sequence outside the conserved unique termination codon TGA, although we observe a preference for A in the position two bases upstream of the termination codon, and a T immediately downstream (Figure <figr fid="F2">2B</figr>). Interestingly, the three most conserved nucleotides in the <it>G. lamblia </it>polyadenylation signals are the central TRA nucleotides, which is similar to the situation in <it>S. salmonicida</it>. Furthermore, a preference for a U-rich region close to the polyA tail is also apparent, a pattern conserved in many eukaryotes but not <it>Giardia </it><abbrgrp><abbr bid="B41">41</abbr><abbr bid="B42">42</abbr></abbrgrp>. It has been reported that a fraction (~20%) of complementary DNAs (cDNAs) from <it>G. lamblia </it>represent polyadenylated sterile anti-sense transcripts that may result from a loose control of transcription <abbrgrp><abbr bid="B43">43</abbr></abbrgrp>. The rarity of such sterile transcripts in our cDNA library (~1% among 2341 EST) indicates that this phenomenon is not universal for diplomonads. Indeed, our data indicate considerable variation in the specificity of the transcription and polyadenylation machineries within diplomonads.</p>
            <p>The availability of both EST and genomic sequences was used to identify putative introns. An intron should be detected as a sequence gap in an alignment between the EST and the corresponding genomic sequence because the EST sequences typically represent the spliced version of the gene sequence. This approach was used to identify potential introns using similarity searches with the EST sequences as probes against the GSS and finished contig genomic sequences. 290 out of 885 ESTs matched with an e &lt; e<sup>-10 </sup>(<it>i.e.</it>, almost all were identical sequences) and manual inspection failed to detect any introns. The <it>S. salmonicida </it>genome appears to be very intron-poor. Given that only a few introns have been detected within the diplomonad <it>G. lamblia </it><abbrgrp><abbr bid="B20">20</abbr><abbr bid="B21">21</abbr></abbrgrp>, a paucity of introns could represent the ancestral state of the diplomonads. However, two introns were detected in one of the first genes sequenced from <it>Carpediemonas </it><abbrgrp><abbr bid="B44">44</abbr></abbrgrp>, an excavate taxon and possible sister lineage to diplomonads. Thus, introns may have been more frequent in a common ancestor of diplomonads and <it>Carpediemonas</it>, and that the ancestral diplomonad lineage experienced genome-wide intron loss, an evolutionary phenomenon that is not uncommon <abbrgrp><abbr bid="B45">45</abbr></abbrgrp>. A basic spliceosomal organisation is present in <it>Giardia </it>suggesting that the spliceosome is ancestral to extant eukaryotes <abbrgrp><abbr bid="B46">46</abbr></abbrgrp>. Although our analyses did not identify any proteins likely to be involved in splicing in <it>S. salmonicida</it>, further sequencing and more detailed analyses are needed to determine whether introns and a functional spliceosomal apparatus are present in <it>S. salmonicida</it>.</p>
         </sec>
         <sec>
            <st>
               <p>Coding capacity of <it>S. salmonicida</it></p>
            </st>
            <p>In this study we have identified more than 1300 novel genes, distributed among all functional categories, representing a twenty-fold increase of the number of genes with assigned functions identified in the <it>S. salmonicida </it>genome (Table <tblr tid="T1">1</tblr>). Among these were genes involved in translation: 74 genes encoding ribosomal proteins, many translation factors, and fifteen different tRNA synthetases were identified (Additional file <supplr sid="S2">2</supplr>). Twenty tRNA genes were identified, which cover 24 of the 63 sense codons allowing for the normal wobble rules for codon-anticodon pairing. No tRNA was identified that decodes UAG or UAA codons, which encode glutamine in <it>Spironucleus</it>, although such tRNA genes have been identified previously <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. Interestingly, all 64 codons appear to have the potential to code for incorporation of amino acids into proteins in <it>S. salmonicida</it>; both tRNA identification programs used in our analyses identified a putative tRNA with the anticodon UCA, annotated as a selenocysteine (Sec) tRNA. The identification of a putative Sec tRNA, which is a central component of selenoprotein biosynthesis <abbrgrp><abbr bid="B47">47</abbr></abbrgrp>, in our data set suggests that <it>Spironucleus </it>is able to use the single stop codon (UGA) to incorporate this rare amino acid into selenoproteins. Indeed, the usage of selenocysteine seems to be widespread feature in protists; Sec tRNAs have recently been identified in <it>Dictyostelium</it>, <it>Tetrahymena</it>, and <it>Plasmodium </it><abbrgrp><abbr bid="B48">48</abbr><abbr bid="B49">49</abbr></abbrgrp>.</p>
            <p>The identified proteins within the cellular, environmental information, and genetic information process categories in our data set clearly reflect a coding potential similar to a typical eukaryote, including eukaryotic translation and transcription machineries, many proteins involved in eukaryotic signal transduction pathways, a large family of dynein proteins, and five genes encoding members of the Rab small GTPase family (Additional file <supplr sid="S2">2</supplr>). This is indeed expected from the current view of diplomonad phylogeny and cell biology (see Background section). Interestingly, only eight Rab genes were found in <it>G. lamblia</it>, while a large number of Rab GTPases were found in <it>Trichomonas vaginalis</it>, most likely related to the apparently more-complex endomembrane system in this parabasalid <abbrgrp><abbr bid="B50">50</abbr></abbrgrp>. Two of the five Rab proteins identified in our survey lack identifiable orthologs in the <it>G. lamblia </it>genome, but branch with <it>T. vaginalis </it>Rab sequences in phylogenetic trees (data not shown), suggesting that <it>S. salmonicida </it>has retained Rab proteins that have been lost in the lineage leading to <it>G. lamblia</it>.</p>
            <p>Absences of genes are very difficult to infer from partial genome data, but some general trends may be observed. For example, relatively few enzymes involved in amino acid metabolism were detected (Additional file <supplr sid="S2">2</supplr>). Aminoacyl-tRNA synthetases are classified into this category, but they are atypical since they are essential for protein synthesis. Furthermore, only a single protein (malate dehydrogenase) associated with the tricarboxylic acid (TCA) cycle was found. However, malate dehydrogenase actually functions in a pyruvate synthesis pathway in <it>G. lamblia </it><abbrgrp><abbr bid="B2">2</abbr></abbrgrp>, rather than in the TCA cycle, suggesting a similar role in <it>S. salmonicida</it>. In contrast, several glycolytic proteins are present in our data set (Additional file <supplr sid="S2">2</supplr>). This pattern of metabolic proteins is expected from a fermentative phagotrophic heterotroph which has access to organic compounds from its host, and indeed is very similar to the pattern found in <it>Entamoeba histolytica </it><abbrgrp><abbr bid="B51">51</abbr></abbrgrp>. These similarities between <it>S. salmonicida </it>and <it>E. histoytica </it>are almost certainly due to independent adaptations to such an environment in the two lineages. Indeed, a considerable fraction of the metabolic proteins was found to be more closely related to prokaryotic rather than eukaryotic homologs in the phylogenomic analyses, suggesting acquisition of these genes by gene transfer (see further discussion below).</p>
         </sec>
         <sec>
            <st>
               <p>Does <it>S. salmonicida </it>possess mitosomes?</p>
            </st>
            <p>A new organelle, the mitosome, has recently been identified in <it>G. lamblia</it>, that is probably a remnant of a mitochondrion <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>. Currently, the only known function of mitosomes in <it>Giardia </it>is iron-sulfur (Fe-S) cluster synthesis <abbrgrp><abbr bid="B52">52</abbr><abbr bid="B53">53</abbr></abbrgrp>. The phylogenetic relationship between <it>G. lamblia </it>and <it>S. salmonicida</it>, the likely mitochondrial origin of the organelle, together with mitochondria and their derived organelles currently being thought to be universally present in all extent eukaryotes <abbrgrp><abbr bid="B10">10</abbr></abbrgrp> strongly suggest that the common ancestor of the two species contained an organelle with mitochondrial ancestry. Here we identified two strong cases of candidate mitosomal proteins in <it>S. salmonicida</it>, a chaperon GroEL (or Hsp60 or Cpn60) a key protein for mediating protein folding in mitochondria <abbrgrp><abbr bid="B28">28</abbr></abbrgrp> and a cysteine desulfurase (called Nifsp in <it>Saccharomyces cerevisiae</it>), a key enzyme of the Fe-S cluster synthesis pathway <abbrgrp><abbr bid="B54">54</abbr></abbrgrp> (Additional file <supplr sid="S2">2</supplr>). Orthologous proteins of Hsp60 and Nifsp are known to localize and function in <it>S. cerevisiae </it>mitochondria and <it>G. lamblia </it>mitosomes <abbrgrp><abbr bid="B52">52</abbr><abbr bid="B53">53</abbr></abbrgrp>. Localization studies of these two proteins should indeed be very useful to investigate whether <it>S. salmonicida </it>contains mitosomes.</p>
            <p>A full-length ORF encoding a dynamin-like protein that is found on contig Sp3 (Figure <figr fid="F1">1</figr>) is another protein potentially linked with the mitosome. The <it>G. lamblia </it>genome encodes a single dynamin-like protein and phylogenetic analyses recover the two diplomonad sequences as monophyletic (data not shown). The function of the <it>G. lamblia </it>single dynamin-like protein is currently unknown. Yet, a single dynamin-like protein encoding gene is also found in three kinetoplastid genomes (two <it>Trypanosoma </it>and one <it>Leishmania</it>) <abbrgrp><abbr bid="B55">55</abbr></abbrgrp> and the microsporidium <it>Encephalitozoon cuniculi </it><abbrgrp><abbr bid="B56">56</abbr></abbrgrp>, whereas most eukaryotic genomes encode several dynamin-like paralogues that function either in membrane trafficking or organelle division (mitochondria and plastids) <abbrgrp><abbr bid="B57">57</abbr></abbrgrp>. Interestingly, the single dynamin-like protein from <it>Trypanosoma brucei </it>was shown to be involved in mitochondrial division <abbrgrp><abbr bid="B58">58</abbr></abbrgrp>. Hence the single dynamin-like proteins in <it>Spironucleus</it>, <it>Giardia </it>and <it>Encephalitozoon </it>could all be involved in mitosome division.</p>
         </sec>
         <sec>
            <st>
               <p>A large family of cysteine-rich proteins</p>
            </st>
            <p>The predicted amino acid sequences of 149 genes were found to contain more than 10% cysteine and were classified as cysteine-rich proteins. Most of these were annotated as conserved hypothetical proteins, although some could be assigned to a functional category (Additional file <supplr sid="S2">2</supplr>). Most of the cysteine residues were found as CXXC motifs (Figure <figr fid="F3">3</figr> and data not shown). Such an arrangement is similar to the large protein family of variant-specific surface proteins (VSP) found in <it>G. lamblia </it><abbrgrp><abbr bid="B59">59</abbr></abbrgrp>, which is estimated to comprise 2.4% of the genome <abbrgrp><abbr bid="B60">60</abbr></abbrgrp>. However, less than 10% of the cysteine-rich proteins in <it>S. salmonicida </it>showed highest sequence similarities to <it>G. lamblia </it>cysteine-rich proteins, and the two conserved motifs of <it>G. lamblia </it>VSP proteins, CRGKA and GGCY <abbrgrp><abbr bid="B59">59</abbr></abbrgrp>, were not found within any of the amino acid sequence of <it>S. salmonicida </it>cysteine-rich proteins. Indeed, in similarity searches the majority were most similar to putative proteins discovered in the ciliate <it>Tetrahymena thermophila </it>genome project (data not shown) <abbrgrp><abbr bid="B61">61</abbr></abbrgrp>. These observations indicate that diplomonads vary greatly in their cysteine-rich proteins; the gene families indeed appear to have expanded independently in the <it>Giardia </it>and <it>Spironucleus </it>lineages. The biological role of VSP proteins is not well understood, but VSP proteins are immuno-dominant in <it>G. lamblia </it>and expressed on the cell surface <abbrgrp><abbr bid="B59">59</abbr></abbrgrp>. Among the 149 cysteine-rich proteins coding sequences two are likely to represent full-length ORFs. These are strong candidate surface proteins since they possess a transmembrane (TM) domain and a cysteine-rich domain made of furin-like and/or epidermal growth factor (EGF)-like domains typical of surface or secreted proteins, a feature shared with <it>G. lamblia </it>VSPs (Figure <figr fid="F3">3</figr>). A total of 14 sequences encoding partial proteins with cysteine-rich domains possess similar structural organization as the one shown in Figure <figr fid="F3">3</figr>, i.e. they possess a TM domain with the cysteine-rich domains likely to face the extra-cellular milieu. No TM domains could be found in the remaining cysteine-rich proteins within our dataset. However, in several cases these partial cysteine-rich proteins show high similarity to cysteine-rich proteins containing TM domains, suggesting that they could represent partial surface protein sequences (derived from EST or GSS). This observation is consistent with the genome of <it>S. salmonicida </it>encoding a large gene family of cysteine-rich variant surface proteins, as established for the VSP protein family in <it>G. lamblia </it>where only one of the 150 VSP genes is expressed per cell. In <it>G. lamblia </it>the VSP gene family displays antigenic variation and new VSP genes are induced at a relatively high frequency, which is important for escaping the host's adaptive immune system <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B59">59</abbr><abbr bid="B62">62</abbr></abbrgrp>. Further sequence data and analyses, as well as expression and cellular localization studies are needed to understand the function of this large protein family in <it>S. salmonicida</it>.</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Structural organization of the two identified full-length candidate surface proteins with cysteine rich segments</p>
               </caption>
               <text>
                  <p><b>Structural organization of the two identified full-length candidate surface proteins with cysteine rich segments</b>. A: Domain organization of the putative protein encoded by Sp10orf2 (573 residues) [GenBank:<ext-link ext-link-type="gen" ext-link-id="DQ812527">DQ812527</ext-link>]. The diagram shows the position of the seven furin-like domains (SM00261 &#8211; orange boxes) relative the transmembrane domain (blue box) as determined by SMART4.0 [125]. Several variations were inferred by SMART including some where furin-like domains corresponded to the related EGF-like domain (SM00181 &#8211; green boxes, see below). Due to the overlap between these inferences only the furin-like domains are shown for simplicity. The orientation of the protein in the membrane is N-terminus outside and C-terminus inside as inferred by TMHMM2.0 [126]. This is consistent with the hypothesis that cysteine-rich domains are facing the extracellular milieu where they could interact with other proteins. The alignment of the seven inferred furin-like domains as inferred by T-COFFEE [127] is shown below the diagram, with the positions of the first and last residue of each domain indicated on the left. Cysteines are highlighted in red and bold. No putative signal peptide was found with SignalP3.0 [128]. B: Domain organization of the putative protein encoded by Sp1orf4 (453 residues) [GenBank:<ext-link ext-link-type="gen" ext-link-id="DQ812518">DQ812518</ext-link>]. This protein has a similar structural organization as the one shown in A with three EGF-like domains inferred to face the external milieu. The three EGF-like domains were aligned manually. In addition, this sequence may have a signal peptide (indicated by a red box) since the S-score is positive in SignalP3.0 [128]. C: Domain organization of <it>G. lamblia </it>VSP417-6 protein (704 residues) [GenBank:<ext-link ext-link-type="gen" ext-link-id="AAF02907">AAF02907</ext-link>] [129] is shown for comparison. Four furin-like and two EGF-like domains identified by SMART4.0 [125] were aligned with T-COFFEE [127]. The <it>G. lamblia </it>sequence possesses a signal peptide according to SignalP3.0 [128]. All diagrams are drawn to scale.</p>
               </text>
               <graphic file="1471-2164-8-51-3"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Insights into the molecular basis of <it>S. salmonicida </it>pathogenicity</p>
            </st>
            <p><it>Spironucleus </it>species have been described as a cause of disease in hosts that include birds, fish and mice <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>; <it>S. salmonicida</it>, for example, is a problem for the fish industry <abbrgrp><abbr bid="B3">3</abbr><abbr bid="B4">4</abbr></abbrgrp>. However, essentially nothing is known about virulence factors in <it>Spironucleus</it>. In healthy fish, the parasite <it>Spironucleus vortens </it>is commonly found in the flagellated stage (trophozoites) in the lumen of the upper intestine, where it remains attached to the intestinal mucosa, controlled by the mucosal immune system of the host. This stage of infection can cause diarrhea, but villus atrophy, ulceration or inflammation are thought to be absent <abbrgrp><abbr bid="B63">63</abbr></abbrgrp>, which is similar to observations during <it>G. lamblia </it>infections <abbrgrp><abbr bid="B62">62</abbr></abbrgrp>. Antigenic variation among the identified cysteine-rich proteins in <it>S. salmonicida </it>could potentially protect the parasite against secretory antibodies at the mucosal surfaces. Nitric oxide (NO) and reactive oxygen species (ROS) are important factors in the host's protection against mucosal pathogens <abbrgrp><abbr bid="B62">62</abbr></abbrgrp>. <it>S. salmonicida </it>encodes at least two rubrerythrins, two A-type flavoproteins and arginine deiminase (Additional file <supplr sid="S2">2</supplr>). These proteins, which are coded by genes putatively acquired from prokaryotes via gene transfer (see below), protect other microbes against ROS and NO <abbrgrp><abbr bid="B62">62</abbr><abbr bid="B64">64</abbr><abbr bid="B65">65</abbr></abbrgrp>, and similar roles are likely in <it>S. salmonicida</it>.</p>
            <p>In the laboratory, <it>Spironucleus muris </it>is transmitted as cysts in fecal material like <it>Giardia </it><abbrgrp><abbr bid="B66">66</abbr></abbrgrp>. Cysts of the genus <it>Spironucleus </it>share many morphological features with those of <it>Giardia </it>including the presence of two to four nuclei, flagellar axonemes, and a distinct cyst wall. Cysts of <it>S. muris </it>even display the same immunostaining as <it>Giardia </it>cysts when labeled with antibodies specific for <it>Giardia </it>cyst wall <abbrgrp><abbr bid="B66">66</abbr></abbrgrp>. We identified one homolog of <it>G. lamblia </it>cyst wall proteins, and two enzymes involved in the production of the sugar components of the cyst wall (glucosamine-6-phosphate isomerase and UDP-N-acetylglucosamine pyrophosphorylase &#8211; Additional file <supplr sid="S2">2</supplr>). The presence of these three genes indicate that <it>S. salmonicida </it>may also be able to form cysts, an interesting possibility since nothing yet is known of how <it>S. salmonicida </it>is spread and how it initiates infection in fish. These genes are stage-specifically expressed in the <it>G. lamblia </it>life cycle, suggesting that studies of their expression might identify regulatory regions of stage-specific genes in <it>Spironucleus</it>. Characteristic features of <it>Giardia </it>cysts include fragments of the adhesive disk but this structure, involved in attachment of <it>Giardia</it>, is conspicuously absent from <it>Spironucleus </it>cells. None of the genes encoding disc-specific proteins in <it>G. lamblia </it>were identified in this genomic survey, consistent with the absence of this structure in <it>S. salmonicida</it>.</p>
            <p>In contrast to <it>G. lamblia</it>, trophozoites of <it>S. salmonicida </it>can enter the blood causing systemic and organ infections <abbrgrp><abbr bid="B67">67</abbr></abbrgrp>. Cysteine proteases are essential for pathogenicity and invasion of the intestine of <it>E. histolytica </it><abbrgrp><abbr bid="B68">68</abbr></abbrgrp>. Therefore the several cysteine proteases that were found in our genomic survey are potential virulence factors possibly involved in invasion/tissue destruction by <it>S. salmonicida</it>. Secretion of cysteine proteases was indeed recently shown to occur from trophozoites of <it>G. lamblia </it>upon interaction with epithelial cells <abbrgrp><abbr bid="B69">69</abbr></abbrgrp>. Cysteine protease activities are also important for excystation and encystation of <it>Giardia </it><abbrgrp><abbr bid="B70">70</abbr><abbr bid="B71">71</abbr></abbrgrp>, suggesting yet another potential role for these enzymes in <it>S. salmonicida</it>.</p>
         </sec>
         <sec>
            <st>
               <p>Distinct codon usage patterns in highly versus weakly expressed genes</p>
            </st>
            <p>Genome-wide mutational processes have been identified as the main determinant for codon-usage variations among genomes in all three domains of life, while variations within genomes may be explained by selection <abbrgrp><abbr bid="B72">72</abbr><abbr bid="B73">73</abbr></abbrgrp>. We analyzed sequences of 1153 genes to examine the variations of codon usage in the <it>S. salmonicida </it>genome (Table <tblr tid="T2">2</tblr>). The random sequencing of ESTs from a non-normalized cDNA library provided a rough estimate of the expression levels of <it>S. salmonicida </it>genes, since the number of occurrences of a specific gene among the sampled clones should be correlated with the amount of mRNA in the cells that the cDNA library were created from. Analysis of the genes represented by more than ten EST clones ("highly expressed") showed a strong codon-usage bias where one or two codons dominate for each amino acid, while some codons are very rare (Table <tblr tid="T2">2</tblr>). A distinct pattern was found for genes never found in the EST library ("weakly expressed"), for which codon usage is more uniform, with no codons strongly dominating. To compare our results with a previous study from <it>Giardia </it><abbrgrp><abbr bid="B74">74</abbr></abbrgrp>, 438 <it>G. lamblia </it>homologs to the <it>S. salmonicida </it>genes included in the codon-usage analysis were extracted. In the absence of information on expression levels, the <it>G. lamblia </it>genes were categorized according to the number of ESTs for their <it>S. salmonicida </it>homologs. The analysis revealed a pattern very similar to the previous study on a much smaller dataset <abbrgrp><abbr bid="B74">74</abbr></abbrgrp>: codons ending with C or G dominate over codons ending with A or U in putatively highly expressed genes, while the putatively weakly expressed genes have a more uniform amino acid usage.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Codon usage in highly and weakly expressed genes</p>
               </caption>
               <tblbdy cols="20">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2" ca="center">
                        <p>
                           <b><it>Spiro </it>hi<sup>1</sup></b>
                        </p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>
                           <b><it>Spiro </it>weak<sup>2</sup></b>
                        </p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>
                           <b><it>Giardia </it>hi<sup>3</sup></b>
                        </p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>
                           <b><it>Giardia </it>weak<sup>4</sup></b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2" ca="center">
                        <p>
                           <b><it>Spiro </it>hi<sup>1</sup></b>
                        </p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>
                           <b><it>Spiro </it>weak<sup>2</sup></b>
                        </p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>
                           <b><it>Giardia </it>hi<sup>3</sup></b>
                        </p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>
                           <b><it>Giardia </it>weak<sup>4</sup></b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>#</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>RSCU</b>
                           <sup>5</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>#</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>RSCU</b>
                           <sup>5</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>#</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>RSCU</b>
                           <sup>5</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>#</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>RSCU</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>#</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>RSCU</b>
                           <sup>5</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>#</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>RSCU</b>
                           <sup>5</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>#</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>RSCU</b>
                           <sup>5</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>#</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>RSCU</b>
                           <sup>5</sup>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="20">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Phe</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UUU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>80</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.62</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>3520</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.21</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>51</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.41</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>3584</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.99</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Ser</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UCU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>208</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>3.11</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2235</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.51</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>75</p>
                     </c>
                     <c ca="center">
                        <p>1.20</p>
                     </c>
                     <c ca="center">
                        <p>3962</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.53</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UUC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>180</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.38</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2317</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.79</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>197</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.59</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>3689</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.01</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UCC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>114</p>
                     </c>
                     <c ca="center">
                        <p>1.71</p>
                     </c>
                     <c ca="center">
                        <p>1009</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.68</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>125</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.01</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2559</p>
                     </c>
                     <c ca="center">
                        <p>0.99</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Leu</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UUA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>62</p>
                     </c>
                     <c ca="center">
                        <p>0.77</p>
                     </c>
                     <c ca="center">
                        <p>3475</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.84</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.05</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1394</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.44</it>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UCA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>38</p>
                     </c>
                     <c ca="center">
                        <p>0.57</p>
                     </c>
                     <c ca="center">
                        <p>2035</p>
                     </c>
                     <c ca="center">
                        <p>1.38</p>
                     </c>
                     <c ca="center">
                        <p>22</p>
                     </c>
                     <c ca="center">
                        <p>0.35</p>
                     </c>
                     <c ca="center">
                        <p>2218</p>
                     </c>
                     <c ca="center">
                        <p>0.86</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UUG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>17</p>
                     </c>
                     <c ca="center">
                        <p>0.21</p>
                     </c>
                     <c ca="center">
                        <p>1639</p>
                     </c>
                     <c ca="center">
                        <p>0.87</p>
                     </c>
                     <c ca="center">
                        <p>27</p>
                     </c>
                     <c ca="center">
                        <p>0.32</p>
                     </c>
                     <c ca="center">
                        <p>2466</p>
                     </c>
                     <c ca="center">
                        <p>0.77</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UCG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.10</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1027</p>
                     </c>
                     <c ca="center">
                        <p>0.69</p>
                     </c>
                     <c ca="center">
                        <p>77</p>
                     </c>
                     <c ca="center">
                        <p>1.24</p>
                     </c>
                     <c ca="center">
                        <p>1825</p>
                     </c>
                     <c ca="center">
                        <p>0.70</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CUU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>184</p>
                     </c>
                     <c ca="center">
                        <p>2.30</p>
                     </c>
                     <c ca="center">
                        <p>2163</p>
                     </c>
                     <c ca="center">
                        <p>1.15</p>
                     </c>
                     <c ca="center">
                        <p>123</p>
                     </c>
                     <c ca="center">
                        <p>1.44</p>
                     </c>
                     <c ca="center">
                        <p>5060</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.59</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Pro</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CCU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>142</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.27</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1372</p>
                     </c>
                     <c ca="center">
                        <p>1.31</p>
                     </c>
                     <c ca="center">
                        <p>49</p>
                     </c>
                     <c ca="center">
                        <p>0.65</p>
                     </c>
                     <c ca="center">
                        <p>2177</p>
                     </c>
                     <c ca="center">
                        <p>1.05</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CUC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>210</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.62</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1470</p>
                     </c>
                     <c ca="center">
                        <p>0.78</p>
                     </c>
                     <c ca="center">
                        <p>239</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.80</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>4307</p>
                     </c>
                     <c ca="center">
                        <p>1.35</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CCC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>87</p>
                     </c>
                     <c ca="center">
                        <p>1.39</p>
                     </c>
                     <c ca="center">
                        <p>650</p>
                     </c>
                     <c ca="center">
                        <p>0.62</p>
                     </c>
                     <c ca="center">
                        <p>118</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.56</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2010</p>
                     </c>
                     <c ca="center">
                        <p>0.97</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CUA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.00</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1220</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.65</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>15</p>
                     </c>
                     <c ca="center">
                        <p>0.18</p>
                     </c>
                     <c ca="center">
                        <p>2302</p>
                     </c>
                     <c ca="center">
                        <p>0.72</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CCA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>20</p>
                     </c>
                     <c ca="center">
                        <p>0.32</p>
                     </c>
                     <c ca="center">
                        <p>1570</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.50</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>41</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.54</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2369</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.14</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CUG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>0.09</p>
                     </c>
                     <c ca="center">
                        <p>1366</p>
                     </c>
                     <c ca="center">
                        <p>0.72</p>
                     </c>
                     <c ca="center">
                        <p>105</p>
                     </c>
                     <c ca="center">
                        <p>1.23</p>
                     </c>
                     <c ca="center">
                        <p>3601</p>
                     </c>
                     <c ca="center">
                        <p>1.13</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CCG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.02</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>608</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.58</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>94</p>
                     </c>
                     <c ca="center">
                        <p>1.25</p>
                     </c>
                     <c ca="center">
                        <p>1720</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.83</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Ile</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AUU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>155</p>
                     </c>
                     <c ca="center">
                        <p>0.96</p>
                     </c>
                     <c ca="center">
                        <p>4600</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.52</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>92</p>
                     </c>
                     <c ca="center">
                        <p>0.62</p>
                     </c>
                     <c ca="center">
                        <p>4220</p>
                     </c>
                     <c ca="center">
                        <p>1.09</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Thr</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>ACU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>194</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.90</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2206</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.36</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>45</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.53</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2757</p>
                     </c>
                     <c ca="center">
                        <p>0.97</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AUC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>302</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.87</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1977</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.66</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>302</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.05</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>4272</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.11</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>ACC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>170</p>
                     </c>
                     <c ca="center">
                        <p>1.66</p>
                     </c>
                     <c ca="center">
                        <p>1322</p>
                     </c>
                     <c ca="center">
                        <p>0.81</p>
                     </c>
                     <c ca="center">
                        <p>103</p>
                     </c>
                     <c ca="center">
                        <p>1.22</p>
                     </c>
                     <c ca="center">
                        <p>2811</p>
                     </c>
                     <c ca="center">
                        <p>0.98</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AUA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>28</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.17</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2476</p>
                     </c>
                     <c ca="center">
                        <p>0.82</p>
                     </c>
                     <c ca="center">
                        <p>48</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.33</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>3086</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.80</it>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>ACA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>34</p>
                     </c>
                     <c ca="center">
                        <p>0.33</p>
                     </c>
                     <c ca="center">
                        <p>1929</p>
                     </c>
                     <c ca="center">
                        <p>1.19</p>
                     </c>
                     <c ca="center">
                        <p>57</p>
                     </c>
                     <c ca="center">
                        <p>0.68</p>
                     </c>
                     <c ca="center">
                        <p>3544</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.24</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Met</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AUG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>164</p>
                     </c>
                     <c ca="center">
                        <p>1.00</p>
                     </c>
                     <c ca="center">
                        <p>2280</p>
                     </c>
                     <c ca="center">
                        <p>1.00</p>
                     </c>
                     <c ca="center">
                        <p>181</p>
                     </c>
                     <c ca="center">
                        <p>1.00</p>
                     </c>
                     <c ca="center">
                        <p>4180</p>
                     </c>
                     <c ca="center">
                        <p>1.00</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>ACG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.11</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1047</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.64</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>132</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.57</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2306</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.81</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Val</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GUU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>261</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.09</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2782</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.61</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>98</p>
                     </c>
                     <c ca="center">
                        <p>0.77</p>
                     </c>
                     <c ca="center">
                        <p>3608</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.27</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Ala</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GCU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>321</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.48</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2448</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.27</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>118</p>
                     </c>
                     <c ca="center">
                        <p>0.82</p>
                     </c>
                     <c ca="center">
                        <p>3529</p>
                     </c>
                     <c ca="center">
                        <p>1.00</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GUC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>140</p>
                     </c>
                     <c ca="center">
                        <p>1.12</p>
                     </c>
                     <c ca="center">
                        <p>1252</p>
                     </c>
                     <c ca="center">
                        <p>0.72</p>
                     </c>
                     <c ca="center">
                        <p>297</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.32</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>3375</p>
                     </c>
                     <c ca="center">
                        <p>1.18</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GCC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>143</p>
                     </c>
                     <c ca="center">
                        <p>1.11</p>
                     </c>
                     <c ca="center">
                        <p>1570</p>
                     </c>
                     <c ca="center">
                        <p>0.82</p>
                     </c>
                     <c ca="center">
                        <p>228</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.59</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>3738</p>
                     </c>
                     <c ca="center">
                        <p>1.06</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GUA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>81</p>
                     </c>
                     <c ca="center">
                        <p>0.65</p>
                     </c>
                     <c ca="center">
                        <p>1668</p>
                     </c>
                     <c ca="center">
                        <p>0.97</p>
                     </c>
                     <c ca="center">
                        <p>27</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.21</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1591</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.56</it>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GCA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>46</p>
                     </c>
                     <c ca="center">
                        <p>0.36</p>
                     </c>
                     <c ca="center">
                        <p>2233</p>
                     </c>
                     <c ca="center">
                        <p>1.16</p>
                     </c>
                     <c ca="center">
                        <p>96</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.67</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>4588</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.30</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GUG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>18</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.14</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1210</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.70</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>90</p>
                     </c>
                     <c ca="center">
                        <p>0.70</p>
                     </c>
                     <c ca="center">
                        <p>2819</p>
                     </c>
                     <c ca="center">
                        <p>0.99</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GCG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.05</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1437</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.75</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>132</p>
                     </c>
                     <c ca="center">
                        <p>0.92</p>
                     </c>
                     <c ca="center">
                        <p>2310</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.65</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Tyr</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UAU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>145</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.34</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2703</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.31</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>59</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.55</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>3095</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>1.00</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Cys</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UGU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>45</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.58</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1943</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.80</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>28</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.39</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1437</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.80</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UAC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>71</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.66</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1430</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.69</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>156</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.45</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>3110</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.00</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UGC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>110</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.42</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2893</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.20</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>116</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.61</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2137</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.20</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Gln/TER</b>
                           <sup>6</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UAA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>58</p>
                     </c>
                     <c ca="center">
                        <p>0.83</p>
                     </c>
                     <c ca="center">
                        <p>3576</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.67</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>21</p>
                     </c>
                     <c ca="center">
                        <p>1.91</p>
                     </c>
                     <c ca="center">
                        <p>54</p>
                     </c>
                     <c ca="center">
                        <p>0.94</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>TER</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UGA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>30</p>
                     </c>
                     <c ca="center">
                        <p>1.00</p>
                     </c>
                     <c ca="center">
                        <p>140</p>
                     </c>
                     <c ca="center">
                        <p>1.00</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>0.55</p>
                     </c>
                     <c ca="center">
                        <p>62</p>
                     </c>
                     <c ca="center">
                        <p>1.08</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UAG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>44</p>
                     </c>
                     <c ca="center">
                        <p>0.63</p>
                     </c>
                     <c ca="center">
                        <p>1697</p>
                     </c>
                     <c ca="center">
                        <p>0.79</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>0.55</p>
                     </c>
                     <c ca="center">
                        <p>56</p>
                     </c>
                     <c ca="center">
                        <p>0.98</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Trp</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>UGG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>50</p>
                     </c>
                     <c ca="center">
                        <p>1.00</p>
                     </c>
                     <c ca="center">
                        <p>752</p>
                     </c>
                     <c ca="center">
                        <p>1.00</p>
                     </c>
                     <c ca="center">
                        <p>57</p>
                     </c>
                     <c ca="center">
                        <p>1.00</p>
                     </c>
                     <c ca="center">
                        <p>1458</p>
                     </c>
                     <c ca="center">
                        <p>1.00</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>His</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CAU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>70</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.85</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1239</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.22</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>17</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.22</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1595</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.85</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Arg</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CGU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>235</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>3.37</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>764</p>
                     </c>
                     <c ca="center">
                        <p>0.99</p>
                     </c>
                     <c ca="center">
                        <p>100</p>
                     </c>
                     <c ca="center">
                        <p>1.18</p>
                     </c>
                     <c ca="center">
                        <p>1661</p>
                     </c>
                     <c ca="center">
                        <p>1.04</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CAC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>95</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.15</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>796</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.78</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>136</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.78</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2151</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.15</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CGC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>30</p>
                     </c>
                     <c ca="center">
                        <p>0.43</p>
                     </c>
                     <c ca="center">
                        <p>781</p>
                     </c>
                     <c ca="center">
                        <p>1.02</p>
                     </c>
                     <c ca="center">
                        <p>253</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.98</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2403</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.51</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Gln</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CAA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>30</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.43</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1500</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.70</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>25</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.23</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2676</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.73</it>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CGA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.01</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>392</p>
                     </c>
                     <c ca="center">
                        <p>0.51</p>
                     </c>
                     <c ca="center">
                        <p>19</p>
                     </c>
                     <c ca="center">
                        <p>0.22</p>
                     </c>
                     <c ca="center">
                        <p>1115</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.70</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CAG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>147</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.11</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1791</p>
                     </c>
                     <c ca="center">
                        <p>0.84</p>
                     </c>
                     <c ca="center">
                        <p>192</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.77</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>4640</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.27</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>CGG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.01</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>352</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.46</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.08</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1324</p>
                     </c>
                     <c ca="center">
                        <p>0.83</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Asn</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AAU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>106</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.68</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>4502</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.28</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>61</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.43</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>3571</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.91</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Ser</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AGU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>10</p>
                     </c>
                     <c ca="center">
                        <p>0.15</p>
                     </c>
                     <c ca="center">
                        <p>1269</p>
                     </c>
                     <c ca="center">
                        <p>0.86</p>
                     </c>
                     <c ca="center">
                        <p>15</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.24</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1818</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.70</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AAC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>208</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.32</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2544</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.72</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>226</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.57</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>4291</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.09</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AGC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>24</p>
                     </c>
                     <c ca="center">
                        <p>0.36</p>
                     </c>
                     <c ca="center">
                        <p>1296</p>
                     </c>
                     <c ca="center">
                        <p>0.88</p>
                     </c>
                     <c ca="center">
                        <p>60</p>
                     </c>
                     <c ca="center">
                        <p>0.96</p>
                     </c>
                     <c ca="center">
                        <p>3171</p>
                     </c>
                     <c ca="center">
                        <p>1.22</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Lys</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AAA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>191</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.59</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>5117</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.28</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>50</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.16</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2778</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.53</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Arg</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AGA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>141</p>
                     </c>
                     <c ca="center">
                        <p>2.02</p>
                     </c>
                     <c ca="center">
                        <p>1694</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>2.20</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>39</p>
                     </c>
                     <c ca="center">
                        <p>0.46</p>
                     </c>
                     <c ca="center">
                        <p>1575</p>
                     </c>
                     <c ca="center">
                        <p>0.99</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AAG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>458</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.41</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2902</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.72</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>565</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.84</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>7623</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.47</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>AGG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>0.16</p>
                     </c>
                     <c ca="center">
                        <p>628</p>
                     </c>
                     <c ca="center">
                        <p>0.82</p>
                     </c>
                     <c ca="center">
                        <p>91</p>
                     </c>
                     <c ca="center">
                        <p>1.07</p>
                     </c>
                     <c ca="center">
                        <p>1459</p>
                     </c>
                     <c ca="center">
                        <p>0.92</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Asp</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GAU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>208</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.28</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>3993</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.26</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>100</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.55</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>5063</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.97</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Gly</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GGU</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>345</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>3.03</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2029</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.24</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>88</p>
                     </c>
                     <c ca="center">
                        <p>0.73</p>
                     </c>
                     <c ca="center">
                        <p>1923</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.79</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GAC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>116</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.72</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2333</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.74</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>264</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.45</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>5424</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.03</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GGC</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>71</p>
                     </c>
                     <c ca="center">
                        <p>0.62</p>
                     </c>
                     <c ca="center">
                        <p>1672</p>
                     </c>
                     <c ca="center">
                        <p>1.02</p>
                     </c>
                     <c ca="center">
                        <p>215</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.77</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2699</p>
                     </c>
                     <c ca="center">
                        <p>1.11</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>
                           <b>Glu</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GAA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>325</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.53</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>4444</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.24</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>53</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.24</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>4072</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.71</it>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GGA</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>35</p>
                     </c>
                     <c ca="center">
                        <p>0.31</p>
                     </c>
                     <c ca="center">
                        <p>1816</p>
                     </c>
                     <c ca="center">
                        <p>1.11</p>
                     </c>
                     <c ca="center">
                        <p>59</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.49</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2797</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.15</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GAG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>101</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.47</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>2716</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.76</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>389</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.76</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>7431</p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>1.29</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>GGG</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.04</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>1029</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.63</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>123</p>
                     </c>
                     <c ca="center">
                        <p>1.01</p>
                     </c>
                     <c ca="center">
                        <p>2342</p>
                     </c>
                     <c ca="center">
                        <p>0.96</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p><sup>1)</sup><it>S. salmonicida </it>genes represented by more than 10 ESTs (35 genes, 6948 codons)</p>
                  <p><sup>2)</sup><it>S. salmonicida </it>genes unrepresented among the ESTs (682 genes, 122846 codons)</p>
                  <p><sup>3)</sup><it>G. lamblia </it>homologs to <it>S. salmonicida </it>genes represented by more than 10 ESTs (33 genes, 7004 codons)</p>
                  <p><sup>4)</sup><it>G. lamblia </it>homologs to <it>S. salmonicida </it>genes unrepresented among the ESTs (172 genes, 184988 codons)</p>
                  <p><sup>5)</sup>Relative synonymous codon usage; the most and least abundant codons for each amino acid are indicated with boldface and italic font, respectively.</p>
                  <p><sup>6)</sup>UAA and UAG encode glutamine in <it>Spironucleus</it>, and are termination codons in <it>Giardia </it>[25, 26].</p>
               </tblfn>
            </tbl>
         </sec>
         <sec>
            <st>
               <p>Selection on codon usage in highly expressed <it>S. salmonicida </it>genes</p>
            </st>
            <p>To investigate the codon usage in more detail, we plotted the effective number of codons calculated with a method that accounts for variations in the nucleotide composition (N<sub>c</sub>') <abbrgrp><abbr bid="B75">75</abbr></abbrgrp> against the G+C content in the third synonymous position (GC3<sub>s</sub>), and performed correspondence analyses on the relative synonymous codon usage, for both the <it>Spironuclues </it>and <it>Giardia </it>datasets (Figure <figr fid="F4">4</figr>). The highly expressed <it>S. salmonicida </it>genes are centered in the plot with GC3<sub>s </sub>values around 0.4, and show lower N<sub>c</sub>' values than the weakly expressed genes with similar GC3<sub>s </sub>values, indicative of non-random synonymous codon usage (Figure <figr fid="F4">4A</figr>). For <it>G. lamblia</it>, the putatively highly expressed genes exhibit slightly higher GC3<sub>s </sub>and lower N<sub>c</sub>' values than the majority of the genes (Figure <figr fid="F4">4B</figr>). However, a separation of the genes into different categories can be observed: the vast majority of the weakly expressed genes have GC3<sub>s </sub>values between 0.4 and 0.7, while the highly expressed genes have slightly higher values (Figure <figr fid="F4">4B</figr>). Correspondence analyses showed that the G+C content in the third synonymous position is the main determinant of the codon usage in both <it>S. salmonicida </it>and <it>G. lamblia</it>; GC3<sub>s </sub>showed a strong correlation with the first axis (R<sup>2 </sup>= 0.969 and 0.944, respectively: data not shown). Expression levels strongly influence the second axis in the correspondence analysis for <it>S. salmonicida</it>; the highly expressed genes are located at the top separated from the majority of the weakly expressed genes, when axis 2 is plotted against axis 1 (Figure <figr fid="F4">4C</figr>). No such trend is observed for <it>G. lamblia</it>, for which the putative expression levels seem mainly to be correlated with axis 1 (GC3<sub>s</sub>) (Figure <figr fid="F4">4D</figr>). These analyses clearly indicate that there is selection on codon usage in <it>S. salmonicida </it>genes classified as putatively highly expressed, and suggest that their <it>G. lamblia </it>homologs also are under selection (Figure <figr fid="F4">4</figr> and Table <tblr tid="T2">2</tblr>). Translation efficiency has previously been suggested as the cause of the selection in highly expressed genes in <it>G. lamblia</it>, based on a much smaller data set <abbrgrp><abbr bid="B74">74</abbr></abbrgrp>, even though only estimates of expression levels were available for a few of the genes. Our study provides, for a much larger dataset, a connection between the subset of genes with a strong codon bias, and an indirect indication of expression levels (cDNA abundance), corroborating the earlier conclusion and extending it to the distantly related diplomonad <it>S. salmonicida</it>.</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Comparisons of codon usage in <it>S. salmonicida </it>and <it>G. lamblia</it></p>
               </caption>
               <text>
                  <p><b>Comparisons of codon usage in <it>S. salmonicida </it>and <it>G. lamblia</it></b>. A and B: The effective number of codons, N<sub>c</sub>', plotted against the synonymous G+C content in the third codon position (GC3<sub>s</sub>) of 1153 <it>S. salmonicida </it>genes (A) and 438 homologs in <it>G. lamblia </it>(B). Genes are represented by different colors and symbols according to the number of times they were sampled within the EST data. Genes identified to be involved in gene transfer and are shared with <it>G. lamblia </it>(LGT Diplo), or unique to <it>S. salmonicida </it>(LGT Spiro), are indicated by black and red squares, respectively (see Additional file <supplr sid="S3">3</supplr>). If the observed codon usage pattern is more uniform than expected by chance, the N<sub>c</sub>' value is set to 61 [75, 117]. C and D: Correspondence analysis of the relative synonymous codon usage (RSCU) values for the same genes as in A and B for <it>S. salmonicida </it>(C) and <it>G. lamblia </it>(D). The candidate LGTs unique to <it>S. salmonicida</it>, and shared with <it>G. lamblia</it>, are indicated by red and black open squares, respectively.</p>
               </text>
               <graphic file="1471-2164-8-51-4"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>A shift in codon usage within diplomonads</p>
            </st>
            <p>Interestingly, the favored codons differed between <it>S. salmonicida </it>and <it>G. lamblia </it>for ten amino acids, while the same codon is most abundant for eight (two amino acids are encoded by only a single codon) (Table <tblr tid="T2">2</tblr>). In nine of the cases where there is a difference between the two species, <it>S. salmonicida </it>preferentially uses a codon ending with U, while <it>G. lamblia </it>uses a C-ending codon in eight cases and a G-ending codon once. The tenth case is a two-fold degenerate amino acid where <it>S. salmonicida </it>and <it>G. lamblia </it>prefer A- and C-ending codons, respectively (Table <tblr tid="T2">2</tblr>). Thus, in general <it>S. salmonicida </it>favors A+U rich codons, while <it>G. lamblia </it>prefers codons with G or C in the third position in putatively highly expressed genes. There is a distinction between the base compositional biases in <it>G. lamblia </it>and <it>S. salmonicida</it>; the average G+C content of the <it>S. salmonicida </it>sequences in our dataset is 36%, and the majority of the weakly expressed genes have GC3<sub>s </sub>values around 20%, while the weakly expressed <it>G. lamblia </it>genes have GC3<sub>s </sub>around 50% close to the genomic G+C content of <it>G. lamblia </it><abbrgrp><abbr bid="B60">60</abbr></abbrgrp> (Figure <figr fid="F4">4A, B</figr>). This is an expected pattern if mainly mutational processes have shaped the codon usage <abbrgrp><abbr bid="B72">72</abbr><abbr bid="B73">73</abbr></abbrgrp>. However, the genomic G+C content differences seem to have influenced the codon preferences in the two diplomonad lineages in the highly expressed genes as well. In the absence of information about codon usage in a closely related outgroup, it is difficult to determine in which of the two lineages reassignment of the optimal codons has occurred. At any rate, the usage of an alternative genetic code in <it>Spironucleus </it>but not <it>Giardia </it><abbrgrp><abbr bid="B26">26</abbr></abbrgrp> indicates that codon usage have been remodeled in the lineage leading to <it>Spironucleus</it>, at least for the stop and glutamine codons. The canonical stop codon UAA is indeed the most common codon for glutamine in our dataset (Table <tblr tid="T2">2</tblr>), as expected in a G+C poor genome if the codon usage is close to mutational equilibrium <abbrgrp><abbr bid="B72">72</abbr><abbr bid="B73">73</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Unusual codon usage in a subset of <it>S. salmonicida </it>genes</p>
            </st>
            <p>We observed large variation among GC3<sub>s </sub>values for weakly expressed genes in <it>S. salmonicida</it>. Unexpectedly, the N<sub>c</sub>' values for genes with GC3<sub>s </sub>above 0.5 are negatively correlated with GC3<sub>s</sub> (Figure <figr fid="F4">4A</figr>); if only the background nucleotide composition shaped the codon usage for these genes, the N<sub>c</sub>' values should be close to the maximum. This pattern indicates that there is selection on the codon usage in the group of weakly expressed genes with high GC3<sub>s </sub>values. However, selection for the set of optimal codons for highly expressed genes does not explain this pattern, as they include both G+C rich and G+C poor codons (Table <tblr tid="T2">2</tblr>). Also, the large spread of the genes to the left on axis 1 (which is strongly correlated with GC3<sub>s  </sub>&#8211; Figure  <figr fid="F4">4C</figr>) argues against selection for an alternative set of optimal codons in these genes. Furthermore, the deviating GC3<sub>s </sub>values in these genes are probably not due to recent introductions into the <it>S. salmonicida </it>genome from heterogeneous sources by lateral gene transfer (LGT). Although some genes with high GC3<sub>s </sub>values do show indications of gene transfer in the phylogenomic analyses, the majority do not (Figure <figr fid="F4">4A, C</figr>). In fact, many of these genes have homologs in <it>Giardia</it>, indicating that they were present in the common ancestor of the two lineages, strongly suggesting that the deviated GC3<sub>s </sub>and N<sub>c</sub>' values arose during the evolution of diplomonads on the branch leading to <it>S. salmonicida</it>.</p>
            <p>Analyses of the finished contigs also yielded unexpected results; the base compositional bias in segments of the <it>S. salmonicida </it>genome seems to be markedly towards G+C, while the largest part of the genome shows a compositional bias towards A+T (Figure <figr fid="F1">1</figr>). This pattern is in contrast with the A+T rich genomes of <it>D. discoideum</it>, <it>E. histolytica</it>, and <it>Plasmodium falciparum</it>, which show a relatively uniform nucleotide composition across all chromosomal regions <abbrgrp><abbr bid="B76">76</abbr><abbr bid="B77">77</abbr></abbrgrp>. The genes with deviating G+C content are correlated with these genomic regions of high G+C content (Figure <figr fid="F1">1</figr>). Furthermore, genes in G+C rich regions have higher GC3<sub>s </sub>values than the average G+C content for the genes (their bars are located above the sliding window analysis in Figure <figr fid="F1">1</figr>). Conversely, as expected, genes in G+C poor regions have low GC3<sub>s </sub>values. Thus, genes with unexpected codon usage (i.e. high GC3<sub>s </sub>values) are located in specific regions of the genome. However, neither mutational or selection scenarios can easily explain their non-random codon usage, nor the fluctuations in G+C content along the genome. Heterogeneity in overall G+C content (and/or GC3s) across the genome has been also observed in <it>Saccharomyces cerevisiae </it><abbrgrp><abbr bid="B78">78</abbr></abbrgrp> and in vertebrate genomes (e.g. isochores) <abbrgrp><abbr bid="B79">79</abbr></abbrgrp>. For <it>S. cerevisiae </it>(a unicellular eukaryote with a compact genome, that is more directly comparable to <it>S. salmonicida </it>than vertebrates) a number of possible explanations have been advanced such as regional variation in propensities for mutation or recombination and partitioning of the genome into "distinct replicational and transcriptional domains" during specific cell cycle phases that may experience different chemical environments [see <abbrgrp><abbr bid="B78">78</abbr></abbrgrp> and references therein]. Longer genomic fragments, as well as comparative data from more-closely related diplomonads, will be needed to characterize the pattern further in <it>S. salmonicida </it>and to tease apart possible causes for this peculiar phenomenon.</p>
         </sec>
         <sec>
            <st>
               <p>Phylogenomic analysis reveals frequent lateral gene transfer</p>
            </st>
            <p>We and others have previously studied the occurrence of LGT in diplomonads on a single-gene basis <abbrgrp><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr><abbr bid="B29">29</abbr><abbr bid="B30">30</abbr><abbr bid="B31">31</abbr></abbrgrp>, <abbrgrp><abbr bid="B80">80</abbr><abbr bid="B81">81</abbr><abbr bid="B82">82</abbr></abbrgrp>. Here we present a systematic phylogenomic analysis of the complete EST and GSS data sets with the goal of identifying <it>S. salmonicida </it>genes that have been involved in LGT. We used the PhyloGenie package <abbrgrp><abbr bid="B83">83</abbr></abbrgrp> to assemble aligned amino acid data sets automatically from databases including both published sequences and data from ongoing eukaryotic genome projects (see Methods). Among the 711 genes with three or more identified homologs for which more than 100 amino acid positions could be aligned, 84 were retained as genes putatively involved in LGT affecting the <it>S. salmonicida </it>lineage, on the basis of unexpected phylogenetic positions (Figure <figr fid="F5">5</figr>, Additional files <supplr sid="S3">3</supplr>, <supplr sid="S4">4</supplr>, <supplr sid="S5">5</supplr>, <supplr sid="S6">6</supplr>). Cases where two <it>S. salmonicida </it>genes branched as a monophyletic group in the phylogenetic tree to the exclusion of other sequence were interpreted as gene duplication event after the gene transfer. Taking this into account, the 84 genes putatively involved in LGT corresponded to 68 unique gene transfer events at most; multiple genes may indeed have been introduced in a single event in some cases.</p>
            <fig id="F5">
               <title>
                  <p>Figure 5</p>
               </title>
               <caption>
                  <p>Phylogenetic trees of five <it>S. salmonicida </it>genes from the phylogenomic analysis</p>
               </caption>
               <text>
                  <p><b>Phylogenetic trees of five <it>S. salmonicida </it>genes from the phylogenomic analysis</b>. ML tree of conceptually translated, aligned amino acid positions of (A) arginine deiminase, (B) conserved hypothetical protein, (C) conserved hypothetical protein, (D) carotenoid isomerase, and (E) rubrerythrin. Bootstrap support values > 50% are shown. Details about the phylogenetic analyses are found in the Methods section, and complete accession numbers and complete species names are found in Additional files <supplr sid="S4">4</supplr> and <supplr sid="S6">6</supplr>. The unrooted trees are arbitrarily rooted for the presentation. The branches and species names are labeled according to their phylogenetic classification: Archaea (red), proteobacteria (grey), low G+C Gram positives (blue), cyanobacteria (green), and other eubacterial lineages (black). Eukaryotes are in boldface and labeled according to their classification into super-groups [18]: Opisthokonta (orange), Amoebozoa (purple), Chromalveolata (red), Archaeplastida (green), and Excavata (brown).</p>
               </text>
               <graphic file="1471-2164-8-51-5"/>
            </fig>
            <suppl id="S3">
               <title>
                  <p>Additional file 3</p>
               </title>
               <text>
                  <p>A table showing the genes putatively involved in LGT events.</p>
               </text>
               <file name="1471-2164-8-51-S3.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S4">
               <title>
                  <p>Additional file 4</p>
               </title>
               <text>
                  <p>Phylogenetic trees 1&#8211;25 for genes putatively involved in LGT events and listed in Additional file 3.</p>
               </text>
               <file name="1471-2164-8-51-S4.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S5">
               <title>
                  <p>Additional file 5</p>
               </title>
               <text>
                  <p>Phylogenetic trees 26&#8211;50 for genes putatively involved in LGT events and listed in Additional file 3.</p>
               </text>
               <file name="1471-2164-8-51-S5.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S6">
               <title>
                  <p>Additional file 6</p>
               </title>
               <text>
                  <p>Phylogenetic trees 51&#8211;72 for genes putatively involved in LGT events and listed in Additional file 3.</p>
               </text>
               <file name="1471-2164-8-51-S6.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>In principle, contamination in our libraries could falsely indicate a pattern of frequent gene transfer affecting the <it>S. salmonicida </it>genome. However, we strongly believe this not to be case. 57 of the 84 putatively transferred genes formed a monophyletic group with <it>G. lamblia </it>homologs in the phylogenetic analyses indicating that these genes were present in the common ancestor of the two species (Additional Files <supplr sid="S3">3</supplr>, <supplr sid="S4">4</supplr>, <supplr sid="S5">5</supplr>, <supplr sid="S6">6</supplr>). Furthermore, on average five in-frame UAG and UAA sense codons (which are termination codons in all characterized prokaryotes <abbrgrp><abbr bid="B84">84</abbr></abbrgrp>) were detected in 21 of the remaining 27 putatively transferred genes, strongly suggesting a true <it>S. salmonicida </it>origin also for these genes. Four of the six genes without UAG or UAA codons formed a monophyletic group with a <it>S. salmonicida </it>gene which does utilize such codons, indicating a likely origin by gene duplication. We cannot formally exclude contamination on the basis of presence of alternative codons for the remaining two sequences (gTor1213bT7 and gZap260bT7, trees #59 and #64 in Additional file <supplr sid="S6">6</supplr>), but notice that the absence of in-frame UAG and UAA codons in these genes could likely be due to a recent introduction from a donor utilizing the canonical genetic code. At any rate, together these observations indicate that the phylogenetic pattern we interpret as putative LGT events are unlikely to result from substantial contamination of our libraries.</p>
            <p>The strength and type of support for the inferred gene transfer events varied between genes in the phylogenomic analysis. Some <it>Spironucleus </it>genes were strongly associated with genes from distantly related organisms. For example, the <it>S. salmonicida </it>carotenoid isomerases were found to be nested within proteobacterial sequences (Figure <figr fid="F5">5D</figr>). Such anomalous positions of the diplomonads genes strongly suggest gene transfer events. Many datasets contain sequences from only one or a few eukaryotic taxa other than diplomonads (Figure <figr fid="F5">5A, C, E</figr>), and in some, diplomonads are the only eukaryotes present (Figure <figr fid="F5">5B&#8211;D</figr>). Although the separation of diplomonad from the other eukaryotic sequences is sometimes weak (i.e. Figure <figr fid="F5">5E</figr>), we suggest that LGT is a more likely explanation for their origin than differential gene losses and/or phylogenetic artefacts, as we have argued previously for genes with a patchy phylogenetic distribution among eukaryotes <abbrgrp><abbr bid="B80">80</abbr></abbrgrp>.</p>
            <p>There are indeed examples of inferences of LGT based on unexpected patterns of phyletic distribution that have previously been shown to be wrong. Re-analyses of the putative bacteria-to-vertebrate gene transfer events in the human genome using phylogenetic analyses instead of similarity searches showed that more parsimonious alternative explanations existed for the vast majority, if not all, of the reported cases <abbrgrp><abbr bid="B85">85</abbr></abbrgrp>. Phylogenetic analyses may also lead to false positive interpretations of LGT. For example, phylogenetic analysis indicated an LGT origin of the <it>T. vaginalis </it>hydrogenosomal NuoF protein distinct from the mitochondrial homologs <abbrgrp><abbr bid="B86">86</abbr></abbrgrp>, a conclusion shown likely to be incorrect upon re-analysis using more realistic models of sequence evolution <abbrgrp><abbr bid="B87">87</abbr></abbrgrp>. On the other hand, re-analyses using extended taxon sampling and more advanced models of sequence evolution of four genes putatively affected by prokaryote-to-protist LGT resulted in support for a larger number of inter-domain gene transfer events, rather than a fewer number as expected if differential gene loss, and/or phylogenetic artefacts caused the initial indications of gene transfer <abbrgrp><abbr bid="B30">30</abbr><abbr bid="B80">80</abbr></abbrgrp>. Obviously, inferences about LGT from the phylogenetic analyses depend on the accuracy of the phylogenetic method, as well as on the breadth of organismal representation in sequence databases. Therefore, it is inevitable that the list of putative LGTs will include both false positives and false negatives (Additional files <supplr sid="S3">3</supplr>, <supplr sid="S4">4</supplr>, <supplr sid="S5">5</supplr>, <supplr sid="S6">6</supplr>). Nevertheless, our phylogenomic analysis indicates that vertical inheritance combined with gene duplication and gene loss is rather unlikely to have produced the observed phylogenetic relationships and patchy taxonomic distributions and that gene transfer is the simplest hypothesis currently available to explain these trees. Hence our analyses indicate that LGT has been an important mechanism in the evolution of the <it>S. salmonicida </it>genome.</p>
         </sec>
         <sec>
            <st>
               <p>Acquisitions of prokaryotic metabolic genes in the evolution of protist genomes</p>
            </st>
            <p>The vast majority of genes inferred to be involved in gene-transfer events are metabolic genes (74%) or encode conserved hypothetical proteins (20%) (Additional file <supplr sid="S3">3</supplr>). This bias is not unexpected, as a higher rate of transfer for metabolic genes compared to informational genes has been observed for prokaryotes <abbrgrp><abbr bid="B88">88</abbr><abbr bid="B89">89</abbr></abbrgrp> and, on a smaller scale, in diplomonads <abbrgrp><abbr bid="B30">30</abbr></abbrgrp> and <it>E. histolytica </it><abbrgrp><abbr bid="B51">51</abbr></abbrgrp>. In the latter study it was suggested that this protist parasite had expanded its metabolic repertoire via gene acquisitions from prokaryotes present in the environment, and the same may apply for <it>S. salmonicida</it>. For example, amino acids have been identified to be a source of energy in diplomonads via the arginine dihydrolase pathway <abbrgrp><abbr bid="B2">2</abbr></abbrgrp> especially under limited oxygen conditions <abbrgrp><abbr bid="B90">90</abbr></abbrgrp>. Among eukaryotes, this pathway has been detected only in <it>Trichomonas </it>and diplomonads. The genes for two enzymes in the pathway, arginine deiminase and ornithine transcarbamoylase, appear to have been acquired from prokaryotes in a common ancestor of diplomonads and parabasalids, whereas carbamate kinase may have distinct LGT origins in the two groups (Figure <figr fid="F5">5A</figr> and trees #10 and #30 in Additional file <supplr sid="S4">4</supplr>). Similarly, <it>S. salmonicida </it>encodes rubrerythrins and A-type flavoproteins, proteins putatively involved in the protection against the host's defense (see above) <abbrgrp><abbr bid="B62">62</abbr><abbr bid="B64">64</abbr><abbr bid="B65">65</abbr></abbrgrp> that are also found in anaerobic prokaryotes and eukaryotes including <it>Entamoeba </it>(Figure <figr fid="F5">5E</figr> and Additional files <supplr sid="S3">3</supplr>, <supplr sid="S4">4</supplr>, <supplr sid="S5">5</supplr>, <supplr sid="S6">6</supplr>) <abbrgrp><abbr bid="B51">51</abbr><abbr bid="B80">80</abbr></abbrgrp>. The phylogenetic distributions of these genes suggest a role related to an anaerobic lifestyle, consistent with the hypothesis that these acquisitions provided metabolic advantages to the recipient protist lineages. Indeed, distantly related lineages that live in the same environment appear to frequently transfer genes <abbrgrp><abbr bid="B89">89</abbr></abbrgrp>. Increased taxon sampling and more detailed studies of the ecology and metabolism/biochemistry of the organisms represented by sequences in our trees will likely recognize shared environments between the donor and recipient lineages for additional acquired metabolic genes (Additional file <supplr sid="S3">3</supplr>).</p>
         </sec>
         <sec>
            <st>
               <p>Continuous exchange of genes with all domains of life</p>
            </st>
            <p>In this study we have identified 84 genes of putatively lateral origin, and in previous phylogenomic studies 96 <it>E. histoytica </it>genes, almost 50 kinetoplastid genes, 24 in <it>Cryptosporidium parvum </it>and 148 genes in anaerobic ciliates were found to represent candidate LGT genes <abbrgrp><abbr bid="B51">51</abbr><abbr bid="B55">55</abbr><abbr bid="B91">91</abbr><abbr bid="B92">92</abbr></abbrgrp>. Thus, numerous inter-domain gene transfer events have been identified in four divergent protist lineages &#8211; <it>Spironucleus</it>, <it>Entamoeba</it>, kinetoplastids (<it>Trypanosoma </it>and <it>Leishmania</it>) and anaerobic ciliates &#8211; supporting the idea that gene acquisition from prokaryotic organisms is a common evolutionary mechanism in unicellular eukaryotes <abbrgrp><abbr bid="B22">22</abbr><abbr bid="B93">93</abbr><abbr bid="B94">94</abbr><abbr bid="B95">95</abbr></abbrgrp>. In all these studies, metabolic genes have been found to be the most common functional category among the genes implicated in LGT genes. This observation, which is consistent with the complexity hypothesis <abbrgrp><abbr bid="B88">88</abbr></abbrgrp>, could indicate that metabolic adaptation is a selective force for inter-domain gene transfer events from prokaryotes to protists <abbrgrp><abbr bid="B96">96</abbr><abbr bid="B97">97</abbr></abbrgrp>.</p>
            <p><it>G. lamblia </it>homologs that form clades with the <it>S. salmonicida </it>sequences were found in 49 of the 68 putative LGT events, while no closely related <it>G. lamblia </it>homologs were found in the remaining 19 cases (Figure <figr fid="F5">5</figr> and Additional file <supplr sid="S3">3</supplr>). Thus, at least 72% of the putative LGT events happened before the divergence of the <it>Spironucleus </it>and <it>Giardia </it>lineages. The remaining 19 events could have taken place in the <it>S. salmonicida </it>lineage after the divergence from the lineage leading to <it>G. lamblia</it>, although gene losses in the latter could also explain the observed pattern. If these represented relatively recent gene transfers, they should show a codon-usage pattern distinct from that of other <it>S. salmonicida </it>genes. Some in fact do show deviant codon usage indices (Figure <figr fid="F5">5A, B</figr>) suggesting a more recent acquisition compared to the other cases. However, there are many other <it>S. salmonicida </it>genes with deviant codon usage that do not show any indication of LGT (Figure <figr fid="F4">4A, B</figr>), suggesting that codon usage pattern alone is a poor indicator of LGT in <it>S. salmonicida</it>, as shown in other systems <abbrgrp><abbr bid="B98">98</abbr></abbrgrp>. In 12 cases where both <it>Spironucleus </it>and <it>Giardia </it>sequences are present, <it>T. vaginalis </it>sequences are found as a sister group to the diplomonad cluster. This pattern has previously been observed for candidate laterally transferred genes <abbrgrp><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr><abbr bid="B80">80</abbr></abbrgrp> and almost certainly reflects a common ancestry of diplomonads and parabasalids to the exclusion of other sampled eukaryotic lineages, although the possibility of gene transfer between the two lineages cannot be formally excluded. However, a diplomonad-parabasalia relationship has recently been shown to be robust in several phylogenetic analyses of concatenated protein sequences <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr><abbr bid="B15">15</abbr></abbrgrp>. As some acquired genes are unique to <it>S. salmonicida</it>, others shared with <it>G. lamblia</it>, and some are also shared with <it>T. vaginalis</it>, this strongly suggests that genes have been acquired by LGT in these excavate lineages continuously throughout their evolutionary history. Further characterization of the phylogenetic distribution of these genes may provide information about organismal relationships within Excavata <abbrgrp><abbr bid="B99">99</abbr></abbrgrp>.</p>
            <p>In the four previous phylogenomic studies of LGT in protists <abbrgrp><abbr bid="B51">51</abbr><abbr bid="B55">55</abbr><abbr bid="B91">91</abbr><abbr bid="B92">92</abbr></abbrgrp> only prokaryote-to-eukaryote transfer events were examined. Our selection procedure allowed us to detect additional evolutionary scenarios where a prokaryotic gene is transferred to a eukaryote, and then possibly further transferred to a second eukaryotic lineage. For example, the arginine deaminase gene was likely acquired from a prokaryote by an ancestor of diplomonads and parabasalids, and then transferred to the lineage leading to <it>Dictyostelium </it>(Figure <figr fid="F5">5A</figr>). Seventeen genes were putatively affected by intra-domain LGT, corresponding to 13 unique events (Additional file <supplr sid="S3">3</supplr>). Twelve of these cases are exchanges between the lineage leading to <it>S. salmonicida </it>and amoebozoan lineages; five cases involve gene exchange with the <it>Dictyostelium </it>lineage, six cases with the <it>Entamoeba </it>lineage, and a single case with the <it>Mastigamoeba </it>lineage (Figure <figr fid="F5">5A</figr>, Additional files <supplr sid="S3">3</supplr>, <supplr sid="S4">4</supplr>, <supplr sid="S5">5</supplr>, <supplr sid="S6">6</supplr>). In sharp contrast, only a single intra-domain gene transfer event representing other eukaryotes was detected, although opisthokonts are comparatively well sampled with genome sequences, and several diverse and complete, or nearly complete, chromalveolate sequences were present in our data sets (Additional files <supplr sid="S3">3</supplr>, <supplr sid="S4">4</supplr>, <supplr sid="S5">5</supplr>, <supplr sid="S6">6</supplr>). It is noteworthy that only genes that have been acquired from prokaryotes and have subsequently been transferred within the eukaryotic domain will be detected using our selection procedure. Additional eukaryote-to-eukaryote transfers may actually have occurred among the genes that did not show any indication of prokaryote-to-eukaryote transfer. A few examples of gene transfers between unicellular eukaryotic organisms have indeed been published recently <abbrgrp><abbr bid="B22">22</abbr><abbr bid="B80">80</abbr><abbr bid="B100">100</abbr><abbr bid="B101">101</abbr></abbrgrp>. The 13 putative intra-domain transfers identified here further suggest that LGT between protists is an evolutionary mechanism that should not be neglected.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>The vast majority of eukaryotic diversity is represented by protists <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>, yet only a few protist genome sequencing projects have been published. Our sequence survey study has indicated that a combined approach using both random sampling from the genome (GSSs) and ESTs is successful in identifying genes (Table <tblr tid="T1">1</tblr>). We identified 817 genes from the GSS sequences, while 473 genes with homologies in other organisms were detected among the EST sequences. As we have collected more than twice as many GSS as EST sequences, EST sequencing would appear to be slightly more effective for gene discovery, if only quantity is considered, as expected. However, EST sequencing is biased towards identification of highly expressed genes, such as genes involved in genetic information processing, especially translation, while GSS sequencing detects a more random selection of genes (Table <tblr tid="T1">1</tblr>). This functional bias of the genes detected in EST surveys may be an advantage if the objective of the study is mainly to identify genes previously identified in other organisms using the same approach, but is a limitation if sampling gene diversity is the aim.</p>
         <p>We found that a combined approach of both GSS and EST sequencing can be successful in detecting both highly expressed (and probably also often widely distributed) genes and a more diverse gene set. In combination with complete sequencing of a few contigs, this approach was efficient in revealing much about the <it>S. salmonicida </it>genome. Although we could identify more than 600 genes with annotated functions, conserved hypothetical proteins still represent the largest category (Table <tblr tid="T1">1</tblr>), indicating that the genes with annotated functions give only a partial picture of the true coding potential. Furthermore, 13 among the 38 genes identified within the contigs did not show any significant sequence similarity to genes in the databases, and 81% and 45% of the GSS and EST sequences, respectively, failed to show significant similarity to any known genes. This suggests that a large fraction of the genes in <it>S. salmonicida </it>genome lack sequence similarity to known genes, despite the fact that a nearly complete <it>G. lamblia </it>gene complement is included in the public database. Thus, the <it>S. salmonicida </it>genome has a significant, and mostly unknown, coding potential. Still, the analyses of the genes that could be annotated not only identified individual <it>S. salmonicida </it>genes and metabolic pathways that provided insight into the biology and evolution of the organism. In addition, these analyses revealed several lineage-specific properties suggestive of a large genomic diversity between <it>S. salmonicida </it>and other studied eukaryotes, including its closest intensively studied relative, the diplomonad <it>G. lamblia</it>.</p>
         <p>Our analyses indeed indicate that diplomonad genomes are diverse. For example, in the <it>S. salmonicida </it>genome we identified gene acquisitions, a base compositional bias that varies along the genome, a codon usage distinct from that of <it>G. lamblia</it>, and differences in basic molecular biological processes such as polyadenylation. <it>G. lamblia </it>and <it>S. salmonicida </it>represent only two species within diplomonads, a paraphyletic group which may also include enteromonads and retortamonads, organisms with distinct morphological features <abbrgrp><abbr bid="B23">23</abbr><abbr bid="B24">24</abbr><abbr bid="B102">102</abbr></abbrgrp>. The understanding of these interesting groups of protists is very limited on the genomic level, and the genome projects of <it>G. lamblia </it><abbrgrp><abbr bid="B103">103</abbr></abbrgrp> and <it>Spironucleus vortens </it><abbrgrp><abbr bid="B104">104</abbr></abbrgrp>, another fish pathogen, will make major contributions. Still, diplomonads are very diverse, as manifested by a large degree of sequence divergence between members of the group, and, as indicated here, large variation in the genomic structure and content. Circumstantial evidence for a relatively small genome (see above), together with an overall G+C content of 36% and a low frequency of repeats, makes <it>S. salmonicida </it>an ideal candidate for a whole-genome sequencing project. Such an effort would yield further insights into the parasitic lifestyle of this organism, the fascinatingly diverse biology of diplomonads, and expand our appreciation of genome diversity and evolution among eukaryotes.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <sec>
            <st>
               <p>Sources of RNA and DNA, library construction, and sequencing</p>
            </st>
            <p><it>S. salmonicida </it>(ATCC 50380) <abbrgrp><abbr bid="B6">6</abbr></abbrgrp> (previously known as <it>S. barkhanus </it><abbrgrp><abbr bid="B5">5</abbr><abbr bid="B105">105</abbr></abbrgrp>) was grown in axenic culture following the ATCC protocol. Messenger RNA from approximately 10<sup>8 </sup>cells of <it>S. salmonicida </it>was isolated using the Dynabead mRNA system (Dynal), and cDNA was synthesized and cloned into the lambda Uni-Zap XR vector (Stratagene), according to the manufacturer's instructions. This procedure requires that the polyA tail is present in the mRNA to be cloned. Infection of SolR cells was carried out and plated on selective LB media containing carbenicillin, isopropyl &#946;-D-1-thiogalactopyranoside (IPTG) and 5-bromo-4-chloro-3-indolyl-beta-D-galactopyranoside (X-gal) for blue/white selection. Positive colonies were picked manually and plasmid DNA was purified using Perfectprep Plasmid Isolation Kit with the Perfectprep Plasmid 96 Vac system (Eppendorf). The DNA was quantified by electrophoresis on a 1% agarose gel. Sequencing was carried out on an ABI 377 (Applied Biosystems) using the ABI Big Dye Terminator Cycle Sequencing Ready Reaction Kit (Applied Biosystems) and the SK primer.</p>
            <p>Genomic DNA was purified using standard protocols. A genomic DNA library was constructed for GSS sequencing. The DNA was partially digested using <it>Sau</it>3AI and ligated to lambda Zap Express vector pre-digested with <it>BamH</it>I (Stratagene) according to the instructions. Mass <it>in vivo </it>excision of the pBK-CMV phagemid from the Zap Express vector was performed using XL-1 Blue MRF' cells and ExAssist phage with the XLOLR strain, and the cells were plated on LB with kanamycin, IPTG and X-gal for blue/white selection. Cells were picked and the plasmids were purified and sequenced as described above using the T3 and T7 primers. Roughly half of the sequencing was done from this library. However, since it was revealed that the insert sizes of this library were too short for efficient random sequencing, a second GSS library was constructed using 20 &#956;g genomic DNA. The DNA was physically sheared using a nebulizer, blunt ended, ligated to the insert DNA and cloned into plasmid vectors using the TOPO Shotgun Subcloning Kit (Invitrogen). One Shot chemically competent cells (Invitrogen) were transformed with an aliquot of the ligation mix and spread on LB plates containing kanamycin and X-gal for blue/white selection. Positive clones were manually picked and plasmids were purified using 96-well Plasmid Preparation Kit (Millipore). The plasmids were quantified and sequenced as described above using T3 and T7 primers.</p>
            <p>Finally, <it>S. salmonicida </it>DNA was partially digested with <it>Bam</it>HI and cloned into the lambda DASHII vector (Stratagene) according to the manufacturer's instructions, to make a library with larger inserts (8&#8211;28 kbp). The library was grown in MRA cells and spread on eight 150-mm plates each containing approximately 70,000 plaques. Three plaques were purified and the inserts were amplified by PCR, nebulized and the fragments were shotgun cloned into puc18 <it>Sma</it>I/BPA plasmids (Amersham Pharmacia). The ligations were transformed into XL2-Blue MRF' ultracompetent cells. Plasmids were purified and sequenced as described above using M13f and M13r primers.</p>
         </sec>
         <sec>
            <st>
               <p>Sequence analysis</p>
            </st>
            <p>Sequencing reactions were initially screened manually for exclusion of unsuccessful reactions. Sequences from 2408, 3204 and 3684 clones from the Uni-Zap XR EST, the Zap Express GSS and TOPO Shotgun Subcloning GSS libraries, respectively, passed this initial screen. The average read lengths of these were 540, 399 and 366 bp, respectively.</p>
            <p>The 2408 EST sequences were screened against the vector sequences and the <it>Escherichia coli </it>genome sequence using the Phred software <abbrgrp><abbr bid="B106">106</abbr></abbrgrp> to check for contamination of DNA from the library host, and clustered using the Phrap assembler <abbrgrp><abbr bid="B106">106</abbr></abbrgrp> with the default settings. The contigs were quality trimmed manually, while the singletons were trimmed using the Phred software <abbrgrp><abbr bid="B106">106</abbr></abbrgrp> with the default quality cut-off. Hybrid clones were identified as containing stretches of nine or more As within the insert, and only the 5' end of the hybrid was retained. 27 clones with inserts in the opposite direction were identified as starting with a stretch of Ts (15), or as having significant matches in the wrong direction to known genes (12); these were reversed. Finally, nine EST sequences were trimmed according to putative frame-shifts detected in similarity searches. After removal of contigs shorter than 100 bases 884 sequences (298 contigs and 586 singletons) corresponding to 502589 unique bp and based on 2341 clones remained for further analysis. 20 and 11 of these overlapped with published genes or genes from the finished contigs (see below), respectively, and were excluded, leaving 853 ESTs for further analyses.</p>
            <p>300 ESTs ended with a stretch of eight or more As, indicative of mRNA polyadenylation, were identified. Of these, 134 were annotated as coding based on sequence similarity to genes in the databases (see below). The region around the 3' end of the gene was aligned based on the position of the termination codons (UGA), and a sequence logo was created using WebLogo <abbrgrp><abbr bid="B107">107</abbr></abbrgrp>.</p>
            <p>The 6888 GSS sequences were trimmed using the Phred software <abbrgrp><abbr bid="B106">106</abbr></abbrgrp> with the default quality cut-off, and the vector sequences were masked and removed. All sequences were screened against the <it>E. coli </it>genome sequence. The 5275 GSS chromatograms that passed this screen (no host contamination was detected), and represented sequences longer than 100 bp, were included in the assembly. The average read lengths of the clones from the Zap Express GSS and TOPO Shotgun Subcloning GSS libraries that passed this screening were 543 and 472 bp, respectively. The Phrap assembler was used with the default settings, yielding 1008 contigs consisting of two or more sequences and 2208 singletons. Some of the longer contigs were selected for complete sequencing. Regions that required additional sequencing were identified within these contigs, and amplified from genomic DNA using PCR with primers designed based on the GSS assembled sequence. The PCR was performed under standard conditions using the following parameters: denaturing at 95&#176;C for 5 min, followed by forty cycles of denaturing at 94&#176;C for 30 s, annealing at 48&#176;C for 1 min, and extension at 72&#176;C for 2 min, and a final extension at 72&#176;C for 10 min. To extend the contigs, sequence gaps covered by clones were identified and amplified using PCR with specific primers based on the obtained shotgun sequences. The PCR products were purified using the Qiaquick PCR Purification Kit (Qiagen) and sequenced using the PCR primers as described above. This procedure resulted in eight continuous stretches of genomic sequence between 2365 and 9005 bp in length. Together with the three sequenced lambda clones these yielded 80504 bp of finished genomic sequence in eleven contigs which were covered by at least one-fold high quality sequence in each direction (Additional file <supplr sid="S1">1</supplr>). 205 of the 5275 GSS sequences overlapped with the completely sequence contigs and were excluded from further analysis. The remaining 5070 sequences were treated as single reads, and covered 2539160 bp of non-unique sequence after quality trimming.</p>
            <p>To estimate the amount of unique high-quality sequence within our survey project, we performed assemblies with only the quality trimmed sequence using the Staden package <abbrgrp><abbr bid="B108">108</abbr></abbrgrp>. The 5275 GSS clones yielded 2070953 bp in 3566 contigs with one or more sequences, and the addition of the EST clones gave 2549915 bp of unique high-quality sequence. Lander and Waterman proposed that the number of "islands" (E) in a genomic project with perfectly representative libraries with equal length of clones (sequences) is E = Ne<sup>-c&#963; </sup><abbrgrp><abbr bid="B109">109</abbr></abbrgrp>, where N is the number of clones sampled, c is the redundancy of coverage = LN/G, &#963; = 1 - T/L, L is the clone length (500.8 bp in our case), G is the haploid genome size in bp, and T is the amount of overlap in bp needed to detect overlap (20 bp). G is the only unknown parameter, and the equation can be solved: G = N(L-T)/ln(N/E). Using the information from our assembly (N = 5275; L = 500.8 bp; T = 20 bp; E = 3566), the genome of <it>S. salmonicida </it>was estimated to be 6.5 Mbp in size.</p>
         </sec>
         <sec>
            <st>
               <p>Databases</p>
            </st>
            <p>All databases used in the analyses were downloaded in January 2005. In addition to the non-redundant protein database downloaded from the National Center for Biotechnology Information (NCBI) <abbrgrp><abbr bid="B110">110</abbr></abbrgrp>, protein databases from various nearly completed genome sequencing projects of diverse eukaryotes were downloaded: <it>T. vaginalis </it>(parabasalid), <it>Tetrahymena thermophila </it>(ciliate), <it>Trypanosoma brucei</it>, and <it>Trypanosoma cruzi </it>(kinetoplastids) from the Institute for Genomic Research (TIGR) <abbrgrp><abbr bid="B111">111</abbr></abbrgrp>; <it>Dictyostelium discoideum </it>(mycetozoan) from dictyBase <abbrgrp><abbr bid="B112">112</abbr></abbrgrp>; <it>Chlamydomonas reinhardtii </it>(green alga), <it>Phytophthora sojae </it>(oomycete), and <it>Thalassiosira pseudonana </it>(diatom) from the DOE Joint Genome Institute (JGI) <abbrgrp><abbr bid="B104">104</abbr></abbrgrp>. The Kyoto Encyclopedia of Genes and Genomes (KEGG) databases were downloaded from the Kyoto University Bioinformatics Center <abbrgrp><abbr bid="B113">113</abbr></abbrgrp> for functional annotation purposes.</p>
         </sec>
         <sec>
            <st>
               <p>Gene identification</p>
            </st>
            <p>Various approaches were used to identify coding genes among the sequences. Similarity searches using BLASTx, version 2.2.13 <abbrgrp><abbr bid="B114">114</abbr></abbrgrp>, with the default settings with the nucleotide sequences from the single-read GSS and the EST contigs against the amino acid sequence databases were performed. 1179 single-read GSS sequences and 502 EST contigs yielded matches with E values better than e<sup>-5</sup>, which were considered a significant indication of a coding sequence. Using the indication of the frame and direction from the alignment between the query and database sequence in the BLAST result files, the putative coding DNA and amino acid sequences were extracted from these sequences. The 3891 single-read GSS sequences and 380 EST contigs that failed to yield a match better than e<sup>-5 </sup>were not analyzed further.</p>
            <p>To identify coding sequences in the finished contigs, similarity searches against the amino acid sequence databases and the EST sequences were performed using the same cutoff as above. Similarity searches on the nucleotide level against the non-redundant nucleotide databases were performed at NCBI to identify non-protein coding sequences. Finally, open reading frames longer than 450 bp with the expected GC pattern in the three coding positions were annotated as putatively coding and included in subsequent analyses. This procedure identified 38 protein-coding genes in the eleven finished contigs.</p>
            <p>tRNA genes were detected using two programs: tRNAscanSE version 1.23 <abbrgrp><abbr bid="B115">115</abbr></abbrgrp> with the maximum sensitivity (-C option), and ARAGORN version 1.1 <abbrgrp><abbr bid="B116">116</abbr></abbrgrp> with the default parameters. 20 tRNA genes were identified with both methods, all within GSS clones. For 19 of these, both programs assigned the same anticodon, while one differed in anticodon identity (see Results). Two tRNAs were found to encode putative introns. No tmRNA was found. Finally, similarity searches at the nucleotide level identified two genes encoding ribosomal RNA within one of the finished contigs.</p>
         </sec>
         <sec>
            <st>
               <p>Creation of a non-redundant dataset of <it>S. salmonicida </it>protein-coding genes</p>
            </st>
            <p>In order to explore the coding potential of <it>S. salmonicida</it>, we created a non-redundant dataset of <it>S. salmonicida </it>genes that contained only the longest amino acid sequence from each gene among the GSS, EST, finished contigs and previously published genes. Three of the 30 previously published genes were represented by long ESTs and were excluded. This procedure resulted in538 unique protein-coding genes. 175 of the 1179 genes identified within the GSSs were excluded because they were represented by longer ESTs or published sequences, while 30 were excluded because the extracted ORF was shorter than 100 bp. Furthermore, 176 of the remaining 974 genes identified within GSS sequences were excluded because they overlapped with a longer identical gene within the GSSs, leaving 798 unique protein coding genes identified within the GSS data. Thus, in total 1335 unique protein-coding genes were identified and included in further analyses.</p>
         </sec>
         <sec>
            <st>
               <p>Codon-usage analysis</p>
            </st>
            <p>1153 of the 1335 unique protein-coding sequences were 300 bp or longer and were included in the codon-usage analysis. Codon-usage indices were calculated for each gene. N<sub>c </sub>is a measure of the effective number of codons used in a gene <abbrgrp><abbr bid="B117">117</abbr></abbrgrp>. A modified version, N<sub>c</sub>', has been developed which also account for the background nucleotide composition of the gene; this is advantageous in situations where the composition varies among the genes analyzed <abbrgrp><abbr bid="B75">75</abbr></abbrgrp>. The N<sub>c</sub>' values were calculated using the software INCA <abbrgrp><abbr bid="B118">118</abbr></abbrgrp>. The GC3<sub>s </sub>values &#8211; the frequency of G+C in synonymously third codon positions (i.e. Met, Trp and termination codons are excluded) &#8211; were calculated using the program CodonW <abbrgrp><abbr bid="B119">119</abbr></abbrgrp>. The variation of codon usage among genes was explored using the correspondence analysis tool within CodonW. To avoid identification of trends in codon usage due to biased amino acid usage among the genes, the correspondence analysis was performed on the relative synonymous codon usage (RSCU) values for each gene. The RSCU value for a codon is the observed frequency divided by the frequency expected if all synonyms codons for that amino acid were used equally. This should remove the effects of amino acid composition on codon usage. RSCU values close to 1 indicate a lack of bias, while much higher and much lower values indicate preference and avoidance of that particular codon, respectively. The correspondence analysis plots genes according to their RSCU values in a 61-dimensional space, and then identifies the major trends as the axes through this multidimensional hyperspace which account for the largest fractions of variation among genes.</p>
            <p>To examine the variation of codon usage within diplomonads, similarity searches of the 1153 <it>S. salmonicida </it>amino acid sequences were performed against the <it>G. lamblia </it>protein sequences. 533 <it>S. salmonicida </it>genes gave matches with E values &lt; e<sup>-20</sup>, corresponding to 438 unique genes. These were considered homologs (not necessarily orthologs) and the nucleotide sequences were obtained for codon-usage analysis as described above.</p>
            <p>The number of times each gene was detected in the EST library was used as an indication of expression level in the cell. 35 genes were represented by more than ten individual EST sequences and were considered highly expressed, while 682 genes were not detected in the EST data and were considered weakly expressed. Codon-usage tables were calculated for each of these groups, both for <it>S. salmonicida </it>and the <it>G. lamblia </it>homologs. <it>G. lamblia </it>genes represented by several <it>S. salmonicida </it>genes were assigned the highest number of ESTs among the genes.</p>
         </sec>
         <sec>
            <st>
               <p>Gene annotation</p>
            </st>
            <p>The Kyoto Encyclopedia of Genes and Genomes (KEGG) project <abbrgrp><abbr bid="B113">113</abbr></abbrgrp>, a bioinformatic knowledge base for systematic analysis of gene functions <abbrgrp><abbr bid="B120">120</abbr></abbrgrp>, was used for gene annotation. The KEGG system links genomic information with higher-order functional information using a system with KEGG Orthology (KO) numbers. Gene sequences in the GENES database, which includes collection of gene catalogs from completely sequenced genomes, are assigned KO numbers which are used to extract higher-order information, such as functional categories and pathways, from the KO database <abbrgrp><abbr bid="B120">120</abbr></abbrgrp>.</p>
            <p>Similarity searches using BLASTx, version 2.2.13 <abbrgrp><abbr bid="B114">114</abbr></abbrgrp>, with the default settings were performed for the 1335 unique <it>S. salmonicida </it>protein-coding genes against the GENES database, using the E value cutoff e<sup>-5</sup>. 249 returned a best match to which a KO -number had been assigned, and an additional 301 had non-best hits with assigned KO numbers. Functional annotations were extracted from the KO database for these 550 genes. However, 27 genes were annotated in the functional category "Human Disease"; five of these could be manually assigned to functional categories, while 22 were classified as conserved hypothetical proteins. Thus, 528 genes could be assigned a function using the KEGG databases. Similarity searches against all databases were performed for the remaining 785 genes, using the E value cutoff e<sup>-20</sup>. 219 of these had matches, 63 of which could be used for functional annotation. No meaningful functional information could be found for remaining 156; these were annotated as conserved hypothetical proteins. In addition, the 553 genes which had best hits with E values between e<sup>-20 </sup>and e<sup>-5 </sup>were annotated as conserved hypothetical proteins, and the remaining 13 genes that did not have any match better than e<sup>-5 </sup>were annotated as hypothetical proteins. To summarize: 591 protein-coding genes could be assigned a putative function, 731 were conserved hypothetical proteins, and 13 hypothetical proteins. The annotations for all proteins mentioned in the text have been refined manually.</p>
            <p>The fraction of cysteine within the conceptually translated amino acid sequences was found to vary considerably between genes. While the majority of genes would encode a protein with cysteine content below 5%, 149 of the 1335 unique genes would encode a protein with more than 10% cysteine. These were annotated as cysteine-rich proteins. 122 are conserved hypothetical proteins, while 27 were assigned to functional categories.</p>
            <p>A data set of 1044 yeast proteins localized in the mitochondrion <abbrgrp><abbr bid="B121">121</abbr></abbrgrp> was used to search against the identified <it>S. salmonicida </it>proteins using BLASTp, version 2.2.13 <abbrgrp><abbr bid="B114">114</abbr></abbrgrp>, with the default settings. The matches with e values below e<sup>-5 </sup>were searched against the total yeast proteome with the same cutoff, which identified 71 reciprocal best matches between the datasets. Based on the quality of the BLASTp hit (or protein length, to short to give any confidence in the identified HSP), phylogenetic trees and functional annotation of BLAST hits, only two entries were considered as strong candidate mitochondrial/mitosomal proteins and one as possible candidate proteins (see main text).</p>
         </sec>
         <sec>
            <st>
               <p>Phylogenomic and phylogenetic analyses</p>
            </st>
            <p>One goal of this project was to identify genes in the <it>S. salmonicida </it>genome that have been affected by LGT. We used phylogenetic analyses to identify gene transfers, as similarity searches are only poor indicators of such events <abbrgrp><abbr bid="B122">122</abbr></abbrgrp>. We used the PhyloGenie package <abbrgrp><abbr bid="B83">83</abbr></abbrgrp> to perform efficient phylogenetic analyses for a large number of genes. It takes amino acid sequences in standard (fasta) format, and performs similarity searches (BLAST) against a protein sequence database consisting of publicly available databases and/or sequence data released from ongoing genome projects. The program uses HMMER <abbrgrp><abbr bid="B123">123</abbr></abbrgrp> to build a Hidden Markov Model (HMM) profile from the alignment in the BLAST result file, and uses it to search the full-length BLAST hits; sequences scoring better than a selected threshold are included in the dataset. Finally, an alignment of these sequences is made using the profile. No attempt was made to exclude putative paralogs from the datasets.</p>
            <p>Cysteine-rich proteins were excluded from the phylogenomic analysis, since they were found to be problematic to align probably due to their frequent possession of highly repetitive sequences. PhyloGenie was run on the 1174 annotated non-cysteine-rich genes with homologs in the databases, using default settings except that coverage of the query sequence compared to the database sequence was not used as a selection criteria (coverage = -1) since coverage is meaningless with partial gene sequences such as EST and GSSs, and the maximum number of sequences in the dataset was set, for practical reasons, to 200 (seqs = 200). Where more than 200 sequences pass the E-value cutoff, the 200 with the lowest E-values in the HMM-based search will be retained. A custom-implemented function (T. Frickey, personal communication) was used that allows for exclusion of similar sequences from the dataset based on the taxonomic level (i.e. only one sequence is retained as a representative of all <it>Bacillus </it>sequences above a set identity). To reduce the size of the dataset as much as possible without losing too much information, an identity cutoff of 80% was used regardless of the taxonomic description in the sequence (taxlevel = 0, maxsim = 0.8).</p>
            <p>These settings yielded 932 datasets with four sequences or more, among which 711 included 100 or more aligned amino acid positions assessed on the <it>S. salmonicida </it>input sequence. Only these were analyzed further, to avoid misleading results based on too-short alignments. A Perl script provided in the PhyloGenie package <abbrgrp><abbr bid="B83">83</abbr></abbrgrp> was modified to use the fast maximum likelihood program PHYML version 2.4.4 <abbrgrp><abbr bid="B124">124</abbr></abbrgrp>. Trees were obtained for each of the 711 datasets using this script and the default PHYML settings, except that the Whelan and Goldman (WAG) substitution model <abbrgrp><abbr bid="B124">124</abbr></abbrgrp> was used together with a mixed four-category discrete-gamma model of among-site rate variation plus invariable sites (WAG + &#915; + Inv).</p>
            <p>The trees were automatically rooted using the approach implemented in Phylogenie; taxonomic information for all sequences in each tree is used to put the root at the most-basal node that is most-distant from the sequence that was used to select the dataset [see Figure 4 in <abbrgrp><abbr bid="B83">83</abbr></abbrgrp> for details]. Phatg, the tree-browsing program within the PhyloGenie package <abbrgrp><abbr bid="B83">83</abbr></abbrgrp>, was used to identify 136 putative cases of LGT among the optimal trees, using the criterion that a diplomonad sequence was required to group with homologs from up to four different non-diplomonad eukaryotes within a prokaryotic clade. Manual inspection of the positive trees excluded from further analysis 31 trees for which the input <it>S. salmonicida </it>sequence failed to show convincing indications of LGT, or the <it>G. lamblia </it>homolog branched with a prokaryotic sequence. Bootstrap analyses were performed for the remaining 105 datasets, using 100 replicates and the methods and settings described above. Visual inspection of the consensus bootstrap trees yielded 84 that showed indications of LGT affecting <it>S. salmonicida</it>. Among these, two appear to be clones derived from different parts of the same <it>S. salmonicida </it>gene, and 14 are part of diplomonad gene clusters which may have formed via gene duplication events after a putative transfer event. Thus, our phylogenomic analysis identified 68 putative LGT events (Additional files <supplr sid="S3">3</supplr>, <supplr sid="S4">4</supplr>, <supplr sid="S5">5</supplr>, <supplr sid="S6">6</supplr>).</p>
         </sec>
         <sec>
            <st>
               <p>Nucleotide sequence accession numbers</p>
            </st>
            <p>The sequences reported here were deposited in GenBank at the National Center for Biotechnology Information [Genbank:<ext-link ext-link-type="gen" ext-link-id="EC585128">EC585128</ext-link>-<ext-link ext-link-type="gen" ext-link-id="EC586011">EC586011</ext-link>, GenBank:<ext-link ext-link-type="gen" ext-link-id="DX913336">DX913336</ext-link>-<ext-link ext-link-type="gen" ext-link-id="DX918405">DX918405</ext-link>, GenBank:<ext-link ext-link-type="gen" ext-link-id="DQ812518">DQ812518</ext-link>-<ext-link ext-link-type="gen" ext-link-id="DQ812528">DQ812528</ext-link>].</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>JOA co-constructed the second GSS library, finished the sequence of seven contigs, carried out the EST and GSS assemblies, all phylogenetic and most bioinformatic analyses, and drafted and coordinated the editing of the manuscript. &#197;MS co-constructed the second GSS library, carried out the majority of the GSS sequencing, and performed initial bioinformatic analyses. DSH grew the organism, purified nucleic acids, constructed the EST library, and carried out some of the initial EST sequencing. CAM constructed the lambda and the initial GSS libraries, carried out the majority of the EST sequencing, the initial GSS sequencing and the sequencing and assembly of three lambda clones. PLD carried out some of the initial EST sequencing. SGS provided advice on the analyses of molecular biological aspects and drafted these parts of the manuscript. RPH performed part of the analyses of cysteine rich and putative mitosomal proteins. JML, MAR, RPH, and AJR co-initiated and supervised the project in their respective laboratories, provided advice on the analyses and edited the manuscript. All authors read and approved the final manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>We thank T. Martin Embley for co-initiating and co-managing the early stages of this project, and Lesley Davis (Dalhousie University) for experimental assistance. The availability of preliminary sequences from the various sequencing centers is greatly acknowledged.</p>
            <p>This work was supported by a Swedish Research Council (VR) Grant awarded to JOA, a Canadian Institutes of Health Research (CIHR) Operating Grant MOP-62809 awarded to AJR, and a Natural Sciences and Engineering Research Council (NSERC) Genomics Project Grant 228263-99. AJR received fellowship support from the Alfred P. Sloan Foundation, and a New Investigator Fellowship from the CIHR/Peter Lougheed Medical Research Foundation, MAR is funded by Australian Research Council grant CE0348221, JML is funded by the Emory University Research Council, and RPH was funded by a Wellcome Trust career Development fellowship (grant #045702) and University Award (grant #060068). This collaboration was sponsored in part by the Canadian Institute for Advanced Research (CIAR), Program in Evolutionary Biology.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Order Diplomonadida</p>
            </title>
            <aug>
               <au>
                  <snm>Brugerolle</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>JJ</fnm>
               </au>
            </aug>
            <source>An Illustrated Guide to the Protozoa, 2nd edn</source>
            <publisher>Lawrence, Kansas , Society of Protozoologists</publisher>
            <editor>Lee JJ, Leedale GF, Bradbury P</editor>
            <pubdate>2002</pubdate>
            <fpage>1125</fpage>
            <lpage>1135</lpage>
         </bibl>
         <bibl id="B2">
            <title>
               <p>Biology of <it>Giardia lamblia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Adam</snm>
                  <fnm>RD</fnm>
               </au>
            </aug>
            <source>Clin Microbiol Rev</source>
            <pubdate>2001</pubdate>
            <volume>14</volume>
            <issue>3</issue>
            <fpage>447</fpage>
            <lpage>475</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">88984</pubid>
                  <pubid idtype="pmpid">11432808</pubid>
                  <pubid idtype="doi">10.1128/CMR.14.3.447-475.2001</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Systemic hexamitid (Protozoa, Diplomonadida) infection in seawater pen-reared Chinook Salmon <it>Oncorhynchus tshawytscha</it></p>
            </title>
            <aug>
               <au>
                  <snm>Kent</snm>
                  <fnm>ML</fnm>
               </au>
               <au>
                  <snm>Ellis</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Fournie</snm>
                  <fnm>JW</fnm>
               </au>
               <au>
                  <snm>Dawe</snm>
                  <fnm>SC</fnm>
               </au>
               <au>
                  <snm>Bagshaw</snm>
                  <fnm>JW</fnm>
               </au>
               <au>
                  <snm>Whitaker</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>Dis Aquat Organ</source>
            <pubdate>1992</pubdate>
            <volume>14</volume>
            <issue>2</issue>
            <fpage>81</fpage>
            <lpage>89</lpage>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Systemic spironucleosis in sea-farmed Atlantic Salmon <it>Salmo salar</it>, caused by <it>Spironucleus barkhanus</it> transmitted from feral Arctic Char <it>Salvelinus alpinus</it>?</p>
            </title>
            <aug>
               <au>
                  <snm>Sterud</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Mo</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Poppe</snm>
                  <fnm>TT</fnm>
               </au>
            </aug>
            <source>Dis Aquat Organ</source>
            <pubdate>1998</pubdate>
            <volume>33</volume>
            <issue>1</issue>
            <fpage>63</fpage>
            <lpage>66</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid">9653460</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Ultrastructure of <it>Spironucleus barkhanus</it> N. Sp. (Diplomonadida: Hexamitidae) from grayling <it>Thymallus thymallus</it> (L.) (Salmonidae) and Atlantic Salmon <it>Salmo salar</it> L. (Salmonidae)</p>
            </title>
            <aug>
               <au>
                  <snm>Sterud</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Mo</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Poppe</snm>
                  <fnm>TT</fnm>
               </au>
            </aug>
            <source>J Eukaryot Microbiol</source>
            <pubdate>1997</pubdate>
            <volume>44</volume>
            <fpage>399</fpage>
            <lpage>407</lpage>
         </bibl>
         <bibl id="B6">
            <title>
               <p>The marine pathogenic genotype of <it>Spironucleus barkhanus</it> from farmed salmonids redescribed as <it>Spironucleus salmonicida</it> n. sp</p>
            </title>
            <aug>
               <au>
                  <snm>J&#248;rgensen</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Sterud</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>J Eukaryot Microbiol</source>
            <pubdate>2006</pubdate>
            <volume>53</volume>
            <issue>6</issue>
            <fpage>531</fpage>
            <lpage>541</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1550-7408.2006.00144.x</pubid>
                  <pubid idtype="pmpid">17123418</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Kingdom protozoa and its 18 phyla</p>
            </title>
            <aug>
               <au>
                  <snm>Cavalier Smith</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Microbiol Rev</source>
            <pubdate>1993</pubdate>
            <volume>57</volume>
            <issue>4</issue>
            <fpage>953</fpage>
            <lpage>994</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">372943</pubid>
                  <pubid idtype="pmpid">8302218</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Phylogenetic meaning of the kingdom concept: an unusual ribosomal RNA from <it>Giardia lamblia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Sogin</snm>
                  <fnm>ML</fnm>
               </au>
               <au>
                  <snm>Gunderson</snm>
                  <fnm>JH</fnm>
               </au>
               <au>
                  <snm>Elwood</snm>
                  <fnm>HJ</fnm>
               </au>
               <au>
                  <snm>Alonso</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Peattie</snm>
                  <fnm>DA</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>1989</pubdate>
            <volume>243</volume>
            <issue>4887</issue>
            <fpage>75</fpage>
            <lpage>77</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.2911720</pubid>
                  <pubid idtype="pmpid">2911720</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>My favorite cell: <it>Giardia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Upcroft</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Upcroft</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Bioessays</source>
            <pubdate>1998</pubdate>
            <volume>20</volume>
            <fpage>256</fpage>
            <lpage>263</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1002/(SICI)1521-1878(199803)20:3&lt;256::AID-BIES9>3.0.CO;2-P</pubid>
                  <pubid idtype="pmpid">9631653</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>Eukaryotic evolution, changes and challenges</p>
            </title>
            <aug>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>Martin</snm>
                  <fnm>W</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2006</pubdate>
            <volume>440</volume>
            <issue>7084</issue>
            <fpage>623</fpage>
            <lpage>630</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature04546</pubid>
                  <pubid idtype="pmpid">16572163</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>The deep roots of eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Baldauf</snm>
                  <fnm>SL</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2003</pubdate>
            <volume>300</volume>
            <issue>5626</issue>
            <fpage>1703</fpage>
            <lpage>1706</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1085544</pubid>
                  <pubid idtype="pmpid">12805537</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>The real 'kingdoms' of eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Simpson</snm>
                  <fnm>AGB</fnm>
               </au>
               <au>
                  <snm>Roger</snm>
                  <fnm>AJ</fnm>
               </au>
            </aug>
            <source>Curr Biol</source>
            <pubdate>2004</pubdate>
            <volume>14</volume>
            <issue>17</issue>
            <fpage>R693</fpage>
            <lpage>6</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.cub.2004.08.038</pubid>
                  <pubid idtype="pmpid">15341755</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Root of the eukaryota tree as inferred from combined maximum likelihood analyses of multiple molecular sequence data</p>
            </title>
            <aug>
               <au>
                  <snm>Arisue</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Hasegawa</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hashimoto</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2005</pubdate>
            <volume>22</volume>
            <issue>3</issue>
            <fpage>409</fpage>
            <lpage>420</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msi023</pubid>
                  <pubid idtype="pmpid">15496553</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Inference of the phylogenetic position of oxymonads based on nine genes: support for Metamonada and Excavata</p>
            </title>
            <aug>
               <au>
                  <snm>Hampl</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Horner</snm>
                  <fnm>DS</fnm>
               </au>
               <au>
                  <snm>Dyal</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Kulda</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Flegr</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Foster</snm>
                  <fnm>PG</fnm>
               </au>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2005</pubdate>
            <volume>22</volume>
            <issue>12</issue>
            <fpage>2508</fpage>
            <lpage>2518</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msi245</pubid>
                  <pubid idtype="pmpid">16120804</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Comprehensive multi-gene phylogenies of excavate protists reveal the evolutionary positions of 'primitive' eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Simpson</snm>
                  <fnm>AGB</fnm>
               </au>
               <au>
                  <snm>Inagaki</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Roger</snm>
                  <fnm>AJ</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2006</pubdate>
            <volume>23</volume>
            <issue>3</issue>
            <fpage>615</fpage>
            <lpage>625</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msj068</pubid>
                  <pubid idtype="pmpid">16308337</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Unique phylogenetic relationship of glucokinase and glucosephosphate isomerase of the amitochondriate eukaryotes <it>Giardia intestinalis</it>, <it>Spironucleus barkhanus</it> and <it>Trichomonas vaginalis</it></p>
            </title>
            <aug>
               <au>
                  <snm>Henze</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Horner</snm>
                  <fnm>DS</fnm>
               </au>
               <au>
                  <snm>Suguri</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Moore</snm>
                  <fnm>DV</fnm>
               </au>
               <au>
                  <snm>S&#225;nchez</snm>
                  <fnm>LB</fnm>
               </au>
               <au>
                  <snm>M&#252;ller</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>2001</pubdate>
            <volume>281</volume>
            <fpage>123</fpage>
            <lpage>131</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0378-1119(01)00773-9</pubid>
                  <pubid idtype="pmpid">11750134</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Gene transfers from Nanoarchaeota to an ancestor of diplomonads and parabasalids</p>
            </title>
            <aug>
               <au>
                  <snm>Andersson</snm>
                  <fnm>JO</fnm>
               </au>
               <au>
                  <snm>Sarchfield</snm>
                  <fnm>SW</fnm>
               </au>
               <au>
                  <snm>Roger</snm>
                  <fnm>AJ</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2005</pubdate>
            <volume>22</volume>
            <issue>1</issue>
            <fpage>85</fpage>
            <lpage>90</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msh254</pubid>
                  <pubid idtype="pmpid">15356278</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>The new higher level classification of eukaryotes with emphasis on the taxonomy of protists</p>
            </title>
            <aug>
               <au>
                  <snm>Adl</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Simpson</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Farmer</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Andersen</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Anderson</snm>
                  <fnm>OR</fnm>
               </au>
               <au>
                  <snm>Barta</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Bowser</snm>
                  <fnm>SS</fnm>
               </au>
               <au>
                  <snm>Brugerolle</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Fensome</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Fredericq</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>James</snm>
                  <fnm>TY</fnm>
               </au>
               <au>
                  <snm>Karpov</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Kugrens</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Krug</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lane</snm>
                  <fnm>CE</fnm>
               </au>
               <au>
                  <snm>Lewis</snm>
                  <fnm>LA</fnm>
               </au>
               <au>
                  <snm>Lodge</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lynn</snm>
                  <fnm>DH</fnm>
               </au>
               <au>
                  <snm>Mann</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>McCourt</snm>
                  <fnm>RM</fnm>
               </au>
               <au>
                  <snm>Mendoza</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Moestrup</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Mozley-Standridge</snm>
                  <fnm>SE</fnm>
               </au>
               <au>
                  <snm>Nerad</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Shearer</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Smirnov</snm>
                  <fnm>AV</fnm>
               </au>
               <au>
                  <snm>Spiegel</snm>
                  <fnm>FW</fnm>
               </au>
               <au>
                  <snm>Taylor</snm>
                  <fnm>MF</fnm>
               </au>
            </aug>
            <source>J Eukaryot Microbiol</source>
            <pubdate>2005</pubdate>
            <volume>52</volume>
            <issue>5</issue>
            <fpage>399</fpage>
            <lpage>451</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1550-7408.2005.00053.x</pubid>
                  <pubid idtype="pmpid">16248873</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Mitochondrial remnant organelles of <it>Giardia</it> function in iron-sulphur protein maturation</p>
            </title>
            <aug>
               <au>
                  <snm>Tovar</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Le&#243;n-Avila</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>S&#225;nchez</snm>
                  <fnm>LB</fnm>
               </au>
               <au>
                  <snm>Sutak</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Tachezy</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>van der Giezen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hern&#225;ndez</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>M&#252;ller</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Lucocq</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2003</pubdate>
            <volume>426</volume>
            <issue>6963</issue>
            <fpage>172</fpage>
            <lpage>176</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature01945</pubid>
                  <pubid idtype="pmpid">14614504</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>A spliceosomal intron in <it>Giardia lamblia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Nixon</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Morrison</snm>
                  <fnm>HG</fnm>
               </au>
               <au>
                  <snm>McArthur</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Sogin</snm>
                  <fnm>ML</fnm>
               </au>
               <au>
                  <snm>Loftus</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Samuelson</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci U S A</source>
            <pubdate>2002</pubdate>
            <volume>99</volume>
            <issue>6</issue>
            <fpage>3701</fpage>
            <lpage>3705</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">122587</pubid>
                  <pubid idtype="pmpid">11854456</pubid>
                  <pubid idtype="doi">10.1073/pnas.042700299</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>An ancient spliceosomal intron in the ribosomal protein L7a gene (Rpl7a) of <it>Giardia lamblia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Russell</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Shutt</snm>
                  <fnm>TE</fnm>
               </au>
               <au>
                  <snm>Watkins</snm>
                  <fnm>RF</fnm>
               </au>
               <au>
                  <snm>Gray</snm>
                  <fnm>MW</fnm>
               </au>
            </aug>
            <source>BMC Evol Biol</source>
            <pubdate>2005</pubdate>
            <volume>5</volume>
            <issue>1</issue>
            <fpage>45</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1201135</pubid>
                  <pubid idtype="pmpid">16109161</pubid>
                  <pubid idtype="doi">10.1186/1471-2148-5-45</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Lateral gene transfer in eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Andersson</snm>
                  <fnm>JO</fnm>
               </au>
            </aug>
            <source>Cell Mol Life Sci</source>
            <pubdate>2005</pubdate>
            <volume>62</volume>
            <issue>11</issue>
            <fpage>1182</fpage>
            <lpage>1197</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/s00018-005-4539-z</pubid>
                  <pubid idtype="pmpid">15761667</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>The phylogenetic position of enteromonads: a challenge for the present models of diplomonad evolution</p>
            </title>
            <aug>
               <au>
                  <snm>Kolisko</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Cepicka</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Hampl</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Kulda</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Flegr</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Int J Syst Evol Microbiol</source>
            <pubdate>2005</pubdate>
            <volume>55</volume>
            <issue>Pt 4</issue>
            <fpage>1729</fpage>
            <lpage>1733</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1099/ijs.0.63542-0</pubid>
                  <pubid idtype="pmpid">16014510</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Retortamonad flagellates are closely related to diplomonads - implications for the history of mitochondrial function in eukaryote evolution</p>
            </title>
            <aug>
               <au>
                  <snm>Silberman</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Simpson</snm>
                  <fnm>AGB</fnm>
               </au>
               <au>
                  <snm>Kulda</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Cepicka</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Hampl</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Johnson</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Roger</snm>
                  <fnm>AJ</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2002</pubdate>
            <volume>19</volume>
            <issue>5</issue>
            <fpage>777</fpage>
            <lpage>786</lpage>
            <xrefbib>
               <pubid idtype="pmpid">11961110</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>A non-canonical genetic code in an early diverging eukaryotic lineage</p>
            </title>
            <aug>
               <au>
                  <snm>Keeling</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Doolittle</snm>
                  <fnm>WF</fnm>
               </au>
            </aug>
            <source>EMBO J</source>
            <pubdate>1996</pubdate>
            <volume>15</volume>
            <issue>9</issue>
            <fpage>2285</fpage>
            <lpage>2290</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">450153</pubid>
                  <pubid idtype="pmpid">8641293</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Widespread and ancient distribution of a noncanonical genetic code in diplomonads</p>
            </title>
            <aug>
               <au>
                  <snm>Keeling</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Doolittle</snm>
                  <fnm>WF</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>1997</pubdate>
            <volume>14</volume>
            <fpage>895</fpage>
            <lpage>901</lpage>
            <xrefbib>
               <pubid idtype="pmpid">9287422</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>Evidence for Golgi bodies in proposed &#8217;Golgi-lacking&#8217;  lineages</p>
            </title>
            <aug>
               <au>
                  <snm>Dacks</snm>
                  <fnm>JB</fnm>
               </au>
               <au>
                  <snm>Davis</snm>
                  <fnm>LAM</fnm>
               </au>
               <au>
                  <snm>Sj&#246;gren</snm>
                  <fnm>&#197;M</fnm>
               </au>
               <au>
                  <snm>Andersson</snm>
                  <fnm>JO</fnm>
               </au>
               <au>
                  <snm>Roger</snm>
                  <fnm>AJ</fnm>
               </au>
               <au>
                  <snm>Doolittle</snm>
                  <fnm>WF</fnm>
               </au>
            </aug>
            <source>Proc Biol Sci</source>
            <pubdate>2003</pubdate>
            <volume>270</volume>
            <issue>Suppl 2</issue>
            <fpage>S168</fpage>
            <lpage>171</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid">14667372</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Chaperonin 60 phylogeny provides further evidence for secondary loss of mitochondria among putative early-branching eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Horner</snm>
                  <fnm>DS</fnm>
               </au>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2001</pubdate>
            <volume>18</volume>
            <issue>10</issue>
            <fpage>1970</fpage>
            <lpage>1975</lpage>
            <xrefbib>
               <pubid idtype="pmpid">11557802</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Fructose-1,6-biphosphate aldolases in amitochondriate protists constitute a single protein subfamily with eubacterial relationships</p>
            </title>
            <aug>
               <au>
                  <snm>S&#225;nchez</snm>
                  <fnm>LB</fnm>
               </au>
               <au>
                  <snm>Horner</snm>
                  <fnm>DS</fnm>
               </au>
               <au>
                  <snm>Moore</snm>
                  <fnm>DV</fnm>
               </au>
               <au>
                  <snm>Henze</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>M&#252;ller</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>2002</pubdate>
            <volume>295</volume>
            <fpage>51</fpage>
            <lpage>59</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0378-1119(02)00804-1</pubid>
                  <pubid idtype="pmpid">12242011</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Phylogenetic analyses of diplomonad genes reveal frequent lateral gene transfers affecting eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Andersson</snm>
                  <fnm>JO</fnm>
               </au>
               <au>
                  <snm>Sj&#246;gren</snm>
                  <fnm>&#197;M</fnm>
               </au>
               <au>
                  <snm>Davis</snm>
                  <fnm>LAM</fnm>
               </au>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>Roger</snm>
                  <fnm>AJ</fnm>
               </au>
            </aug>
            <source>Curr Biol</source>
            <pubdate>2003</pubdate>
            <volume>13</volume>
            <issue>2</issue>
            <fpage>94</fpage>
            <lpage>104</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0960-9822(03)00003-4</pubid>
                  <pubid idtype="pmpid">12546782</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Evolution of glutamate dehydrogenase genes: evidence for lateral gene transfer within and between prokaryotes and eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Andersson</snm>
                  <fnm>JO</fnm>
               </au>
               <au>
                  <snm>Roger</snm>
                  <fnm>AJ</fnm>
               </au>
            </aug>
            <source>BMC Evol Biol</source>
            <pubdate>2003</pubdate>
            <volume>3</volume>
            <fpage>14</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">166173</pubid>
                  <pubid idtype="pmpid">12820901</pubid>
                  <pubid idtype="doi">10.1186/1471-2148-3-14</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Iron hydrogenases and the evolution of anaerobic eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Horner</snm>
                  <fnm>DS</fnm>
               </au>
               <au>
                  <snm>Foster</snm>
                  <fnm>PG</fnm>
               </au>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2000</pubdate>
            <volume>17</volume>
            <issue>11</issue>
            <fpage>1695</fpage>
            <lpage>1709</lpage>
            <xrefbib>
               <pubid idtype="pmpid">11070057</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>A single eubacterial origin of eukaryotic pyruvate: ferredoxin oxidoreductase genes: implications for the evolution of anaerobic eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Horner</snm>
                  <fnm>DS</fnm>
               </au>
               <au>
                  <snm>Hirt</snm>
                  <fnm>RP</fnm>
               </au>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>1999</pubdate>
            <volume>16</volume>
            <issue>9</issue>
            <fpage>1280</fpage>
            <lpage>1291</lpage>
            <xrefbib>
               <pubid idtype="pmpid">10486982</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p><it>Giardia lamblia</it>: haploid genome size determined by pulsed field gel electrophoresis is less than 12 Mb</p>
            </title>
            <aug>
               <au>
                  <snm>Fan</snm>
                  <fnm>JB</fnm>
               </au>
               <au>
                  <snm>Korman</snm>
                  <fnm>SH</fnm>
               </au>
               <au>
                  <snm>Cantor</snm>
                  <fnm>CR</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>CL</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1991</pubdate>
            <volume>19</volume>
            <issue>8</issue>
            <fpage>1905</fpage>
            <lpage>1908</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">328122</pubid>
                  <pubid idtype="pmpid">2030969</pubid>
                  <pubid idtype="doi">10.1093/nar/19.8.1905</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>The guanine and cytosine content of genomic DNA and bacterial evolution</p>
            </title>
            <aug>
               <au>
                  <snm>Muto</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Osawa</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci U S A</source>
            <pubdate>1987</pubdate>
            <volume>84</volume>
            <fpage>166</fpage>
            <lpage>169</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">304163</pubid>
                  <pubid idtype="pmpid">3467347</pubid>
                  <pubid idtype="doi">10.1073/pnas.84.1.166</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>Overlapping genes in parasitic protist <it>Giardia lamblia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Iwabe</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Miyata</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>2001</pubdate>
            <volume>280</volume>
            <issue>1-2</issue>
            <fpage>163</fpage>
            <lpage>167</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0378-1119(01)00767-3</pubid>
                  <pubid idtype="pmpid">11738829</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Rearranged subtelomeric rRNA genes in <it>Giardia duodenalis</it></p>
            </title>
            <aug>
               <au>
                  <snm>Upcroft</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Abedinia</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Upcroft</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Eukaryot Cell</source>
            <pubdate>2005</pubdate>
            <volume>4</volume>
            <issue>2</issue>
            <fpage>484</fpage>
            <lpage>486</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">549325</pubid>
                  <pubid idtype="pmpid">15701810</pubid>
                  <pubid idtype="doi">10.1128/EC.4.2.484-486.2005</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>Developmental gene regulation in <it>Giardia lamblia</it>: first evidence for an encystation-specific promoter and differential 5' mRNA processing</p>
            </title>
            <aug>
               <au>
                  <snm>Knodler</snm>
                  <fnm>LA</fnm>
               </au>
               <au>
                  <snm>Sv&#228;rd</snm>
                  <fnm>SG</fnm>
               </au>
               <au>
                  <snm>Silberman</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Davids</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Gillin</snm>
                  <fnm>FD</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>1999</pubdate>
            <volume>34</volume>
            <issue>2</issue>
            <fpage>327</fpage>
            <lpage>340</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1046/j.1365-2958.1999.01602.x</pubid>
                  <pubid idtype="pmpid">10564476</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>Initiator and upstream elements in the &#945;2-tubulin promoter of <it>Giardia lamblia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Elmendorf</snm>
                  <fnm>HG</fnm>
               </au>
               <au>
                  <snm>Singer</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Pierce</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Cowan</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Nash</snm>
                  <fnm>TE</fnm>
               </au>
            </aug>
            <source>Mol Biochem Parasitol</source>
            <pubdate>2001</pubdate>
            <volume>113</volume>
            <issue>1</issue>
            <fpage>157</fpage>
            <lpage>169</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0166-6851(01)00211-0</pubid>
                  <pubid idtype="pmpid">11254964</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B40">
            <title>
               <p>Translational control by the 3'-UTR: the ends specify the means</p>
            </title>
            <aug>
               <au>
                  <snm>Mazumder</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Seshadri</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Fox</snm>
                  <fnm>PL</fnm>
               </au>
            </aug>
            <source>Trends Biochem Sci</source>
            <pubdate>2003</pubdate>
            <volume>28</volume>
            <issue>2</issue>
            <fpage>91</fpage>
            <lpage>98</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0968-0004(03)00002-1</pubid>
                  <pubid idtype="pmpid">12575997</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>Developmentally regulated transcripts and evidence of differential mRNA processing in <it>Giardia lamblia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Que</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Sv&#228;rd</snm>
                  <fnm>SG</fnm>
               </au>
               <au>
                  <snm>Meng</snm>
                  <fnm>TC</fnm>
               </au>
               <au>
                  <snm>Hetsko</snm>
                  <fnm>ML</fnm>
               </au>
               <au>
                  <snm>Aley</snm>
                  <fnm>SB</fnm>
               </au>
               <au>
                  <snm>Gillin</snm>
                  <fnm>FD</fnm>
               </au>
            </aug>
            <source>Mol Biochem Parasitol</source>
            <pubdate>1996</pubdate>
            <volume>81</volume>
            <issue>1</issue>
            <fpage>101</fpage>
            <lpage>110</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0166-6851(96)02698-9</pubid>
                  <pubid idtype="pmpid">8892309</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B42">
            <title>
               <p>Eukaryotic mRNA 3' processing: a common means to different ends</p>
            </title>
            <aug>
               <au>
                  <snm>Gilmartin</snm>
                  <fnm>GM</fnm>
               </au>
            </aug>
            <source>Genes Dev</source>
            <pubdate>2005</pubdate>
            <volume>19</volume>
            <issue>21</issue>
            <fpage>2517</fpage>
            <lpage>2521</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1101/gad.1378105</pubid>
                  <pubid idtype="pmpid">16264187</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B43">
            <title>
               <p>The abundance of sterile transcripts in <it>Giardia lamblia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Elmendorf</snm>
                  <fnm>HG</fnm>
               </au>
               <au>
                  <snm>Singer</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Nash</snm>
                  <fnm>TE</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2001</pubdate>
            <volume>29</volume>
            <issue>22</issue>
            <fpage>4674</fpage>
            <lpage>4683</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">92544</pubid>
                  <pubid idtype="pmpid">11713317</pubid>
                  <pubid idtype="doi">10.1093/nar/29.22.4674</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B44">
            <title>
               <p>Eukaryotic evolution: early origin of canonical introns</p>
            </title>
            <aug>
               <au>
                  <snm>Simpson</snm>
                  <fnm>AGB</fnm>
               </au>
               <au>
                  <snm>MacQuarrie</snm>
                  <fnm>EK</fnm>
               </au>
               <au>
                  <snm>Roger</snm>
                  <fnm>AJ</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2002</pubdate>
            <volume>419</volume>
            <issue>6904</issue>
            <fpage>270</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/419270a</pubid>
                  <pubid idtype="pmpid">12239559</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>The biology of intron gain and loss</p>
            </title>
            <aug>
               <au>
                  <snm>Jeffares</snm>
                  <fnm>DC</fnm>
               </au>
               <au>
                  <snm>Mourier</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Penny</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2005</pubdate>
            <xrefbib>
               <pubid idtype="pmpid">16290250</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B46">
            <title>
               <p>Complex spliceosomal organization ancestral to extant eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Collins</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Penny</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2005</pubdate>
            <volume>22</volume>
            <issue>4</issue>
            <fpage>1053</fpage>
            <lpage>1066</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msi091</pubid>
                  <pubid idtype="pmpid">15659557</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B47">
            <title>
               <p>How selenium has altered our understanding of the genetic code</p>
            </title>
            <aug>
               <au>
                  <snm>Hatfield</snm>
                  <fnm>DL</fnm>
               </au>
               <au>
                  <snm>Gladyshev</snm>
                  <fnm>VN</fnm>
               </au>
            </aug>
            <source>Mol Cell Biol</source>
            <pubdate>2002</pubdate>
            <volume>22</volume>
            <issue>11</issue>
            <fpage>3565</fpage>
            <lpage>3576</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">133838</pubid>
                  <pubid idtype="pmpid">11997494</pubid>
                  <pubid idtype="doi">10.1128/MCB.22.11.3565-3576.2002</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B48">
            <title>
               <p>A selenocysteine tRNA and SECIS element in <it>Plasmodium falciparum</it></p>
            </title>
            <aug>
               <au>
                  <snm>Mourier</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Pain</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Barrell</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Griffiths-Jones</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>RNA</source>
            <pubdate>2005</pubdate>
            <volume>11</volume>
            <issue>2</issue>
            <fpage>119</fpage>
            <lpage>122</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1370700</pubid>
                  <pubid idtype="pmpid">15659354</pubid>
                  <pubid idtype="doi">10.1261/rna.7185605</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B49">
            <title>
               <p>Selenocysteine tRNA identification in the model organisms <it>Dictyostelium discoideum</it> and <it>Tetrahymena thermophila</it></p>
            </title>
            <aug>
               <au>
                  <snm>Shrimali</snm>
                  <fnm>RK</fnm>
               </au>
               <au>
                  <snm>Lobanov</snm>
                  <fnm>AV</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>XM</fnm>
               </au>
               <au>
                  <snm>Rao</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Carlson</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Mahadeo</snm>
                  <fnm>DC</fnm>
               </au>
               <au>
                  <snm>Parent</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Gladyshev</snm>
                  <fnm>VN</fnm>
               </au>
               <au>
                  <snm>Hatfield</snm>
                  <fnm>DL</fnm>
               </au>
            </aug>
            <source>Biochem Biophys Res Commun</source>
            <pubdate>2005</pubdate>
            <volume>329</volume>
            <issue>1</issue>
            <fpage>147</fpage>
            <lpage>151</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.bbrc.2005.01.120</pubid>
                  <pubid idtype="pmpid">15721286</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B50">
            <title>
               <p>Identification of a very large Rab GTPase family in the parasitic protozoan <it>Trichomonas vaginalis</it></p>
            </title>
            <aug>
               <au>
                  <snm>Lal</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Field</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Carlton</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Warwicker</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Hirt</snm>
                  <fnm>RP</fnm>
               </au>
            </aug>
            <source>Mol Biochem Parasitol</source>
            <pubdate>2005</pubdate>
            <volume>143</volume>
            <issue>2</issue>
            <fpage>226</fpage>
            <lpage>235</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.molbiopara.2005.06.008</pubid>
                  <pubid idtype="pmpid">16099517</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B51">
            <title>
               <p>The genome of the protist parasite <it>Entamoeba histolytica</it></p>
            </title>
            <aug>
               <au>
                  <snm>Loftus</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Anderson</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Davies</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Alsmark</snm>
                  <fnm>UCM</fnm>
               </au>
               <au>
                  <snm>Samuelson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Amedeo</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Roncaglia</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Berriman</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hirt</snm>
                  <fnm>RP</fnm>
               </au>
               <au>
                  <snm>Mann</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Nozaki</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Suh</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Pop</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Duchene</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Ackers</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Tannich</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Leippe</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hofer</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Bruchhaus</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Willhoeft</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Bhattacharya</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Chillingworth</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Churcher</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Hance</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Harris</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Harris</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Jagels</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Moule</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Mungall</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Ormond</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Squares</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Whitehead</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Quail</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Rabbinowitsch</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Norbertczak</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Price</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Guillen</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Gilchrist</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Stroup</snm>
                  <fnm>SE</fnm>
               </au>
               <au>
                  <snm>Bhattacharya</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lohia</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Foster</snm>
                  <fnm>PG</fnm>
               </au>
               <au>
                  <snm>Sicheritz-Ponten</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Weber</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Singh</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Mukherjee</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>El-Sayed</snm>
                  <fnm>NM</fnm>
               </au>
               <au>
                  <snm>Petri</snm>
                  <fnm>WA</fnm>
                  <suf>Jr.</suf>
               </au>
               <au>
                  <snm>Clark</snm>
                  <fnm>CG</fnm>
               </au>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>Barrell</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Fraser</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>Hall</snm>
                  <fnm>N</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2005</pubdate>
            <volume>433</volume>
            <issue>7028</issue>
            <fpage>865</fpage>
            <lpage>868</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature03291</pubid>
                  <pubid idtype="pmpid">15729342</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B52">
            <title>
               <p>Protein import, replication, and inheritance of a vestigial mitochondrion</p>
            </title>
            <aug>
               <au>
                  <snm>Regoes</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Zourmpanou</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Leon-Avila</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>van der Giezen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Tovar</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Hehl</snm>
                  <fnm>AB</fnm>
               </au>
            </aug>
            <source>J Biol Chem</source>
            <pubdate>2005</pubdate>
            <volume>280</volume>
            <issue>34</issue>
            <fpage>30557</fpage>
            <lpage>30563</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1074/jbc.M500787200</pubid>
                  <pubid idtype="pmpid">15985435</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B53">
            <title>
               <p><it>Giardia</it> mitosomes and trichomonad hydrogenosomes share a common mode of protein targeting</p>
            </title>
            <aug>
               <au>
                  <snm>Dolezal</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Smid</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Rada</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Zubacova</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Bursac</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Sutak</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Nebesarova</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lithgow</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Tachezy</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci U S A</source>
            <pubdate>2005</pubdate>
            <volume>102</volume>
            <issue>31</issue>
            <fpage>10924</fpage>
            <lpage>10929</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1182405</pubid>
                  <pubid idtype="pmpid">16040811</pubid>
                  <pubid idtype="doi">10.1073/pnas.0500349102</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B54">
            <title>
               <p>Iron-sulfur-protein biogenesis in eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Lill</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Muhlenhoff</snm>
                  <fnm>U</fnm>
               </au>
            </aug>
            <source>Trends Biochem Sci</source>
            <pubdate>2005</pubdate>
            <volume>30</volume>
            <issue>3</issue>
            <fpage>133</fpage>
            <lpage>141</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tibs.2005.01.006</pubid>
                  <pubid idtype="pmpid">15752985</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B55">
            <title>
               <p>Comparative genomics of trypanosomatid parasitic protozoa</p>
            </title>
            <aug>
               <au>
                  <snm>El-Sayed</snm>
                  <fnm>NM</fnm>
               </au>
               <au>
                  <snm>Myler</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Blandin</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Berriman</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Crabtree</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Aggarwal</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Caler</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Renauld</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Worthey</snm>
                  <fnm>EA</fnm>
               </au>
               <au>
                  <snm>Hertz-Fowler</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Ghedin</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Peacock</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Bartholomeu</snm>
                  <fnm>DC</fnm>
               </au>
               <au>
                  <snm>Haas</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Tran</snm>
                  <fnm>AN</fnm>
               </au>
               <au>
                  <snm>Wortman</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Alsmark</snm>
                  <fnm>UC</fnm>
               </au>
               <au>
                  <snm>Angiuoli</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Anupama</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Badger</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Bringaud</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Cadag</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Carlton</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Cerqueira</snm>
                  <fnm>GC</fnm>
               </au>
               <au>
                  <snm>Creasy</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Delcher</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Djikeng</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>Hauser</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Ivens</snm>
                  <fnm>AC</fnm>
               </au>
               <au>
                  <snm>Kummerfeld</snm>
                  <fnm>SK</fnm>
               </au>
               <au>
                  <snm>Pereira-Leal</snm>
                  <fnm>JB</fnm>
               </au>
               <au>
                  <snm>Nilsson</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Peterson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Shallom</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Silva</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Sundaram</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Westenberger</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Melville</snm>
                  <fnm>SE</fnm>
               </au>
               <au>
                  <snm>Donelson</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Andersson</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Stuart</snm>
                  <fnm>KD</fnm>
               </au>
               <au>
                  <snm>Hall</snm>
                  <fnm>N</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2005</pubdate>
            <volume>309</volume>
            <issue>5733</issue>
            <fpage>404</fpage>
            <lpage>409</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1112181</pubid>
                  <pubid idtype="pmpid">16020724</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B56">
            <title>
               <p>Genome sequence and gene compaction of the eukaryote parasite <it>Encephalitozoon cuniculi</it></p>
            </title>
            <aug>
               <au>
                  <snm>Katinka</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Duprat</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Cornillot</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Metenier</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Thomarat</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Prensier</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Barbe</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Peyretaillade</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Brottier</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Wincker</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Delbac</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>El Alaoui</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Peyret</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Saurin</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Gouy</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Weissenbach</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Vivares</snm>
                  <fnm>CP</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2001</pubdate>
            <volume>414</volume>
            <issue>6862</issue>
            <fpage>450</fpage>
            <lpage>453</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/35106579</pubid>
                  <pubid idtype="pmpid">11719806</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B57">
            <title>
               <p>The dynamin superfamily: universal membrane tubulation and fission molecules?</p>
            </title>
            <aug>
               <au>
                  <snm>Praefcke</snm>
                  <fnm>GJ</fnm>
               </au>
               <au>
                  <snm>McMahon</snm>
                  <fnm>HT</fnm>
               </au>
            </aug>
            <source>Nat Rev Mol Cell Biol</source>
            <pubdate>2004</pubdate>
            <volume>5</volume>
            <issue>2</issue>
            <fpage>133</fpage>
            <lpage>147</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nrm1313</pubid>
                  <pubid idtype="pmpid">15040446</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B58">
            <title>
               <p>The single dynamin-like protein of <it>Trypanosoma brucei</it> regulates mitochondrial division and is not required for endocytosis</p>
            </title>
            <aug>
               <au>
                  <snm>Morgan</snm>
                  <fnm>GW</fnm>
               </au>
               <au>
                  <snm>Goulding</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Field</snm>
                  <fnm>MC</fnm>
               </au>
            </aug>
            <source>J Biol Chem</source>
            <pubdate>2004</pubdate>
            <volume>279</volume>
            <issue>11</issue>
            <fpage>10692</fpage>
            <lpage>10701</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1074/jbc.M312178200</pubid>
                  <pubid idtype="pmpid">14670954</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B59">
            <title>
               <p>Surface antigenic variation in <it>Giardia lamblia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Nash</snm>
                  <fnm>TE</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>2002</pubdate>
            <volume>45</volume>
            <issue>3</issue>
            <fpage>585</fpage>
            <lpage>590</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1046/j.1365-2958.2002.03029.x</pubid>
                  <pubid idtype="pmpid">12139606</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B60">
            <title>
               <p>Sequence survey of the <it>Giardia lamblia</it> genome</p>
            </title>
            <aug>
               <au>
                  <snm>Smith</snm>
                  <fnm>MW</fnm>
               </au>
               <au>
                  <snm>Aley</snm>
                  <fnm>SB</fnm>
               </au>
               <au>
                  <snm>Sogin</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Gillin</snm>
                  <fnm>FD</fnm>
               </au>
               <au>
                  <snm>Evans</snm>
                  <fnm>GA</fnm>
               </au>
            </aug>
            <source>Mol Biochem Parasitol</source>
            <pubdate>1998</pubdate>
            <volume>95</volume>
            <fpage>267</fpage>
            <lpage>280</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0166-6851(98)00113-3</pubid>
                  <pubid idtype="pmpid">9803418</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B61">
            <title>
               <p>Macronuclear genome sequence of the ciliate <it>Tetrahymena thermophila</it>, a model eukaryote</p>
            </title>
            <aug>
               <au>
                  <snm>Eisen</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Coyne</snm>
                  <fnm>RS</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Thiagarajan</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Wortman</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Badger</snm>
                  <fnm>JH</fnm>
               </au>
               <au>
                  <snm>Ren</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Amedeo</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Tallon</snm>
                  <fnm>LJ</fnm>
               </au>
               <au>
                  <snm>Delcher</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Silva</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Haas</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Majoros</snm>
                  <fnm>WH</fnm>
               </au>
               <au>
                  <snm>Farzad</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Carlton</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>RK</fnm>
               </au>
               <au>
                  <snm>Garg</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Pearlman</snm>
                  <fnm>RE</fnm>
               </au>
               <au>
                  <snm>Karrer</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Sun</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Manning</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Elde</snm>
                  <fnm>NC</fnm>
               </au>
               <au>
                  <snm>Turkewitz</snm>
                  <fnm>AP</fnm>
               </au>
               <au>
                  <snm>Asai</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Wilkes</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Cai</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Collins</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Stewart</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>SR</fnm>
               </au>
               <au>
                  <snm>Wilamowska</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Weinberg</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Ruzzo</snm>
                  <fnm>WL</fnm>
               </au>
               <au>
                  <snm>Wloga</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Gaertig</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Frankel</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Tsao</snm>
                  <fnm>CC</fnm>
               </au>
               <au>
                  <snm>Gorovsky</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Keeling</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Waller</snm>
                  <fnm>RF</fnm>
               </au>
               <au>
                  <snm>Patron</snm>
                  <fnm>NJ</fnm>
               </au>
               <au>
                  <snm>Cherry</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Stover</snm>
                  <fnm>NA</fnm>
               </au>
               <au>
                  <snm>Krieger</snm>
                  <fnm>CJ</fnm>
               </au>
               <au>
                  <snm>Del Toro</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Ryder</snm>
                  <fnm>HF</fnm>
               </au>
               <au>
                  <snm>Williamson</snm>
                  <fnm>SC</fnm>
               </au>
               <au>
                  <snm>Barbeau</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Hamilton</snm>
                  <fnm>EP</fnm>
               </au>
               <au>
                  <snm>Orias</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>PLoS Biol</source>
            <pubdate>2006</pubdate>
            <volume>4</volume>
            <issue>9</issue>
            <fpage>e286</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1557398</pubid>
                  <pubid idtype="pmpid">16933976</pubid>
                  <pubid idtype="doi">10.1371/journal.pbio.0040286</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B62">
            <title>
               <p><it>Giardia</it> immunity - an update</p>
            </title>
            <aug>
               <au>
                  <snm>Roxstr&#246;m-Lindquist</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Palm</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Reiner</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Ringqvist</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Sv&#228;rd</snm>
                  <fnm>SG</fnm>
               </au>
            </aug>
            <source>Trends Parasitol</source>
            <pubdate>2006</pubdate>
            <volume>22</volume>
            <issue>1</issue>
            <fpage>26</fpage>
            <lpage>31</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.pt.2005.11.005</pubid>
                  <pubid idtype="pmpid">16303332</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B63">
            <title>
               <p><it>Spironucleus vortens</it>, a possible cause of hole-in-the-head disease in cichlids</p>
            </title>
            <aug>
               <au>
                  <snm>Paull</snm>
                  <fnm>GC</fnm>
               </au>
               <au>
                  <snm>Matthews</snm>
                  <fnm>RA</fnm>
               </au>
            </aug>
            <source>Dis Aquat Organ</source>
            <pubdate>2001</pubdate>
            <volume>45</volume>
            <issue>3</issue>
            <fpage>197</fpage>
            <lpage>202</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid">11558728</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B64">
            <title>
               <p><it>Trichomonas vaginalis</it> degrades nitric oxide and expresses a flavorubredoxin-like protein: a new pathogenic mechanism?</p>
            </title>
            <aug>
               <au>
                  <snm>Sarti</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Fiori</snm>
                  <fnm>PL</fnm>
               </au>
               <au>
                  <snm>Forte</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Rappelli</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Teixeira</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Mastronicola</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Sanciu</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Giuffre</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Brunori</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Cell Mol Life Sci</source>
            <pubdate>2004</pubdate>
            <volume>61</volume>
            <issue>5</issue>
            <fpage>618</fpage>
            <lpage>623</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/s00018-003-3413-8</pubid>
                  <pubid idtype="pmpid">15004700</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B65">
            <title>
               <p>Role of rubrerythrin in the oxidative stress response of <it>Porphyromonas gingivalis</it></p>
            </title>
            <aug>
               <au>
                  <snm>Sztukowska</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Bugno</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Potempa</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Travis</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kurtz</snm>
                  <fnm>DM</fnm>
                  <suf>Jr.</suf>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>2002</pubdate>
            <volume>44</volume>
            <issue>2</issue>
            <fpage>479</fpage>
            <lpage>488</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1046/j.1365-2958.2002.02892.x</pubid>
                  <pubid idtype="pmpid">11972784</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B66">
            <title>
               <p>A comparison of <it>Giardia microti</it> and <it>Spironucleus muris</it> cysts in the vole: an immunocytochemical, light, and electron microscopic study</p>
            </title>
            <aug>
               <au>
                  <snm>Januschka</snm>
                  <fnm>MM</fnm>
               </au>
               <au>
                  <snm>Erlandsen</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Bemrick</snm>
                  <fnm>WJ</fnm>
               </au>
               <au>
                  <snm>Schupp</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Feely</snm>
                  <fnm>DE</fnm>
               </au>
            </aug>
            <source>J Parasitol</source>
            <pubdate>1988</pubdate>
            <volume>74</volume>
            <issue>3</issue>
            <fpage>452</fpage>
            <lpage>458</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.2307/3282055</pubid>
                  <pubid idtype="pmpid">3288741</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B67">
            <title>
               <p>Intracellular infection with <it>Spironucleus barkhanus</it> (Diplomonadida, Hexamitidae) in farmed Arctic char <it>Salvelinus alpinus</it></p>
            </title>
            <aug>
               <au>
                  <snm>Sterud</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Poppe</snm>
                  <fnm>TT</fnm>
               </au>
               <au>
                  <snm>Born&#248;</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Dis Aquat Organ</source>
            <pubdate>2003</pubdate>
            <volume>56</volume>
            <issue>2</issue>
            <fpage>155</fpage>
            <lpage>161</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid">14598991</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B68">
            <title>
               <p>Antisense inhibition of <it>Entamoeba histolytica</it> cysteine proteases inhibits colonic mucus degradation</p>
            </title>
            <aug>
               <au>
                  <snm>Moncada</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Keller</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Ankri</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Mirelman</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Chadee</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>Gastroenterology</source>
            <pubdate>2006</pubdate>
            <volume>130</volume>
            <issue>3</issue>
            <fpage>721</fpage>
            <lpage>730</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1053/j.gastro.2005.11.012</pubid>
                  <pubid idtype="pmpid">16530514</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B69">
            <title>
               <p><it>Giardia duodenalis</it>: analysis of secreted proteases upon trophozoite-epithelial cell interaction in vitro</p>
            </title>
            <aug>
               <au>
                  <snm>Rodr&#237;guez-Fuentes</snm>
                  <fnm>GB</fnm>
               </au>
               <au>
                  <snm>Cedillo-Rivera</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Fonseca-Li&#241;&#225;n</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Arg&#252;ello-Garc&#237;a</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Mu&#241;oz</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Ortega-Pierres</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Y&#233;pez-Mulia</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>Mem Inst Oswaldo Cruz</source>
            <pubdate>2006</pubdate>
            <volume>101</volume>
            <issue>6</issue>
            <fpage>693</fpage>
            <lpage>696</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1590/S0074-02762006000600020</pubid>
                  <pubid idtype="pmpid">17072486</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B70">
            <title>
               <p>A primitive enzyme for a primitive cell: the protease required for excystation of <it>Giardia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Ward</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Alvarado</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Rawlings</snm>
                  <fnm>ND</fnm>
               </au>
               <au>
                  <snm>Engel</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Franklin</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>McKerrow</snm>
                  <fnm>JH</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>1997</pubdate>
            <volume>89</volume>
            <issue>3</issue>
            <fpage>437</fpage>
            <lpage>444</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0092-8674(00)80224-X</pubid>
                  <pubid idtype="pmpid">9150143</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B71">
            <title>
               <p>The activity of a developmentally regulated cysteine proteinase is required for cyst wall formation in the primitive eukaryote <it>Giardia lamblia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Touz</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Nores</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Slavin</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Carmona</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Conrad</snm>
                  <fnm>JT</fnm>
               </au>
               <au>
                  <snm>Mowatt</snm>
                  <fnm>MR</fnm>
               </au>
               <au>
                  <snm>Nash</snm>
                  <fnm>TE</fnm>
               </au>
               <au>
                  <snm>Coronel</snm>
                  <fnm>CE</fnm>
               </au>
               <au>
                  <snm>Lujan</snm>
                  <fnm>HD</fnm>
               </au>
            </aug>
            <source>J Biol Chem</source>
            <pubdate>2002</pubdate>
            <volume>277</volume>
            <issue>10</issue>
            <fpage>8474</fpage>
            <lpage>8481</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1074/jbc.M110250200</pubid>
                  <pubid idtype="pmpid">11773053</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B72">
            <title>
               <p>Codon usage between genomes is constrained by genome-wide mutational processes</p>
            </title>
            <aug>
               <au>
                  <snm>Chen</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Hottes</snm>
                  <fnm>AK</fnm>
               </au>
               <au>
                  <snm>Shapiro</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>McAdams</snm>
                  <fnm>HH</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci U S A</source>
            <pubdate>2004</pubdate>
            <volume>101</volume>
            <issue>10</issue>
            <fpage>3480</fpage>
            <lpage>3485</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">373487</pubid>
                  <pubid idtype="pmpid">14990797</pubid>
                  <pubid idtype="doi">10.1073/pnas.0307827100</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B73">
            <title>
               <p>A simple model based on mutation and selection explains trends in codon and amino-acid usage and GC composition within and across genomes</p>
            </title>
            <aug>
               <au>
                  <snm>Knight</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Freeland</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Landweber</snm>
                  <fnm>LF</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2001</pubdate>
            <volume>2</volume>
            <issue>4</issue>
            <fpage>RESEARCH0010</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1186/gb-2001-2-4-research0010</pubid>
                  <pubid idtype="pmpid">11305938</pubid>
                  <pubid idtype="pmcid">31479</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B74">
            <title>
               <p>Synonymous codon usage variation among <it>Giardia lamblia</it> genes and isolates</p>
            </title>
            <aug>
               <au>
                  <snm>Lafay</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Sharp</snm>
                  <fnm>PM</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>1999</pubdate>
            <volume>16</volume>
            <issue>11</issue>
            <fpage>1484</fpage>
            <lpage>1495</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid">10555279</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B75">
            <title>
               <p>Accounting for background nucleotide composition when measuring codon usage bias</p>
            </title>
            <aug>
               <au>
                  <snm>Novembre</snm>
                  <fnm>JA</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2002</pubdate>
            <volume>19</volume>
            <issue>8</issue>
            <fpage>1390</fpage>
            <lpage>1394</lpage>
            <xrefbib>
               <pubid idtype="pmpid">12140252</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B76">
            <title>
               <p>Comparative genomics of <it>Dictyostelium discoideum</it> and <it>Entamoeba histolytica</it></p>
            </title>
            <aug>
               <au>
                  <snm>Eichinger</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Noegel</snm>
                  <fnm>AA</fnm>
               </au>
            </aug>
            <source>Curr Opin Microbiol</source>
            <pubdate>2005</pubdate>
            <volume>8</volume>
            <fpage>606</fpage>
            <lpage>611</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.mib.2005.08.009</pubid>
                  <pubid idtype="pmpid">16125444</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B77">
            <title>
               <p>Genome sequence of the human malaria parasite <it>Plasmodium falciparum</it></p>
            </title>
            <aug>
               <au>
                  <snm>Gardner</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Hall</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Fung</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Berriman</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hyman</snm>
                  <fnm>RW</fnm>
               </au>
               <au>
                  <snm>Carlton</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Pain</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Nelson</snm>
                  <fnm>KE</fnm>
               </au>
               <au>
                  <snm>Bowman</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Paulsen</snm>
                  <fnm>IT</fnm>
               </au>
               <au>
                  <snm>James</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Eisen</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Rutherford</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Craig</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Kyes</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Chan</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Nene</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Shallom</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Suh</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Peterson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Angiuoli</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Pertea</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Allen</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Selengut</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Haft</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Mather</snm>
                  <fnm>MW</fnm>
               </au>
               <au>
                  <snm>Vaidya</snm>
                  <fnm>AB</fnm>
               </au>
               <au>
                  <snm>Martin</snm>
                  <fnm>DM</fnm>
               </au>
               <au>
                  <snm>Fairlamb</snm>
                  <fnm>AH</fnm>
               </au>
               <au>
                  <snm>Fraunholz</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Roos</snm>
                  <fnm>DS</fnm>
               </au>
               <au>
                  <snm>Ralph</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>McFadden</snm>
                  <fnm>GI</fnm>
               </au>
               <au>
                  <snm>Cummings</snm>
                  <fnm>LM</fnm>
               </au>
               <au>
                  <snm>Subramanian</snm>
                  <fnm>GM</fnm>
               </au>
               <au>
                  <snm>Mungall</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Venter</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Carucci</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Hoffman</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Newbold</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Davis</snm>
                  <fnm>RW</fnm>
               </au>
               <au>
                  <snm>Fraser</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>Barrell</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2002</pubdate>
            <volume>419</volume>
            <issue>6906</issue>
            <fpage>498</fpage>
            <lpage>511</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature01097</pubid>
                  <pubid idtype="pmpid">12368864</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B78">
            <title>
               <p>G+C content variation along and among <it>Saccharomyces cerevisiae</it> chromosomes</p>
            </title>
            <aug>
               <au>
                  <snm>Bradnam</snm>
                  <fnm>KR</fnm>
               </au>
               <au>
                  <snm>Seoighe</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Sharp</snm>
                  <fnm>PM</fnm>
               </au>
               <au>
                  <snm>Wolfe</snm>
                  <fnm>KH</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>1999</pubdate>
            <volume>16</volume>
            <issue>5</issue>
            <fpage>666</fpage>
            <lpage>675</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid">10335660</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B79">
            <title>
               <p>The human genome: organization and evolutionary history</p>
            </title>
            <aug>
               <au>
                  <snm>Bernardi</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Annu Rev Genet</source>
            <pubdate>1995</pubdate>
            <volume>29</volume>
            <fpage>445</fpage>
            <lpage>476</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1146/annurev.ge.29.120195.002305</pubid>
                  <pubid idtype="pmpid">8825483</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B80">
            <title>
               <p>Evolution of four gene families with patchy phylogenetic distribution: influx of genes into protist genomes</p>
            </title>
            <aug>
               <au>
                  <snm>Andersson</snm>
                  <fnm>JO</fnm>
               </au>
               <au>
                  <snm>Hirt</snm>
                  <fnm>RP</fnm>
               </au>
               <au>
                  <snm>Foster</snm>
                  <fnm>PG</fnm>
               </au>
               <au>
                  <snm>Roger</snm>
                  <fnm>AJ</fnm>
               </au>
            </aug>
            <source>BMC Evol Biol</source>
            <pubdate>2006</pubdate>
            <volume>6</volume>
            <fpage>27</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1484493</pubid>
                  <pubid idtype="pmpid">16551352</pubid>
                  <pubid idtype="doi">10.1186/1471-2148-6-27</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B81">
            <title>
               <p>Iron-dependent hydrogenases of <it>Entamoeba histolytica</it> and <it>Giardia lamblia</it>: activity of the recombinant entamoebic enzyme and evidence for lateral gene transfer</p>
            </title>
            <aug>
               <au>
                  <snm>Nixon</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Field</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>McArthur</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Sogin</snm>
                  <fnm>ML</fnm>
               </au>
               <au>
                  <snm>Yarlett</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Loftus</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Samuelson</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Biol Bull</source>
            <pubdate>2003</pubdate>
            <volume>204</volume>
            <issue>1</issue>
            <fpage>1</fpage>
            <lpage>9</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.2307/1543490</pubid>
                  <pubid idtype="pmpid">12588739</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B82">
            <title>
               <p>Evidence for lateral transfer of genes encoding ferredoxins, nitroreductases, NADH oxidase, and alcohol dehydrogenase 3 from anaerobic prokaryotes to <it>Giardia lamblia</it> and <it>Entamoeba histolytica</it></p>
            </title>
            <aug>
               <au>
                  <snm>Nixon</snm>
                  <fnm>JEJ</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Field</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Morrison</snm>
                  <fnm>HG</fnm>
               </au>
               <au>
                  <snm>McArthur</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Sogin</snm>
                  <fnm>ML</fnm>
               </au>
               <au>
                  <snm>Loftus</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Samuelson</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Eukaryot Cell</source>
            <pubdate>2002</pubdate>
            <volume>1</volume>
            <issue>2</issue>
            <fpage>181</fpage>
            <lpage>190</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">118039</pubid>
                  <pubid idtype="pmpid">12455953</pubid>
                  <pubid idtype="doi">10.1128/EC.1.2.181-190.2002</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B83">
            <title>
               <p>PhyloGenie: automated phylome generation and analysis</p>
            </title>
            <aug>
               <au>
                  <snm>Frickey</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Lupas</snm>
                  <fnm>AN</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2004</pubdate>
            <volume>32</volume>
            <issue>17</issue>
            <fpage>5231</fpage>
            <lpage>5238</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">521674</pubid>
                  <pubid idtype="pmpid">15459293</pubid>
                  <pubid idtype="doi">10.1093/nar/gkh867</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B84">
            <title>
               <p>Rewiring the keyboard: evolvability of the genetic code</p>
            </title>
            <aug>
               <au>
                  <snm>Knight</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Freeland</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Landweber</snm>
                  <fnm>LF</fnm>
               </au>
            </aug>
            <source>Nat Rev Genet</source>
            <pubdate>2001</pubdate>
            <volume>2</volume>
            <issue>1</issue>
            <fpage>49</fpage>
            <lpage>58</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/35047500</pubid>
                  <pubid idtype="pmpid">11253070</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B85">
            <title>
               <p>Much ado about bacteria-to-vertebrate lateral gene transfer</p>
            </title>
            <aug>
               <au>
                  <snm>Genereux</snm>
                  <fnm>DP</fnm>
               </au>
               <au>
                  <snm>Logsdon</snm>
                  <fnm>JM</fnm>
                  <suf>Jr.</suf>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2003</pubdate>
            <volume>19</volume>
            <issue>4</issue>
            <fpage>191</fpage>
            <lpage>195</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0168-9525(03)00055-6</pubid>
                  <pubid idtype="pmpid">12683971</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B86">
            <title>
               <p>Non-mitochondrial complex I proteins in a hydrogenosomal oxidoreductase complex</p>
            </title>
            <aug>
               <au>
                  <snm>Dyall</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Yan</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Delgadillo-Correa</snm>
                  <fnm>MG</fnm>
               </au>
               <au>
                  <snm>Lunceford</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Loo</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Clarke</snm>
                  <fnm>CF</fnm>
               </au>
               <au>
                  <snm>Johnson</snm>
                  <fnm>PJ</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2004</pubdate>
            <volume>431</volume>
            <issue>7012</issue>
            <fpage>1103</fpage>
            <lpage>1107</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature02990</pubid>
                  <pubid idtype="pmpid">15510149</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B87">
            <title>
               <p><it>Trichomonas</it> hydrogenosomes contain the NADH dehydrogenase module of mitochondrial complex I</p>
            </title>
            <aug>
               <au>
                  <snm>Hrdy</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Hirt</snm>
                  <fnm>RP</fnm>
               </au>
               <au>
                  <snm>Dolezal</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Bardonova</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Foster</snm>
                  <fnm>PG</fnm>
               </au>
               <au>
                  <snm>Tachezy</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2004</pubdate>
            <volume>432</volume>
            <issue>7017</issue>
            <fpage>618</fpage>
            <lpage>622</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature03149</pubid>
                  <pubid idtype="pmpid">15577909</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B88">
            <title>
               <p>Horizontal gene transfer among genomes: the complexity hypothesis</p>
            </title>
            <aug>
               <au>
                  <snm>Jain</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Rivera</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Lake</snm>
                  <fnm>JA</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci U S A</source>
            <pubdate>1999</pubdate>
            <volume>96</volume>
            <fpage>3801</fpage>
            <lpage>3806</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">22375</pubid>
                  <pubid idtype="pmpid">10097118</pubid>
                  <pubid idtype="doi">10.1073/pnas.96.7.3801</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B89">
            <title>
               <p>Highways of gene sharing in prokaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Beiko</snm>
                  <fnm>RG</fnm>
               </au>
               <au>
                  <snm>Harlow</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Ragan</snm>
                  <fnm>MA</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci U S A</source>
            <pubdate>2005</pubdate>
            <volume>102</volume>
            <issue>40</issue>
            <fpage>14332</fpage>
            <lpage>14337</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1242295</pubid>
                  <pubid idtype="pmpid">16176988</pubid>
                  <pubid idtype="doi">10.1073/pnas.0504068102</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B90">
            <title>
               <p>Bacterial-like energy metabolism in the amitochondriate protozoon <it>Hexamita inflata</it></p>
            </title>
            <aug>
               <au>
                  <snm>Biagini</snm>
                  <fnm>GA</fnm>
               </au>
               <au>
                  <snm>Yarlett</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Ball</snm>
                  <fnm>GE</fnm>
               </au>
               <au>
                  <snm>Billetz</snm>
                  <fnm>AC</fnm>
               </au>
               <au>
                  <snm>Lindmark</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Martinez</snm>
                  <fnm>MP</fnm>
               </au>
               <au>
                  <snm>Lloyd</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Edwards</snm>
                  <fnm>MR</fnm>
               </au>
            </aug>
            <source>Mol Biochem Parasitol</source>
            <pubdate>2003</pubdate>
            <volume>128</volume>
            <issue>1</issue>
            <fpage>11</fpage>
            <lpage>19</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0166-6851(03)00025-2</pubid>
                  <pubid idtype="pmpid">12706792</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B91">
            <title>
               <p>Phylogenomic evidence supports past endosymbiosis, intracellular and horizontal gene transfer in <it>Cryptosporidium parvum</it></p>
            </title>
            <aug>
               <au>
                  <snm>Huang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Mullapudi</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Lancto</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Scott</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Abrahamsen</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Kissinger</snm>
                  <fnm>JC</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2004</pubdate>
            <volume>5</volume>
            <issue>11</issue>
            <fpage>R88</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">545779</pubid>
                  <pubid idtype="pmpid">15535864</pubid>
                  <pubid idtype="doi">10.1186/gb-2004-5-11-r88</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B92">
            <title>
               <p>Horizontal gene transfer from bacteria to rumen ciliates indicates adaptation to their anaerobic carbohydrates rich environment</p>
            </title>
            <aug>
               <au>
                  <snm>Ricard</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>McEwan</snm>
                  <fnm>NR</fnm>
               </au>
               <au>
                  <snm>Dutilh</snm>
                  <fnm>BE</fnm>
               </au>
               <au>
                  <snm>Jouany</snm>
                  <fnm>JP</fnm>
               </au>
               <au>
                  <snm>Macheboeuf</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Mitsumori</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>McIntosh</snm>
                  <fnm>FM</fnm>
               </au>
               <au>
                  <snm>Michalowski</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Nagamine</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Nelson</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Newbold</snm>
                  <fnm>CJ</fnm>
               </au>
               <au>
                  <snm>Nsabimana</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Takenaka</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Thomas</snm>
                  <fnm>NA</fnm>
               </au>
               <au>
                  <snm>Ushida</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Hackstein</snm>
                  <fnm>JH</fnm>
               </au>
               <au>
                  <snm>Huynen</snm>
                  <fnm>MA</fnm>
               </au>
            </aug>
            <source>BMC Genomics</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <issue>1</issue>
            <fpage>22</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1413528</pubid>
                  <pubid idtype="pmpid">16472398</pubid>
                  <pubid idtype="doi">10.1186/1471-2164-7-22</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B93">
            <title>
               <p>You are what you eat: a gene transfer ratchet could account for bacterial genes in eukaryotic nuclear genomes</p>
            </title>
            <aug>
               <au>
                  <snm>Doolittle</snm>
                  <fnm>WF</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>1998</pubdate>
            <volume>14</volume>
            <fpage>307</fpage>
            <lpage>311</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0168-9525(98)01494-2</pubid>
                  <pubid idtype="pmpid">9724962</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B94">
            <title>
               <p>Horizontal gene transfer and the evolution of parasitic protozoa</p>
            </title>
            <aug>
               <au>
                  <snm>Richards</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Hirt</snm>
                  <fnm>RP</fnm>
               </au>
               <au>
                  <snm>Williams</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Embley</snm>
                  <fnm>TM</fnm>
               </au>
            </aug>
            <source>Protist</source>
            <pubdate>2003</pubdate>
            <volume>154</volume>
            <issue>1</issue>
            <fpage>17</fpage>
            <lpage>32</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1078/143446103764928468</pubid>
                  <pubid idtype="pmpid">12812367</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B95">
            <title>
               <p>Gene transfer: gene swapping craze reaches eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Gogarten</snm>
                  <fnm>JP</fnm>
               </au>
            </aug>
            <source>Curr Biol</source>
            <pubdate>2003</pubdate>
            <volume>13</volume>
            <issue>2</issue>
            <fpage>R53</fpage>
            <lpage>R54</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0960-9822(02)01426-4</pubid>
                  <pubid idtype="pmpid">12546803</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B96">
            <title>
               <p>Common themes in the genome strategies of pathogens</p>
            </title>
            <aug>
               <au>
                  <snm>Lawrence</snm>
                  <fnm>JG</fnm>
               </au>
            </aug>
            <source>Curr Opin Genet Dev</source>
            <pubdate>2005</pubdate>
            <volume>15</volume>
            <issue>6</issue>
            <fpage>584</fpage>
            <lpage>588</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.gde.2005.09.007</pubid>
                  <pubid idtype="pmpid">16188434</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B97">
            <title>
               <p>Genome evolution of anaerobic protists: metabolic adaptation via gene acquisition</p>
            </title>
            <aug>
               <au>
                  <snm>Andersson</snm>
                  <fnm>JO</fnm>
               </au>
            </aug>
            <source>Genomics and Evolution of Microbial Eukaryotes</source>
            <publisher>Oxford , Oxford University Press</publisher>
            <editor>Katz LA, Bhattacharya D</editor>
            <pubdate>2006</pubdate>
            <fpage>109</fpage>
            <lpage>122</lpage>
         </bibl>
         <bibl id="B98">
            <title>
               <p>Codon bias and base composition are poor indicators of horizontally transferred genes</p>
            </title>
            <aug>
               <au>
                  <snm>Koski</snm>
                  <fnm>LB</fnm>
               </au>
               <au>
                  <snm>Morton</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Golding</snm>
                  <fnm>GB</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2001</pubdate>
            <volume>18</volume>
            <issue>3</issue>
            <fpage>404</fpage>
            <lpage>412</lpage>
            <xrefbib>
               <pubid idtype="pmpid">11230541</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B99">
            <title>
               <p>Ancient horizontal gene transfer can benefit phylogenetic reconstruction</p>
            </title>
            <aug>
               <au>
                  <snm>Huang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Gogarten</snm>
                  <fnm>JP</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2006</pubdate>
            <volume>22</volume>
            <issue>7</issue>
            <fpage>361</fpage>
            <lpage>6</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tig.2006.05.004</pubid>
                  <pubid idtype="pmpid">16730850</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B100">
            <title>
               <p>Evolution of filamentous plant pathogens: gene exchange across eukaryotic kingdoms</p>
            </title>
            <aug>
               <au>
                  <snm>Richards</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Dacks</snm>
                  <fnm>JB</fnm>
               </au>
               <au>
                  <snm>Jenkinson</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Thornton</snm>
                  <fnm>CR</fnm>
               </au>
               <au>
                  <snm>Talbot</snm>
                  <fnm>NJ</fnm>
               </au>
            </aug>
            <source>Curr Biol</source>
            <pubdate>2006</pubdate>
            <volume>16</volume>
            <fpage>1857</fpage>
            <lpage>1864</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.cub.2006.07.052</pubid>
                  <pubid idtype="pmpid">16979565</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B101">
            <title>
               <p>Emergence of a new disease as a result of interspecific virulence gene transfer</p>
            </title>
            <aug>
               <au>
                  <snm>Friesen</snm>
                  <fnm>TL</fnm>
               </au>
               <au>
                  <snm>Stukenbrock</snm>
                  <fnm>EH</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Meinhardt</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Ling</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Faris</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Rasmussen</snm>
                  <fnm>JB</fnm>
               </au>
               <au>
                  <snm>Solomon</snm>
                  <fnm>PS</fnm>
               </au>
               <au>
                  <snm>McDonald</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Oliver</snm>
                  <fnm>RP</fnm>
               </au>
            </aug>
            <source>Nat Genet</source>
            <pubdate>2006</pubdate>
            <volume>38</volume>
            <issue>8</issue>
            <fpage>953</fpage>
            <lpage>956</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/ng1839</pubid>
                  <pubid idtype="pmpid">16832356</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B102">
            <title>
               <p>Evidence from SSU rRNA phylogeny that <it>Octomitus</it> is a sister lineage to <it>Giardia</it></p>
            </title>
            <aug>
               <au>
                  <snm>Keeling</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Brugerolle</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Protist</source>
            <pubdate>2006</pubdate>
            <volume>157</volume>
            <issue>2</issue>
            <fpage>205</fpage>
            <lpage>12</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.protis.2006.01.003</pubid>
                  <pubid idtype="pmpid">16618550</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B103">
            <title>
               <p>The <it>Giardia</it> genome project database</p>
            </title>
            <aug>
               <au>
                  <snm>McArthur</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Morrison</snm>
                  <fnm>HG</fnm>
               </au>
               <au>
                  <snm>Nixon</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Passamaneck</snm>
                  <fnm>NQ</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Hinkle</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Crocker</snm>
                  <fnm>MK</fnm>
               </au>
               <au>
                  <snm>Holder</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Farr</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Reich</snm>
                  <fnm>CI</fnm>
               </au>
               <au>
                  <snm>Olsen</snm>
                  <fnm>GE</fnm>
               </au>
               <au>
                  <snm>Aley</snm>
                  <fnm>SB</fnm>
               </au>
               <au>
                  <snm>Adam</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Gillin</snm>
                  <fnm>FD</fnm>
               </au>
               <au>
                  <snm>Sogin</snm>
                  <fnm>ML</fnm>
               </au>
            </aug>
            <source>FEMS Microbiol Lett</source>
            <pubdate>2000</pubdate>
            <volume>189</volume>
            <issue>2</issue>
            <fpage>271</fpage>
            <lpage>273</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1574-6968.2000.tb09242.x</pubid>
                  <pubid idtype="pmpid">10930750</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B104">
            <title>
               <p>DOE Joint Genome Institute</p>
            </title>
            <url>http://www.jgi.doe.gov/</url>
         </bibl>
         <bibl id="B105">
            <title>
               <p><it>In vitro</it> cultivation and temperature-dependent growth of two strains of <it>Spironucleus barkhanus</it> (Diplomonadida: Hexamitidae) from Atlantic salmon <it>Salmo salar</it> and grayling <it>Thymallus thymallus</it></p>
            </title>
            <aug>
               <au>
                  <snm>Sterud</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>Dis Aquat Organ</source>
            <pubdate>1998</pubdate>
            <volume>33</volume>
            <issue>1</issue>
            <fpage>57</fpage>
            <lpage>61</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid">9653459</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B106">
            <title>
               <p>Laboratory of Phil Green</p>
            </title>
            <url>http://www.phrap.org/</url>
         </bibl>
         <bibl id="B107">
            <title>
               <p>WebLogo: a sequence logo generator</p>
            </title>
            <aug>
               <au>
                  <snm>Crooks</snm>
                  <fnm>GE</fnm>
               </au>
               <au>
                  <snm>Hon</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Chandonia</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Brenner</snm>
                  <fnm>SE</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2004</pubdate>
            <volume>14</volume>
            <issue>6</issue>
            <fpage>1188</fpage>
            <lpage>1190</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">419797</pubid>
                  <pubid idtype="pmpid">15173120</pubid>
                  <pubid idtype="doi">10.1101/gr.849004</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B108">
            <title>
               <p>Staden package home page</p>
            </title>
            <url>http://staden.sourceforge.net/</url>
         </bibl>
         <bibl id="B109">
            <title>
               <p>Genomic mapping by fingerprinting random clones: a mathematical analysis</p>
            </title>
            <aug>
               <au>
                  <snm>Lander</snm>
                  <fnm>ES</fnm>
               </au>
               <au>
                  <snm>Waterman</snm>
                  <fnm>MS</fnm>
               </au>
            </aug>
            <source>Genomics</source>
            <pubdate>1988</pubdate>
            <volume>2</volume>
            <issue>3</issue>
            <fpage>231</fpage>
            <lpage>239</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0888-7543(88)90007-9</pubid>
                  <pubid idtype="pmpid">3294162</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B110">
            <title>
               <p>National Center for Biotechnology Information</p>
            </title>
            <url>http://www.ncbi.nlm.nih.gov/</url>
         </bibl>
         <bibl id="B111">
            <title>
               <p>The Institute for Genomic Research</p>
            </title>
            <url>http://www.tigr.org/</url>
         </bibl>
         <bibl id="B112">
            <title>
               <p>dictyBase home page</p>
            </title>
            <url>http://dictybase.org/</url>
         </bibl>
         <bibl id="B113">
            <title>
               <p>KEGG: Kyoto Encyclopedia of Genes and Genomes</p>
            </title>
            <url>http://www.genome.jp/kegg/</url>
         </bibl>
         <bibl id="B114">
            <title>
               <p>Gapped BLAST and PSI-BLAST: a new generation of protein database search programs</p>
            </title>
            <aug>
               <au>
                  <snm>Altschul</snm>
                  <fnm>SF</fnm>
               </au>
               <au>
                  <snm>Madden</snm>
                  <fnm>TL</fnm>
               </au>
               <au>
                  <snm>Schaffer</snm>
                  <fnm>AA</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Lipman</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1997</pubdate>
            <volume>25</volume>
            <fpage>3389</fpage>
            <lpage>3402</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">146917</pubid>
                  <pubid idtype="pmpid">9254694</pubid>
                  <pubid idtype="doi">10.1093/nar/25.17.3389</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B115">
            <title>
               <p>tRNAscan-SE: a program for improved detection of transfer RNA genes in genomic sequence</p>
            </title>
            <aug>
               <au>
                  <snm>Lowe</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>Eddy</snm>
                  <fnm>SR</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1997</pubdate>
            <volume>25</volume>
            <issue>5</issue>
            <fpage>955</fpage>
            <lpage>964</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">146525</pubid>
                  <pubid idtype="pmpid">9023104</pubid>
                  <pubid idtype="doi">10.1093/nar/25.5.955</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B116">
            <title>
               <p>ARAGORN, a program to detect tRNA genes and tmRNA genes in nucleotide sequences</p>
            </title>
            <aug>
               <au>
                  <snm>Laslett</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Canback</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2004</pubdate>
            <volume>32</volume>
            <issue>1</issue>
            <fpage>11</fpage>
            <lpage>16</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">373265</pubid>
                  <pubid idtype="pmpid">14704338</pubid>
                  <pubid idtype="doi">10.1093/nar/gkh152</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B117">
            <title>
               <p>The 'effective number of codons' used in a gene</p>
            </title>
            <aug>
               <au>
                  <snm>Wright</snm>
                  <fnm>F</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>1990</pubdate>
            <volume>87</volume>
            <issue>1</issue>
            <fpage>23</fpage>
            <lpage>29</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0378-1119(90)90491-9</pubid>
                  <pubid idtype="pmpid">2110097</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B118">
            <title>
               <p>INCA: synonymous codon usage analysis and clustering by means of self-organizing map</p>
            </title>
            <aug>
               <au>
                  <snm>Supek</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Vlahovicek</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2004</pubdate>
            <volume>20</volume>
            <issue>14</issue>
            <fpage>2329</fpage>
            <lpage>2330</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/bth238</pubid>
                  <pubid idtype="pmpid">15059815</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B119">
            <title>
               <p>Correspondence analysis of codon usage</p>
            </title>
            <url>http://codonw.sourceforge.net/</url>
         </bibl>
         <bibl id="B120">
            <title>
               <p>KEGG: Kyoto Encyclopedia of Genes and Genomes</p>
            </title>
            <aug>
               <au>
                  <snm>Kanehisa</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Goto</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2000</pubdate>
            <volume>28</volume>
            <issue>1</issue>
            <fpage>27</fpage>
            <lpage>30</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">102409</pubid>
                  <pubid idtype="pmpid">10592173</pubid>
                  <pubid idtype="doi">10.1093/nar/28.1.27</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B121">
            <title>
               <p>CYGD: the Comprehensive Yeast Genome Database</p>
            </title>
            <aug>
               <au>
                  <snm>G&#252;ldener</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>M&#252;nsterk&#246;tter</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kastenm&#252;ller</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Strack</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>van Helden</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lemer</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Richelles</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wodak</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Garc&#237;a-Mart&#237;nez</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>P&#233;rez-Ortin</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Michael</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Kaps</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Talla</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Dujon</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Andre</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Souciet</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>De Montigny</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Bon</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Gaillardin</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Mewes</snm>
                  <fnm>HW</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2005</pubdate>
            <volume>33</volume>
            <issue>Database issue</issue>
            <fpage>D364</fpage>
            <lpage>8</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">540007</pubid>
                  <pubid idtype="pmpid">15608217</pubid>
                  <pubid idtype="doi">10.1093/nar/gki053</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B122">
            <title>
               <p>The closest BLAST hit is often not the nearest neighbor</p>
            </title>
            <aug>
               <au>
                  <snm>Koski</snm>
                  <fnm>LB</fnm>
               </au>
               <au>
                  <snm>Golding</snm>
                  <fnm>GB</fnm>
               </au>
            </aug>
            <source>J Mol Evol</source>
            <pubdate>2001</pubdate>
            <volume>52</volume>
            <issue>6</issue>
            <fpage>540</fpage>
            <lpage>542</lpage>
            <xrefbib>
               <pubid idtype="pmpid">11443357</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B123">
            <title>
               <p>HMMER: sequence analysis using profile hidden Markov models</p>
            </title>
            <url>http://hmmer.janelia.org</url>
         </bibl>
         <bibl id="B124">
            <title>
               <p>A general empirical model of protein evolution derived from multiple protein families using a maximum-likelihood approach</p>
            </title>
            <aug>
               <au>
                  <snm>Whelan</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Goldman</snm>
                  <fnm>N</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2001</pubdate>
            <volume>18</volume>
            <issue>5</issue>
            <fpage>691</fpage>
            <lpage>699</lpage>
            <xrefbib>
               <pubid idtype="pmpid">11319253</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B125">
            <title>
               <p>SMART 4.0: towards genomic data integration</p>
            </title>
            <aug>
               <au>
                  <snm>Letunic</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Copley</snm>
                  <fnm>RR</fnm>
               </au>
               <au>
                  <snm>Schmidt</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Ciccarelli</snm>
                  <fnm>FD</fnm>
               </au>
               <au>
                  <snm>Doerks</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Schultz</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ponting</snm>
                  <fnm>CP</fnm>
               </au>
               <au>
                  <snm>Bork</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2004</pubdate>
            <volume>32</volume>
            <issue>Database issue</issue>
            <fpage>D142</fpage>
            <lpage>4</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">308822</pubid>
                  <pubid idtype="pmpid">14681379</pubid>
                  <pubid idtype="doi">10.1093/nar/gkh088</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B126">
            <title>
               <p>Predicting transmembrane protein topology with a hidden Markov model: application to complete genomes</p>
            </title>
            <aug>
               <au>
                  <snm>Krogh</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Larsson</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>von Heijne</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Sonnhammer</snm>
                  <fnm>EL</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>2001</pubdate>
            <volume>305</volume>
            <issue>3</issue>
            <fpage>567</fpage>
            <lpage>580</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1006/jmbi.2000.4315</pubid>
                  <pubid idtype="pmpid">11152613</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B127">
            <title>
               <p>T-Coffee: A novel method for fast and accurate multiple sequence alignment</p>
            </title>
            <aug>
               <au>
                  <snm>Notredame</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Higgins</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Heringa</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>2000</pubdate>
            <volume>302</volume>
            <issue>1</issue>
            <fpage>205</fpage>
            <lpage>217</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1006/jmbi.2000.4042</pubid>
                  <pubid idtype="pmpid">10964570</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B128">
            <title>
               <p>Improved prediction of signal peptides: SignalP 3.0</p>
            </title>
            <aug>
               <au>
                  <snm>Bendtsen</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Nielsen</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>von Heijne</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Brunak</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>2004</pubdate>
            <volume>340</volume>
            <issue>4</issue>
            <fpage>783</fpage>
            <lpage>795</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.jmb.2004.05.028</pubid>
                  <pubid idtype="pmpid">15223320</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B129">
            <title>
               <p>VSP417-6, a variant-specific surface protein encoded at a sixth locus within the vsp417 gene subfamily of <it>Giardia intestinalis</it></p>
            </title>
            <aug>
               <au>
                  <snm>Ey</snm>
                  <fnm>PL</fnm>
               </au>
               <au>
                  <snm>Darby</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Int J Parasitol</source>
            <pubdate>2002</pubdate>
            <volume>32</volume>
            <issue>4</issue>
            <fpage>425</fpage>
            <lpage>436</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0020-7519(01)00366-6</pubid>
                  <pubid idtype="pmpid">11849639</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>

