<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1471-2164-10-145</ui>
   <ji>1471-2164</ji>
   <fm>
      <dochead>Research article</dochead>
      <bibl>
         <title>
            <p>The complete genome sequence of <it>Staphylothermus marinus </it>reveals differences in sulfur metabolism among heterotrophic Crenarchaeota</p>
         </title>
         <aug>
            <au id="A1" ca="yes">
               <snm>Anderson</snm>
               <mi>J</mi>
               <fnm>Iain</fnm>
               <insr iid="I1"/>
               <email>IJAnderson@lbl.gov</email>
            </au>
            <au id="A2">
               <snm>Dharmarajan</snm>
               <fnm>Lakshmi</fnm>
               <insr iid="I2"/>
               <email>laxo82@vt.edu</email>
            </au>
            <au id="A3">
               <snm>Rodriguez</snm>
               <fnm>Jason</fnm>
               <insr iid="I2"/>
               <insr iid="I3"/>
               <email>jrodri@vt.edu</email>
            </au>
            <au id="A4">
               <snm>Hooper</snm>
               <fnm>Sean</fnm>
               <insr iid="I1"/>
               <email>SHooper@lbl.gov</email>
            </au>
            <au id="A5">
               <snm>Porat</snm>
               <fnm>Iris</fnm>
               <insr iid="I4"/>
               <insr iid="I13"/>
               <email>porati@ornl.gov</email>
            </au>
            <au id="A6">
               <snm>Ulrich</snm>
               <mi>E</mi>
               <fnm>Luke</fnm>
               <insr iid="I5"/>
               <email>ulrich.luke@gmail.com</email>
            </au>
            <au id="A7">
               <snm>Elkins</snm>
               <mi>G</mi>
               <fnm>James</fnm>
               <insr iid="I6"/>
               <email>elkinsjg@ornl.gov</email>
            </au>
            <au id="A8">
               <snm>Mavromatis</snm>
               <fnm>Kostas</fnm>
               <insr iid="I1"/>
               <email>KMavrommatis@lbl.gov</email>
            </au>
            <au id="A9">
               <snm>Sun</snm>
               <fnm>Hui</fnm>
               <insr iid="I7"/>
               <email>HSun@lbl.gov</email>
            </au>
            <au id="A10">
               <snm>Land</snm>
               <fnm>Miriam</fnm>
               <insr iid="I6"/>
               <email>landml@ornl.gov</email>
            </au>
            <au id="A11">
               <snm>Lapidus</snm>
               <fnm>Alla</fnm>
               <insr iid="I7"/>
               <email>ALapidus@lbl.gov</email>
            </au>
            <au id="A12">
               <snm>Lucas</snm>
               <fnm>Susan</fnm>
               <insr iid="I7"/>
               <email>lucas11@llnl.gov</email>
            </au>
            <au id="A13">
               <snm>Barry</snm>
               <fnm>Kerrie</fnm>
               <insr iid="I8"/>
               <email>KWBarry@lbl.gov</email>
            </au>
            <au id="A14">
               <snm>Huber</snm>
               <fnm>Harald</fnm>
               <insr iid="I9"/>
               <email>harald.huber@biologie.uni-regensburg.de</email>
            </au>
            <au id="A15">
               <snm>Zhulin</snm>
               <mi>B</mi>
               <fnm>Igor</fnm>
               <insr iid="I5"/>
               <email>ijouline@utk.edu</email>
            </au>
            <au id="A16">
               <snm>Whitman</snm>
               <mi>B</mi>
               <fnm>William</fnm>
               <insr iid="I4"/>
               <email>whitman@uga.edu</email>
            </au>
            <au id="A17">
               <snm>Mukhopadhyay</snm>
               <fnm>Biswarup</fnm>
               <insr iid="I2"/>
               <insr iid="I3"/>
               <insr iid="I10"/>
               <email>biswarup@vt.edu</email>
            </au>
            <au id="A18">
               <snm>Woese</snm>
               <fnm>Carl</fnm>
               <insr iid="I11"/>
               <email>carl@life.uiuc.edu</email>
            </au>
            <au id="A19">
               <snm>Bristow</snm>
               <fnm>James</fnm>
               <insr iid="I12"/>
               <email>JBristow@lbl.gov</email>
            </au>
            <au id="A20">
               <snm>Kyrpides</snm>
               <fnm>Nikos</fnm>
               <insr iid="I1"/>
               <email>NCKyrpides@lbl.gov</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Genome Biology Program, Joint Genome Institute, Walnut Creek, USA</p>
            </ins>
            <ins id="I2">
               <p>Virginia Bioinformatics Institute, Virginia Polytechnic Institute and State University, Blacksburg, USA</p>
            </ins>
            <ins id="I3">
               <p>Department of Biochemistry, Virginia Polytechnic Institute and State University, Blacksburg, USA</p>
            </ins>
            <ins id="I4">
               <p>Department of Microbiology, University of Georgia, Athens, USA</p>
            </ins>
            <ins id="I5">
               <p>Joint Institute for Computational Sciences, University of Tennessee &#8211; Oak Ridge National Laboratory, Oak Ridge, USA</p>
            </ins>
            <ins id="I6">
               <p>Biosciences Division, Oak Ridge National Laboratory, Oak Ridge, USA</p>
            </ins>
            <ins id="I7">
               <p>Production Department, Joint Genome Institute, Walnut Creek, USA</p>
            </ins>
            <ins id="I8">
               <p>Project Management Department, Joint Genome Institute, Walnut Creek, USA</p>
            </ins>
            <ins id="I9">
               <p>Lehrstuhl f&#252;r Mikrobiologie und Archaeenzentrum, Universit&#228;t Regensburg, Regensburg, Germany</p>
            </ins>
            <ins id="I10">
               <p>Biological Sciences Department, Virginia Polytechnic Institute and State University, Blacksburg, USA</p>
            </ins>
            <ins id="I11">
               <p>Department of Microbiology, University of Illinois, Urbana USA</p>
            </ins>
            <ins id="I12">
               <p>Programs Department, Joint Genome Institute, Walnut Creek, USA</p>
            </ins>
            <ins id="I13">
               <p>Biological and Environmental Sciences Directorate, Oak Ridge National Laboratory, Oak Ridge, USA</p>
            </ins>
         </insg>
         <source>BMC Genomics</source>
         <issn>1471-2164</issn>
         <pubdate>2009</pubdate>
         <volume>10</volume>
         <issue>1</issue>
         <fpage>145</fpage>
         <url>http://www.biomedcentral.com/1471-2164/10/145</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">19341479</pubid>
               <pubid idtype="doi">10.1186/1471-2164-10-145</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>05</day>
               <month>9</month>
               <year>2008</year>
            </date>
         </rec>
         <acc>
            <date>
               <day>02</day>
               <month>4</month>
               <year>2009</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>02</day>
               <month>4</month>
               <year>2009</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2009</year>
         <collab>Anderson et al; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p><it>Staphylothermus marinus </it>is an anaerobic, sulfur-reducing peptide fermenter of the archaeal phylum Crenarchaeota. It is the third heterotrophic, obligate sulfur reducing crenarchaeote to be sequenced and provides an opportunity for comparative analysis of the three genomes.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>The 1.57 Mbp genome of the hyperthermophilic crenarchaeote <it>Staphylothermus marinus </it>has been completely sequenced. The main energy generating pathways likely involve 2-oxoacid:ferredoxin oxidoreductases and ADP-forming acetyl-CoA synthases. <it>S. marinus </it>possesses several enzymes not present in other crenarchaeotes including a sodium ion-translocating decarboxylase likely to be involved in amino acid degradation. <it>S. marinus </it>lacks sulfur-reducing enzymes present in the other two sulfur-reducing crenarchaeotes that have been sequenced &#8211; <it>Thermofilum pendens </it>and <it>Hyperthermus butylicus</it>. Instead it has three operons similar to the <it>mbh </it>and <it>mbx </it>operons of <it>Pyrococcus furiosus</it>, which may play a role in sulfur reduction and/or hydrogen production. The two marine organisms, <it>S. marinus </it>and <it>H. butylicus</it>, possess more sodium-dependent transporters than <it>T. pendens </it>and use symporters for potassium uptake while <it>T. pendens </it>uses an ATP-dependent potassium transporter. <it>T. pendens </it>has adapted to a nutrient-rich environment while <it>H. butylicus </it>is adapted to a nutrient-poor environment, and <it>S. marinus </it>lies between these two extremes.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>The three heterotrophic sulfur-reducing crenarchaeotes have adapted to their habitats, terrestrial vs. marine, via their transporter content, and they have also adapted to environments with differing levels of nutrients. Despite the fact that they all use sulfur as an electron acceptor, they are likely to have different pathways for sulfur reduction.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>Crenarchaeota is one of the two major phyla of the domain Archaea. Many crenarchaeotes are heterotrophic, anaerobic, sulfur-reducing hyperthermophiles, but the crenarchaeotes with completely sequenced genomes are primarily aerobes. Of the archaea with published genomes, only <it>Hyperthermus butylicus </it>and <it>Thermofilum pendens </it>are heterotrophic, obligate sulfur-reducing anaerobes <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B2">2</abbr></abbrgrp>. More genomes are needed from anaerobic crenarchaeotes in order to determine if their phenotypic similarities are reflected in their genomes.</p>
         <p><it>Staphylothermus marinus </it>was isolated from a black smoker and from volcanically heated sediments <abbrgrp><abbr bid="B3">3</abbr></abbrgrp>. It is a hyperthermophile, with a maximum growth temperature of 98&#176;C. Its name reflects its proclivity to form clusters of up to 100 cells. At high concentrations of yeast extract it forms large cells up to 15 &#956;m in diameter. It is a strict anaerobe and grows heterotrophically on complex media. H<sub>2</sub>S, CO<sub>2</sub>, acetate and isovalerate are metabolic products, suggesting a metabolism similar to that of the Thermococcales of the phylum Euryarchaeota. Dark granules observed within the cytoplasm may consist of glycogen. While <it>S. marinus </it>can survive in the absence of sulfur and produce hydrogen rather than H<sub>2</sub>S, it requires sulfur for growth <abbrgrp><abbr bid="B4">4</abbr></abbrgrp>. An unusual cell surface protein named tetrabrachion has been characterized from <it>S. marinus </it><abbrgrp><abbr bid="B5">5</abbr></abbrgrp>, and a 24-subunit phosphoenolpyruvate-utilizing enzyme with a unique structure has also been studied <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>.</p>
         <p>Here we report the complete genome of the anaerobic, sulfur-reducing archaeon <it>S. marinus </it>and a comparative analysis with other sulfur-reducing heterotrophic crenarchaeotes. While some features in <it>S. marinus </it>are similar to <it>H. butylicus </it><abbrgrp><abbr bid="B7">7</abbr></abbrgrp> and <it>T. pendens </it><abbrgrp><abbr bid="B8">8</abbr></abbrgrp>, including peptide fermentation enzymes, there are also major differences, particularly in the electron transport machinery.</p>
      </sec>
      <sec>
         <st>
            <p>Results</p>
         </st>
         <sec>
            <st>
               <p>General features</p>
            </st>
            <p>The genome of <it>S. marinus </it>F1 consists of a circular chromosome of 1.57 Mbp. There is one copy each of 5S, 16S, and 23S ribosomal RNA. About 59% of protein-coding genes begin with an AUG codon, 8% with GUG, and 33% with UUG. The low number of GUG start codons reflects the low GC content of this genome (35.7% GC). The ribosomal protein L12ae gene (Smar_1096) does not have a valid start codon, but this is likely to be an essential gene. Based on alignment with L12ae proteins from other archaea, it appears that the <it>S. marinus </it>gene begins with an ATC start codon. <it>S. marinus </it>has 12 regions of CRISPR repeats containing between 5 and 17 repeats. Twelve CRISPR-associated proteins are found in the vicinity of three of the repeats, between coordinates 323,400 and 345,500 (Smar_0308-Smar_0325), and one other CRISPR-associated protein is found at a different location not close to any repeats (Smar_1195).</p>
            <p>The genome statistics for <it>S. marinus </it>and the two other sulfur-reducing crenarchaeotes are presented in Table <tblr tid="T1">1</tblr>. While the genome of <it>H. butylicus </it>is larger than that of <it>S. marinus</it>, they both have approximately the same number of genes due to the lower coding percentage of <it>H. butylicus</it>. <it>T. pendens </it>has a larger genome and a greater number of genes than the other two (discussed below). The GC content of <it>S. marinus </it>is much lower than the others, but this is not unusual for a hyperthermophile. It is in the same range as the GC content of the <it>Sulfolobus </it>genomes, while <it>Methanocaldococcus jannaschii </it>and <it>Nanoarchaeum equitans </it>have lower GC contents (31% and 32% respectively). <it>T. pendens </it>has a much higher percentage of genes in paralog clusters than the others, suggesting that gene duplication and divergence have been more prevalent in this genome. <it>S. marinus </it>has a smaller percentage of genes with signal peptides. In all three genomes the predicted exported proteins are primarily ABC transporter substrate-binding proteins and hypothetical proteins. <it>S. marinus </it>has approximately the same number of ABC transporters for uptake of nutrients as <it>H. butylicus</it>, but they both have fewer than <it>T. pendens</it>.</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Genome statistics.</p>
               </caption>
               <tblbdy cols="4">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. marinus</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>H. butylicus</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>T. pendens</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Genome size (bp)</p>
                     </c>
                     <c ca="left">
                        <p>1,570,485</p>
                     </c>
                     <c ca="left">
                        <p>1,667,163</p>
                     </c>
                     <c ca="left">
                        <p>1,813,393</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Coding region (bp)</p>
                     </c>
                     <c ca="left">
                        <p>1,399,012 (89.1%)</p>
                     </c>
                     <c ca="left">
                        <p>1,385,726 (83.1%)</p>
                     </c>
                     <c ca="left">
                        <p>1,651,626 (91.1%)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>G+C content (bp)</p>
                     </c>
                     <c ca="left">
                        <p>561,080 (35.7%)</p>
                     </c>
                     <c ca="left">
                        <p>895,879 (53.7%)</p>
                     </c>
                     <c ca="left">
                        <p>1,045,351 (57.6%)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total genes</p>
                     </c>
                     <c ca="left">
                        <p>1655</p>
                     </c>
                     <c ca="left">
                        <p>1668</p>
                     </c>
                     <c ca="left">
                        <p>1923</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>RNA genes</p>
                     </c>
                     <c ca="left">
                        <p>45 (2.7%)</p>
                     </c>
                     <c ca="left">
                        <p>52 (3.1%)</p>
                     </c>
                     <c ca="left">
                        <p>40 (2.1%)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Protein-coding genes</p>
                     </c>
                     <c ca="left">
                        <p>1610 (97.3%)</p>
                     </c>
                     <c ca="left">
                        <p>1616 (96.9%)</p>
                     </c>
                     <c ca="left">
                        <p>1883 (97.9%)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Genes with function prediction</p>
                     </c>
                     <c ca="left">
                        <p>974 (58.9%)</p>
                     </c>
                     <c ca="left">
                        <p>981 (58.8%)</p>
                     </c>
                     <c ca="left">
                        <p>1170 (60.8%)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Genes in ortholog clusters</p>
                     </c>
                     <c ca="left">
                        <p>1391 (84.0%)</p>
                     </c>
                     <c ca="left">
                        <p>1380 (82.7%)</p>
                     </c>
                     <c ca="left">
                        <p>1559 (81.1%)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Genes in paralog clusters</p>
                     </c>
                     <c ca="left">
                        <p>542 (32.7%)</p>
                     </c>
                     <c ca="left">
                        <p>488 (29.3%)</p>
                     </c>
                     <c ca="left">
                        <p>805 (41.9%)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Genes assigned to COGs</p>
                     </c>
                     <c ca="left">
                        <p>1109 (67.0%)</p>
                     </c>
                     <c ca="left">
                        <p>1114 (66.8%)</p>
                     </c>
                     <c ca="left">
                        <p>1264 (65.7%)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Genes assigned Pfam domains</p>
                     </c>
                     <c ca="left">
                        <p>1062 (64.2%)</p>
                     </c>
                     <c ca="left">
                        <p>1042 (62.5%)</p>
                     </c>
                     <c ca="left">
                        <p>1215 (63.2%)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Genes with signal peptides</p>
                     </c>
                     <c ca="left">
                        <p>37 (2.2%)</p>
                     </c>
                     <c ca="left">
                        <p>70 (4.2%)</p>
                     </c>
                     <c ca="left">
                        <p>134 (7.0%)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Genes with transmembrane helices</p>
                     </c>
                     <c ca="left">
                        <p>348 (21.0%)</p>
                     </c>
                     <c ca="left">
                        <p>294 (17.6%)</p>
                     </c>
                     <c ca="left">
                        <p>437 (22.7%)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Fusion genes</p>
                     </c>
                     <c ca="left">
                        <p>44 (2.7%)</p>
                     </c>
                     <c ca="left">
                        <p>32 (1.9%)</p>
                     </c>
                     <c ca="left">
                        <p>74 (3.8%)</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <p><it>T. pendens </it>has about 270 more protein-coding genes than the other two, but only about 150 more genes with COG hits, suggesting that 120 of the additional genes in <it>T. pendens </it>are hypothetical proteins. We compared COG categories <abbrgrp><abbr bid="B9">9</abbr></abbrgrp> between the three crenarchaeotes to determine what categories were more prevalent in <it>T. pendens </it>compared to the other two (Table <tblr tid="T2">2</tblr>). <it>T. pendens </it>has a higher number of genes in many categories, suggesting that the additional genes are spread out among a number of cellular processes. The three categories with the greatest additional genes in <it>T. pendens </it>are carbohydrate metabolism and transport, cell wall/membrane/envelope biogenesis, and function unknown. The greater number of carbohydrate-associated genes is mainly due to a larger number of transporters. <it>T. pendens </it>has more ABC transporters than the other two and a phosphotransferase (PTS) system transporter, as well as a higher number of transporters assigned to COG2814, arabinose efflux permease, which are transporters of the major facilitator superfamily. In addition, <it>T. pendens </it>has three sugar kinases of COG1070, while the other two have none. Thus <it>T. pendens </it>can probably take up and utilize a greater number of carbohydrates than the other two. The greater number of cell wall-associated genes in <it>T. pendens </it>is mainly due to a greater number of glycosyltransferases (COG0438) and nucleotide sugar metabolic enzymes. This suggests that <it>T. pendens </it>has a greater variety of sugars attached to lipids and/or proteins on the outside of the cell.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Comparison of COG categories among the three sulfur-reducing crenarchaeotes.</p>
               </caption>
               <tblbdy cols="4">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>S. marinus</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>H. butylicus</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>T. pendens</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Amino acid transport and metabolism</p>
                     </c>
                     <c ca="left">
                        <p>74</p>
                     </c>
                     <c ca="left">
                        <p>75</p>
                     </c>
                     <c ca="left">
                        <p>89</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Carbohydrate transport and metabolism</p>
                     </c>
                     <c ca="left">
                        <p>72</p>
                     </c>
                     <c ca="left">
                        <p>40</p>
                     </c>
                     <c ca="left">
                        <p>108</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cell cycle control, cell division, chromosome partitioning</p>
                     </c>
                     <c ca="left">
                        <p>8</p>
                     </c>
                     <c ca="left">
                        <p>7</p>
                     </c>
                     <c ca="left">
                        <p>13</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cell motility</p>
                     </c>
                     <c ca="left">
                        <p>4</p>
                     </c>
                     <c ca="left">
                        <p>6</p>
                     </c>
                     <c ca="left">
                        <p>5</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cell wall/membrane/envelope biogenesis</p>
                     </c>
                     <c ca="left">
                        <p>23</p>
                     </c>
                     <c ca="left">
                        <p>24</p>
                     </c>
                     <c ca="left">
                        <p>47</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chromatin structure and dynamics</p>
                     </c>
                     <c ca="left">
                        <p>2</p>
                     </c>
                     <c ca="left">
                        <p>1</p>
                     </c>
                     <c ca="left">
                        <p>2</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Coenzyme transport and metabolism</p>
                     </c>
                     <c ca="left">
                        <p>53</p>
                     </c>
                     <c ca="left">
                        <p>75</p>
                     </c>
                     <c ca="left">
                        <p>51</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cytoskeleton</p>
                     </c>
                     <c ca="left">
                        <p>0</p>
                     </c>
                     <c ca="left">
                        <p>0</p>
                     </c>
                     <c ca="left">
                        <p>1</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Defense mechanisms</p>
                     </c>
                     <c ca="left">
                        <p>17</p>
                     </c>
                     <c ca="left">
                        <p>10</p>
                     </c>
                     <c ca="left">
                        <p>22</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Energy production and conversion</p>
                     </c>
                     <c ca="left">
                        <p>92</p>
                     </c>
                     <c ca="left">
                        <p>109</p>
                     </c>
                     <c ca="left">
                        <p>119</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Extracellular structures</p>
                     </c>
                     <c ca="left">
                        <p>0</p>
                     </c>
                     <c ca="left">
                        <p>0</p>
                     </c>
                     <c ca="left">
                        <p>0</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Function unknown</p>
                     </c>
                     <c ca="left">
                        <p>116</p>
                     </c>
                     <c ca="left">
                        <p>113</p>
                     </c>
                     <c ca="left">
                        <p>132</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>General function prediction only</p>
                     </c>
                     <c ca="left">
                        <p>199</p>
                     </c>
                     <c ca="left">
                        <p>206</p>
                     </c>
                     <c ca="left">
                        <p>212</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Inorganic ion transport and metabolism</p>
                     </c>
                     <c ca="left">
                        <p>85</p>
                     </c>
                     <c ca="left">
                        <p>57</p>
                     </c>
                     <c ca="left">
                        <p>82</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Intracellular trafficking, secretion, and vesicular transport</p>
                     </c>
                     <c ca="left">
                        <p>12</p>
                     </c>
                     <c ca="left">
                        <p>15</p>
                     </c>
                     <c ca="left">
                        <p>15</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Lipid transport and metabolism</p>
                     </c>
                     <c ca="left">
                        <p>15</p>
                     </c>
                     <c ca="left">
                        <p>20</p>
                     </c>
                     <c ca="left">
                        <p>20</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Nuclear structure</p>
                     </c>
                     <c ca="left">
                        <p>0</p>
                     </c>
                     <c ca="left">
                        <p>0</p>
                     </c>
                     <c ca="left">
                        <p>0</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Nucleotide transport and metabolism</p>
                     </c>
                     <c ca="left">
                        <p>39</p>
                     </c>
                     <c ca="left">
                        <p>43</p>
                     </c>
                     <c ca="left">
                        <p>42</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Posttranslational modification, protein turnover, chaperones</p>
                     </c>
                     <c ca="left">
                        <p>53</p>
                     </c>
                     <c ca="left">
                        <p>56</p>
                     </c>
                     <c ca="left">
                        <p>63</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>RNA processing and modification</p>
                     </c>
                     <c ca="left">
                        <p>2</p>
                     </c>
                     <c ca="left">
                        <p>2</p>
                     </c>
                     <c ca="left">
                        <p>1</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Replication, recombination and repair</p>
                     </c>
                     <c ca="left">
                        <p>71</p>
                     </c>
                     <c ca="left">
                        <p>61</p>
                     </c>
                     <c ca="left">
                        <p>78</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Secondary metabolites biosynthesis, transport, and catabolism</p>
                     </c>
                     <c ca="left">
                        <p>5</p>
                     </c>
                     <c ca="left">
                        <p>9</p>
                     </c>
                     <c ca="left">
                        <p>3</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Signal transduction mechanisms</p>
                     </c>
                     <c ca="left">
                        <p>18</p>
                     </c>
                     <c ca="left">
                        <p>24</p>
                     </c>
                     <c ca="left">
                        <p>15</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Transcription</p>
                     </c>
                     <c ca="left">
                        <p>60</p>
                     </c>
                     <c ca="left">
                        <p>66</p>
                     </c>
                     <c ca="left">
                        <p>73</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Translation</p>
                     </c>
                     <c ca="left">
                        <p>164</p>
                     </c>
                     <c ca="left">
                        <p>161</p>
                     </c>
                     <c ca="left">
                        <p>153</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <p>The <it>S. marinus </it>genome contains several protein families not found before in crenarchaeotes, and these are discussed below. <it>S. marinus </it>is the first crenarchaeote found to have an arginine decarboxylase belonging to COG1166 (Smar_0204), which includes the <it>speA </it>gene of <it>E. coli</it>. This protein family is also found in one euryarchaeote, <it>Methanosaeta thermophila</it>. Most euryarchaeota have a pyruvoyl-dependent arginine decarboxylase <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>. <it>T. pendens </it>and <it>Cenarchaeum symbiosum </it>also contain this type of enzyme. No arginine decarboxylase has been identified in other crenarchaeote genomes. Phylogenetic analysis of the <it>S. marinus </it>arginine decarboxylase (not shown) does not indicate a clear case of lateral gene transfer, and this enzyme was not identified during the search for laterally transferred genes (see below).</p>
            <p><it>S. marinus </it>contains a probable cell surface protein (Smar_0566) with 4 copies of the pfam03640 repeat, which has not been found in any other crenarchaeal genome. This repeat is present in two methanogens, Candidatus <it>Methanoregula boonei </it>and Candidatus <it>Methanosphaerula palustris</it>. It is also found in a wide variety of bacteria, but its function is unknown.</p>
            <p><it>S. marinus </it>is unique among crenarchaeotes in having a sodium ion-translocating decarboxylase for energy generation (Smar_1503-1504). It also has three putative operons containing subunits of multisubunit cation/proton antiporters, although these are likely to belong to large membrane-bound ion-translocating enzyme complexes rather than acting as cation antiporters (see below). <it>S. marinus </it>is the first crenarchaeote found to have a type I restriction-modification system (Smar_0761-0763).</p>
            <p><it>S. marinus </it>has 5 putative transposable elements. Phylogenetic analysis shows that all of them belong to family IS607 (not shown). The characterized members of this IS family contain two ORFs. In <it>S. marinus </it>one of the elements contains two ORFs while the other four contain only one ORF. In the <it>S. marinus </it>element with two ORFs, the first (Smar_0846) is truncated relative to other members of the family, and is likely to be a pseudogene, while the second (Smar_0847) is intact. The four elements with one ORF share a high degree of similarity to each other (Smar_0083, Smar_0767, Smar_1150, Smar_1546), suggesting that they have been recently duplicated. In addition, there are 14 copies of a repeated sequence of approximately 260 nucleotides, although some of the repeats are truncated at one or both ends. These repeats are likely to be miniature inverted-repeat transposable elements (MITEs) as they are flanked by inverted repeats and have similarity to a region of DNA upstream of the group of four transposase ORFs (Figure <figr fid="F1">1</figr>). MITEs have previously been identified in some archaeal genomes <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>. Two ORFs are disrupted by MITEs, a protein with ABC transporter ATPase and acetyltransferase domains (Smar_0733) and a PIN domain protein (Smar_0327/0328). The presence of disrupted genes suggests that the MITEs have been active recently, although they do not appear to have had a major impact on the genome content.</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Alignment of putative miniature inverted-repeat transposable elements (MITEs) from <it>S. marinus</it></p>
               </caption>
               <text>
                  <p><b>Alignment of putative miniature inverted-repeat transposable elements (MITEs) from <it>S. marinus</it></b>. Start and end coordinates are given for each putative MITE. Below the MITEs are the upstream regions of four related transposases with start and end coordinates. The underlined sequences are the inverted repeats within the MITEs, and the boxed sequences are regions of similarity between the MITEs and the upstream regions of the transposases.</p>
               </text>
               <graphic file="1471-2164-10-145-1"/>
            </fig>
            <p>Twenty-one probable laterally transferred genes were identified using the program SIGI-HMM <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>. One gene is by itself (Smar_0375), there are three pairs of genes (Smar_0568-0569, Smar_0846-0847, and Smar_1144-1145) and there is one cluster of 17 genes (Smar_1525-1541) in which 14 of the genes are predicted to be laterally transferred. Twelve of the laterally transferred genes are predicted to have come from other Crenarchaeota, six from Euryarchaeota, and the remaining three have unknown donors. Six of the 17 genes are likely to be pseudogenes, suggesting that they were transferred but then are degrading. From these findings we conclude that lateral transfer has not played a large role in shaping <it>S. marinus </it>gene content, and most if not all gene transfers have come from other archaea.</p>
         </sec>
         <sec>
            <st>
               <p>Metabolism/transport</p>
            </st>
            <p>The presence of transporters for peptides and carbohydrates suggests that both types of compounds can serve as carbon and energy sources. <it>S. marinus </it>has four ABC transporters for carbohydrates (Smar_0088-0091, Smar_0108-0111, Smar_0299-0302, Smar_1146-1149) and two for peptides (Smar_0270-0274, Smar_0342-0346). It has a carbohydrate secondary transporter of the glycoside-pentoside-hexuronide (GPH) family (Smar_0710), and it is the first crenarchaeote found to have a peptide transporter of the oligopeptide transporter (OPT) family (Smar_1400). There are no ABC transporters for amino acids, but a probable amino acid transporter of the neurotransmitter:sodium symporter (NSS) family is present (Smar_0285). The presence of secondary transporters (GPH, OPT, and NSS), which have low affinity and high capacity, suggests that there are times when <it>S. marinus </it>is exposed to high levels of nutrients, and it can conserve energy by using secondary transporters instead of ATP-dependent transporters.</p>
            <p><it>S. marinus </it>has a glycolysis pathway similar to <it>Aeropyrum pernix</it>, with ATP-dependent glucokinase (Smar_1514) and phosphofructokinase (Smar_0007). Glycogen synthase (Smar_1393) and phosphorylase (Smar_0246) are present, suggesting that the dark granules observed in <it>S. marinus </it>cells are composed of glycogen. Similar to other crenarchaeotes and thermococci, <it>S. marinus </it>has pyruvate:ferredoxin oxidoreductase (Smar_1447-1450) and ADP-forming acetyl-CoA synthase (Smar_0449, Smar_1241-1242) for ATP synthesis from pyruvate. Three other 2-ketoacid:ferredoxin oxidoreductases are present (Smar_0291-292, Smar_0997-1000, Smar_1443-1444) that are probably involved in amino acid degradation.</p>
            <p><it>S. marinus </it>is unique in Crenarchaeota in having a sodium-translocating decarboxylase. Smar_1504 and Smar_1503 encode the beta and gamma subunits (beta and delta in methylmalonyl-CoA decarboxylase). There are two possibilities for the activity of this decarboxylase (Figure <figr fid="F2">2</figr>). With Smar_1426 and Smar_1427 these genes could form a methylmalonyl-CoA decarboxylase. Smar_1426 and Smar_1504 are closely related to predicted methylmalonyl-CoA decarboxylase subunits of <it>Pyrococcus </it>species. This enzyme would be involved in catabolism of succinyl-CoA resulting from glutamate degradation via a 2-oxoacid:ferredoxin oxidoreductase (Figure <figr fid="F2">2</figr>). However, methylmalonyl-CoA mutase and epimerase were not found in the genome. The other possible function is oxaloacetate decarboxylase with Smar_0341 as the alpha subunit. This would be involved in catabolism of aspartate (Figure <figr fid="F2">2</figr>). However Smar_0341 is also related to pyruvate carboxylase B subunits of euryarchaeotes, and could interact with Smar_0140 to form this enzyme instead of or in addition to a sodium-transporting decarboxylase.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Two possible functions of the sodium ion-translocating decarboxylase of <it>S. marinus </it>in their metabolic contexts</p>
               </caption>
               <text>
                  <p><b>Two possible functions of the sodium ion-translocating decarboxylase of <it>S. marinus </it>in their metabolic contexts</b>.</p>
               </text>
               <graphic file="1471-2164-10-145-2"/>
            </fig>
            <p><it>S. marinus</it>, like the other heterotrophic crenarchaeotes <it>H. butylicus </it>and <it>T. pendens</it>, has lost almost all amino acid biosynthetic enzymes, although it has retained a few pathways for specific physiological reasons. For instance, glutamine is needed for its function as a nitrogen donor. Like the other heterotrophic crenarchaeotes, <it>S. marinus </it>can make pyrimidines but not purines. Enzymes for synthesis of several cofactors are present in <it>S. marinus</it>, in contrast to <it>T. pendens</it>, which lacks many cofactor synthesis pathways. <it>S. marinus </it>can likely synthesize riboflavin, pyridoxine, and coenzyme A, but it probably must acquire heme from the environment.</p>
         </sec>
         <sec>
            <st>
               <p>Electron transport/sulfur reduction</p>
            </st>
            <p><it>S. marinus </it>requires sulfur for growth and reduces it to sulfide <abbrgrp><abbr bid="B4">4</abbr></abbrgrp>, but it lacks homologs of proteins implicated in sulfur reduction in other organisms. It has no genes similar to sulfhydrogenases <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr></abbrgrp> and the recently discovered NADPH:sulfur oxidoreductase <abbrgrp><abbr bid="B15">15</abbr></abbrgrp> from <it>P. furiosus</it>. It also lacks genes with similarity to the molybdoenzymes polysulfide reductase of <it>Wolinella succinogenes </it><abbrgrp><abbr bid="B16">16</abbr></abbrgrp>, sulfur reductase of <it>Acidianus ambivalens </it><abbrgrp><abbr bid="B17">17</abbr></abbrgrp>, sulfur reductase of <it>Aquifex aeolicus </it><abbrgrp><abbr bid="B18">18</abbr></abbrgrp>, and thiosulfate/sulfur reductase of <it>Salmonella enterica </it><abbrgrp><abbr bid="B19">19</abbr></abbrgrp>. <it>S. marinus </it>has a gene (Smar_1055) with 56% similarity to sulfide dehydrogenase SudA subunit from <it>P. furiosus </it><abbrgrp><abbr bid="B20">20</abbr></abbrgrp>, but this gene is shorter than the <it>P. furiosus </it>gene by 120 amino acids and the beta subunit is not present in <it>S. marinus</it>. Thus, this enzyme is unlikely to be present in <it>S. marinus</it>. However <it>S. marinus </it>has three putative operons similar in composition to the <it>mbh </it>and <it>mbx </it>operons of Thermococcales (Table <tblr tid="T3">3</tblr>). These multisubunit complexes are not found in any other sequenced crenarchaeote. The <it>mbh </it>operon from <it>P. furiosus </it>encodes a membrane-bound hydrogenase that oxidizes ferredoxin <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>, while the <it>mbx </it>operon has a yet to be defined role in electron transfer. Its proposed function is the transfer of electrons from ferredoxin to NADPH coupled with proton translocation across the cell membrane <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. A similar complex present only in <it>Pyrococcus abyssi </it>(PAB1395-1401) is adjacent to formate dehydrogenase subunits and has similarity to <it>E. coli </it>hydrogenases 3 and 4. Thus, it is likely to be a formate hydrogen lyase.</p>
            <tbl id="T3">
               <title>
                  <p>Table 3</p>
               </title>
               <caption>
                  <p>Sulfur reduction enzymes and their presence in the three sulfur-reducing heterotrophic crenarchaeotes.</p>
               </caption>
               <tblbdy cols="4">
                  <r>
                     <c ca="left">
                        <p>Enzyme</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>S. marinus</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>T. pendens</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>H. butylicus</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Sulfur/polysulfide reductase (molybdoenzyme)</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>Tpen_1121-1123</p>
                     </c>
                     <c ca="center">
                        <p>Hbut_0371-0373</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Sulfhydrogenase</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Sulfide dehydrogenase</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>NADPH:sulfur oxidoreductase</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>Tpen_0143</p>
                     </c>
                     <c ca="center">
                        <p>Hbut_0802</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p><it>mbh</it>/<it>mbx</it>-related</p>
                     </c>
                     <c ca="center">
                        <p>Smar_0018-0030, Smar_0645-0657, Smar_1057-1071</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                     <c ca="center">
                        <p>-</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <p>The <it>S. marinus mbh</it>/<it>mbx</it>-related complexes contain a set of proteins similar to components of multisubunit cation/proton antiporters and another set with similarity to NADH:ubiquinone oxidoreductase subunits (Table <tblr tid="T4">4</tblr>). The <it>S. marinus </it>antiporter-related subunits show high similarity to each other and to the corresponding subunits of the <it>P. abyssi </it>putative formate hydrogen lyase. <it>S. marinus </it>does not have an identifiable formate dehydrogenase, so these complexes likely have a different function in <it>S. marinus</it>. The <it>S. marinus </it>and <it>P. abyssi </it>proteins form a distinct cluster separate from <it>mbh </it>and <it>mbx </it>complexes and from the related cation/proton antiporters (Figure <figr fid="F3">3</figr>). In contrast, the NADH:ubiquinone oxidoreductase-related subunits in the <it>S. marinus </it>putative operons are not closely related to each other or to the corresponding <it>P. abyssi </it>formate hydrogen lyase proteins. These findings indicate that the antiporter-related subunits form a cassette that has been duplicated in <it>S. marinus </it>and combined with NADH:ubiquinone oxidoreductase-related subunits that are divergent in sequence.</p>
            <tbl id="T4">
               <title>
                  <p>Table 4</p>
               </title>
               <caption>
                  <p>Subunit composition of multisubunit membrane-bound complexes from <it>Pyrococcus </it>species and <it>S. marinus</it>.</p>
               </caption>
               <tblbdy cols="7">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <it>mbh</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>mbx</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>PabFHL</p>
                     </c>
                     <c ca="left">
                        <p>Smar1</p>
                     </c>
                     <c ca="left">
                        <p>Smar2</p>
                     </c>
                     <c ca="left">
                        <p>Smar3</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG1863, MnhE</p>
                     </c>
                     <c ca="left">
                        <p>PF1423</p>
                     </c>
                     <c ca="left">
                        <p>PF1453</p>
                     </c>
                     <c ca="left">
                        <p>PAB1401</p>
                     </c>
                     <c ca="left">
                        <p>0027</p>
                     </c>
                     <c ca="left">
                        <p>0655</p>
                     </c>
                     <c ca="left">
                        <p>1070</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG2212, MnhF</p>
                     </c>
                     <c ca="left">
                        <p>PF1424</p>
                     </c>
                     <c ca="left">
                        <p>PF1452</p>
                     </c>
                     <c ca="left">
                        <p>PAB1398.1</p>
                     </c>
                     <c ca="left">
                        <p>0022</p>
                     </c>
                     <c ca="left">
                        <p>0650</p>
                     </c>
                     <c ca="left">
                        <p>1065</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG1320, MnhG</p>
                     </c>
                     <c ca="left">
                        <p>PF1425</p>
                     </c>
                     <c ca="left">
                        <p>PF1451</p>
                     </c>
                     <c ca="left">
                        <p>PAB1398</p>
                     </c>
                     <c ca="left">
                        <p>0023</p>
                     </c>
                     <c ca="left">
                        <p>0651</p>
                     </c>
                     <c ca="left">
                        <p>1066</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG1563</p>
                     </c>
                     <c ca="left">
                        <p>PF1426</p>
                     </c>
                     <c ca="left">
                        <p>PF1450</p>
                     </c>
                     <c ca="left">
                        <p>PAB1399.1</p>
                     </c>
                     <c ca="left">
                        <p>0024</p>
                     </c>
                     <c ca="left">
                        <p>0652</p>
                     </c>
                     <c ca="left">
                        <p>1067</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG2111, MnhB</p>
                     </c>
                     <c ca="left">
                        <p>PF1427 PF1428</p>
                     </c>
                     <c ca="left">
                        <p>PF1449</p>
                     </c>
                     <c ca="left">
                        <p>PAB1399</p>
                     </c>
                     <c ca="left">
                        <p>0025</p>
                     </c>
                     <c ca="left">
                        <p>0653</p>
                     </c>
                     <c ca="left">
                        <p>1068</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG1006, MnhC</p>
                     </c>
                     <c ca="left">
                        <p>PF1429</p>
                     </c>
                     <c ca="left">
                        <p>PF1448</p>
                     </c>
                     <c ca="left">
                        <p>PAB1400</p>
                     </c>
                     <c ca="left">
                        <p>0026</p>
                     </c>
                     <c ca="left">
                        <p>0654</p>
                     </c>
                     <c ca="left">
                        <p>1069</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Pfam00361, MnhD/nuoLMN</p>
                     </c>
                     <c ca="left">
                        <p>PF1430</p>
                     </c>
                     <c ca="left">
                        <p>PF1447</p>
                        <p>PF1446</p>
                     </c>
                     <c ca="left">
                        <p>PAB1402</p>
                        <p>PAB1392</p>
                        <p>PAB1391</p>
                     </c>
                     <c ca="left">
                        <p>0028</p>
                     </c>
                     <c ca="left">
                        <p>0645</p>
                     </c>
                     <c ca="left">
                        <p>1057</p>
                        <p>1058</p>
                        <p>1071</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>mbhI-related</p>
                     </c>
                     <c ca="left">
                        <p>PF1431</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>0029</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Pfam01058, nuoB</p>
                     </c>
                     <c ca="left">
                        <p>PF1432</p>
                     </c>
                     <c ca="left">
                        <p>PF1444</p>
                     </c>
                     <c ca="left">
                        <p>PAB1396</p>
                     </c>
                     <c ca="left">
                        <p>0018</p>
                     </c>
                     <c ca="left">
                        <p>0646</p>
                     </c>
                     <c ca="left">
                        <p>1063</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Pfam00329, nuoC</p>
                     </c>
                     <c ca="left">
                        <p>PF1433</p>
                     </c>
                     <c ca="left">
                        <p>PF1443</p>
                     </c>
                     <c ca="left">
                        <p>PAB1394</p>
                     </c>
                     <c ca="left">
                        <p>0019</p>
                     </c>
                     <c ca="left">
                        <p>0647</p>
                     </c>
                     <c ca="left">
                        <p>1061</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Pfam00346, nuoD</p>
                     </c>
                     <c ca="left">
                        <p>PF1434</p>
                     </c>
                     <c ca="left">
                        <p>PF1442</p>
                     </c>
                     <c ca="left">
                        <p>PAB1394</p>
                     </c>
                     <c ca="left">
                        <p>0020</p>
                     </c>
                     <c ca="left">
                        <p>0648</p>
                     </c>
                     <c ca="left">
                        <p>1061</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Pfam00146, nuoH</p>
                     </c>
                     <c ca="left">
                        <p>PF1435</p>
                     </c>
                     <c ca="left">
                        <p>PF1445</p>
                     </c>
                     <c ca="left">
                        <p>PAB1393</p>
                     </c>
                     <c ca="left">
                        <p>0030</p>
                     </c>
                     <c ca="left">
                        <p>0657</p>
                     </c>
                     <c ca="left">
                        <p>1060</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>COG1143, FHL6/nuoI</p>
                     </c>
                     <c ca="left">
                        <p>PF1436</p>
                     </c>
                     <c ca="left">
                        <p>PF1441</p>
                     </c>
                     <c ca="left">
                        <p>PAB1395</p>
                     </c>
                     <c ca="left">
                        <p>0021 (pseudo)</p>
                     </c>
                     <c ca="left">
                        <p>0649</p>
                     </c>
                     <c ca="left">
                        <p>1062</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Phylogenetic tree of proteins related to antiporter subunit <it>mnhE</it>/<it>mrpE</it>/<it>phaE</it></p>
               </caption>
               <text>
                  <p><b>Phylogenetic tree of proteins related to antiporter subunit <it>mnhE</it>/<it>mrpE</it>/<it>phaE</it></b>.</p>
               </text>
               <graphic file="1471-2164-10-145-3"/>
            </fig>
            <p><it>S. marinus </it>produces hydrogen when sulfur is limiting <abbrgrp><abbr bid="B4">4</abbr></abbrgrp>. Two of the multisubunit complexes are potentially involved in hydrogen production. One set of <it>S. marinus </it>proteins (Smar_1060-Smar_1063) clusters strongly with <it>E. coli </it>hydrogenases 3 and 4 in phylogenetic trees, and may form a membrane-bound hydrogenase. Smar_0018 and Smar_0020 have similarity (61% and 39%, respectively) to subunits of <it>Methanosarcina mazei </it>ech hydrogenase subunits, and hydrogenase accessory proteins are found in their vicinity (Smar_0012-0013, Smar_0015). It is likely that at least one of these clusters is involved in hydrogen production.</p>
            <p>The other complexes may be involved in sulfur reduction either directly or indirectly. One of the clusters (Smar_1057-1071) is close on the chromosome to a pyridine nucleotide-disulfide oxidoreductase (Smar_1055). It is possible that this cluster is involved in sulfur respiration, where Smar_1055 acts as a NAD(P)H-dependent polysulfide reductase and the other ORFs are involved in the generation of NAD(P)H through a membrane-based electron transport system that oxidizes reduced ferredoxin and translocates protons across the membrane. The system would allow energy generation from an overall sulfur-dependent oxidation of peptides and amino acids and it would be similar to the <it>mbx</it>-NAD(P)H elemental sulfur oxidoreductase (NSR) system that has been described for <it>P. furiosus </it><abbrgrp><abbr bid="B15">15</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Comparison of the three sulfur-reducing crenarchaeotes</p>
            </st>
            <p>Spectral clustering was used to create protein clusters from the three anaerobic sulfur-reducing heterotrophs, and the clusters shared by all three or by pairs of the three were derived (Figure <figr fid="F4">4</figr>) and [see Additional file <supplr sid="S1">1</supplr>]. The three organisms share 571 core clusters, somewhat more than the conserved crenarchaeal core of 336 determined by Makarova et al. <abbrgrp><abbr bid="B22">22</abbr></abbrgrp>. Among the clusters conserved among the three but not found in all Crenarchaeota are the subunits of ABC transporters for sugars, peptides, and amino acids, which are required for their heterotrophic lifestyle. Also falling into this group are the ferrous iron transporter proteins FeoA and FeoB and the anaerobic form of ribonucleotide reductase, proteins which reflect their anaerobicity. <it>S. marinus </it>and <it>H. butylicus </it>have almost twice as many shared clusters (225) as either one has with <it>T. pendens </it>(119 or 126). This is due to their closer phylogenetic relationship. <it>S. marinus </it>and <it>H. butylicus </it>both belong to the order Desulfurococcales while <it>T. pendens </it>belongs to the order Thermoproteales.</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Venn diagram showing genes shared between <it>S. marinus</it>, <it>H. butylicus</it>, and <it>T. pendens</it></p>
               </caption>
               <text>
                  <p><b>Venn diagram showing genes shared between <it>S. marinus</it>, <it>H. butylicus</it>, and <it>T. pendens</it></b>.</p>
               </text>
               <graphic file="1471-2164-10-145-4"/>
            </fig>
            <suppl id="S1">
               <title>
                  <p>Additional file 1</p>
               </title>
               <caption>
                  <p><b>Clusters shared between two or three of the genomes <it>S. marinus</it>, <it>H. butylicus</it>, and <it>T. pendens</it></b>.</p>
               </caption>
               <text>
                  <p><b>Clusters shared between two or three of the genomes <it>S. marinus</it>, <it>H. butylicus</it>, and <it>T. pendens</it></b>. List of cluster IDs with the protein family they belong to, followed by a list of locus tags for proteins belonging to the cluster.</p>
               </text>
               <file name="1471-2164-10-145-S1.txt">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>The major difference in habitat between these three organisms is that <it>S. marinus </it>and <it>H. butylicus </it>were isolated from marine environments <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B3">3</abbr></abbrgrp> while <it>T. pendens </it>was isolated from a terrestrial solfatara <abbrgrp><abbr bid="B2">2</abbr></abbrgrp>. Marine environments have relatively high concentrations of sodium and potassium compared to terrestrial springs, and this influences the complement of transporters encoded by the three genomes. For example, <it>S. marinus </it>and <it>H. butylicus </it>use the Trk type of potassium transporter (COG0168), which is a proton or sodium symporter, while <it>T. pendens </it>uses the more energy-intensive ATP-dependent kdp-type potassium transporter (COG2060, COG2216, COG2156). Also, <it>S. marinus </it>and <it>H. butylicus </it>have a greater number and variety of sodium symporters than <it>T. pendens</it>. They both have sodium-dependent multidrug efflux pumps of the MATE family (COG0534) and amino acid transporters of the neurotransmitter:sodium symporter family (pfam00209), while only <it>S. marinus </it>has a transporter of the sodium:solute symporter family (pfam00474).</p>
            <p>Both <it>T. pendens </it>and <it>H. butylicus </it>have formate dehydrogenases while <it>S. marinus </it>lacks this enzyme. Formate can be used as an electron donor with sulfur as electron acceptor to generate energy. <it>S. marinus </it>also lacks the FdhE protein, which is involved in formate dehydrogenase formation, while the other two have it.</p>
            <p>There are also differences in the ability to utilize carbohydrates among the three organisms. As discussed above, <it>T. pendens </it>has a greater number of carbohydrate transporters than the other two. According to the CAZy database <url>http://www.cazy.org</url><abbrgrp><abbr bid="B23">23</abbr></abbrgrp>, <it>H. butylicus </it>has no glycosyl hydrolases, while <it>S. marinus </it>has ten and <it>T. pendens </it>has fifteen. Also <it>H. butylicus </it>apparently does not store glycogen as it lacks glycogen synthase and phosphorylase, but the other two have these. <it>H. butylicus </it>also lacks enzymes for utilization of galactose and N-acetylglucosamine. Surprisingly while <it>S. marinus </it>and <it>T. pendens </it>have probable glucokinases related to the characterized <it>Aeropyrum pernix </it>enzyme <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>, <it>H. butylicus </it>has a protein related to the broad-specificity hexokinase from <it>Sulfolobus tokodaii </it><abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. This suggests that, while it may not be able to break down polysaccharides, it may be able to utilize simple sugars.</p>
            <p>There are similarities and differences among the three genomes in the genes involved in biosynthesis. Many of the genes shared by <it>S. marinus </it>and <it>H. butylicus </it>but missing from <it>T. pendens </it>are involved in cofactor metabolism. <it>T. pendens </it>appears to be unable to make riboflavin, coenzyme A, pyridoxine, and possibly other cofactors, and it has transporters for biotin and riboflavin that are not found in the other two. Among the three organisms only <it>H. butylicus </it>has a heme biosynthesis pathway. On the other hand, all three organisms are unable to make most amino acids and purines, although they do have the pyrimidine biosynthetic pathway. <it>S. marinus </it>and <it>H. butylicus </it>have ABC transporters of the basic membrane protein family (pfam02608) that probably transport nucleosides <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>, but <it>T. pendens </it>lacks this type of transporter. In fact <it>T. pendens </it>does not have any identifiable nucleoside or nucleobase transporters, so it likely has undiscovered families to transport these compounds.</p>
            <p>There are other differences between these three organisms that do not directly reflect the habitats they live in. <it>H. butylicus </it>is surprisingly lacking some enzymes of central metabolism. It has no identifiable fructose-bisphosphate aldolase and no phosphoenolpyruvate synthase or pyruvate phosphate dikinase. Since fructose-bisphosphate aldolase is essential for hexose and pentose synthesis, it likely has a new version of this enzyme. <it>H. butylicus </it>also does not have an asparaginyl-tRNA synthetase; however, it is the only one of the three to have an Asp-tRNA(Asn)/Glu-tRNA(Gln) amidotransferase, but the A subunit of this enzyme (Hbut_0594) has a frameshift. Since this appears to be an essential enzyme for <it>H. butylicus</it>, the gene may still be functional.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Discussion</p>
         </st>
         <p>The crenarchaeotes <it>H. butylicus</it>, <it>S. marinus</it>, and <it>T. pendens </it>are similar phenotypically in that they all degrade peptides and/or carbohydrates using 2-oxoacid:ferredoxin oxidoreductases, they are anaerobes, and they are dependent on sulfur reduction to dispose of electrons. They all have genomes in the size range of 1.6&#8211;1.8 Mbp. Having these three genome sequences allows comparative studies to determine whether their phenotypic similarity is reflected in their genome sequences.</p>
         <p>While the central metabolic pathways for generation of ATP from peptides appear to be similar between the three, there are also differences. For instance there are different sets of transporters used by the marine organisms versus the terrestrial one. However the biggest differences between the three relate to the availability of nutrients. On one extreme is <it>H. butylicus</it>, which has no glycosidases and is capable of synthesizing most if not all cofactors it needs. This organism appears to be more specialized than the other two in that it is restricted to the use of peptides and amino acids as energy sources, although formate can also be utilized. On the other extreme is <it>T. pendens </it>which has many glycosidases and relies on its environment for most cofactors, thus it is used to being in a nutrient-rich environment. Probably a terrestrial solfatara environment allows nutrients to be concentrated as compared to marine environments in which nutrients may be quickly dispersed. <it>S. marinus </it>falls in the middle ground as it has several glycosidases like <it>T. pendens </it>but it encodes most cofactor biosynthesis pathways like <it>H. butylicus</it>. Its use of secondary transporters and ABC transporters suggests that at least at some times it is exposed to high levels of nutrients. It is adapted to an environment that contains carbohydrates as well as proteinaceous substrates, but in which cofactors are not present at high levels.</p>
         <p>Characterized membrane-bound sulfur and polysulfide reductases have three subunits <abbrgrp><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr><abbr bid="B19">19</abbr></abbrgrp>. The A and B subunits are related in sequence, but the C subunits belong to different protein families. <it>T. pendens </it>and <it>H. butylicus </it>have putative three-subunit sulfur reductases in which all subunits are adjacent on the chromosome. These complexes have the standard A and B subunits, but they differ in their C subunits. The <it>T. pendens </it>C subunit belongs to the same family as the <it>W. succinogenes psrC </it>subunit, while the <it>H. butylicus </it>C subunit is related to <it>sreC </it>of <it>Acidianus ambivalens</it>. <it>S. marinus </it>lacks this type of sulfur or polysulfide reductase, and it is the only crenarchaeote other than <it>C. symbiosum </it>to lack this family of molybdopterin oxidoreductases (COG0243).</p>
         <p><it>T. pendens </it>and <it>H. butylicus </it>also have putative NADPH:sulfur oxidoreductases similar to the <it>P. furiosus </it>enzyme <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>, which is also absent in <it>S. marinus</it>. However, <it>S. marinus </it>has three <it>mbh</it>/<it>mbx</it>-related multisubunit complexes, which are not found in the other two genomes. The overall picture of sulfur reduction shows that <it>T. pendens </it>and <it>H. butylicus </it>may use similar pathways, while <it>S. marinus </it>uses different ones. This is in contrast to the phylogenetic positions of these organisms: <it>S. marinus </it>and <it>H. butylicus </it>belong to the order Desulfurococcales, while <it>T. pendens </it>belongs to the order Thermoproteales. The molybdoenzymes are widespread within Crenarchaeota, missing only in <it>S. marinus</it>, and may represent the ancestral path for sulfur reduction in Crenarchaeota. This analysis, however, rests on comparison to sulfur reduction enzymes characterized in other organisms, and new sulfur reduction pathways may be identified in the future.</p>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>The three heterotrophic sulfur-reducing crenarchaeotes have adapted to their habitats, terrestrial vs. marine, via their transporter content, and they have also adapted to environments with differing levels of nutrients, with <it>T. pendens </it>being adapted to a nutrient-rich environment and <it>H. butylicus </it>adapted to an environment in which only peptides are present. <it>S. marinus </it>appears to have different electron transport pathways compared to the phenotypically similar organisms <it>T. pendens </it>and <it>H. butylicus</it>, showing that this phenotype is not encoded by the same genotype in these organisms.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <p><it>S. marinus </it>strain F1 is available from the Deutsche Sammlung von Mikroorganismen und Zellkulturen (DSMZ) as DSM 3639<sup>T </sup>and from the American Type Culture Collection (ATCC) as ATCC 43588. <it>T. pendens </it>Hrk5 is available from DSMZ as DSM 2475, and <it>H. butylicus </it>is available from DSMZ as DSM 5456. <it>S. marinus </it>F1 cells were grown in a 300 liter fermenter at 85&#176;C in SME medium with 0.1% yeast extract, 0.1% peptone, and 0.7% elemental sulfur under a 200 kPa N<sub>2 </sub>atmosphere. Cells grew to a density of 3 &#215; 10<sup>8 </sup>cells/ml in 3 days. Cell pellets were stored at -85&#176;C. DNA was extracted based on the method of Zhou et al. <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>. One gram of cells was dissolved in 4.5 ml extraction buffer (100 mM Tris, pH 8.0, 100 mM EDTA, 100 mM sodium phosphate, and 1.5 M NaCl). After 200 micrograms of proteinase K were added, cells were incubated for 30 minutes at 37&#176;C. A solution of 0.5 ml 20% SDS was added, and then the mixture was incubated at 65&#176;C for 2 hours. Proteins were removed by extraction with 5 ml phenol. The sample was centrifuged for 30 minutes at 19000 rpm in a Sorvall SS34 rotor at 10&#176;C, and the upper phase was discarded. The sample was then extracted twice with chloroform and isoamyl alcohol (24:1) to remove phenol. DNA was precipitated with 3 ml isopropanol at room temperature overnight. The sample was then centrifuged for 30 minutes. The pellet was washed with 5 ml 70% ethanol and recentrifuged. The pellet was dried and then dissolved in 1 ml LiChrosolv (Merck, Darmstadt, Germany). RNA was removed by addition of 20 &#956;g DNAse-free RNAse and incubation for 4 hours at 37&#176;C.</p>
         <p>The genome of <it>S. marinus </it>was sequenced at the Joint Genome Institute (JGI) using a combination of 3 kb, 8&#8211;10 kb and 40 kb (fosmid) DNA libraries. For all three libraries, shearing is followed by blunt end repair; then the DNA is isolated on an agarose gel and the appropriate section of the gel is cut out. For fosmid libraries, DNA is separated on a pulsed-field gel. DNA is extracted from the gel and then cloned into the pUC18 vector for 3 kb libraries, the pMCL200 vector for 8&#8211;10 kb libraries, or the pCC1FOS vector for 40 kb fosmid libraries. Sequencing is carried out from both ends of the inserts using BigDye Terminators and ABI3730XL DNA sequencers. More detailed information about library construction and sequencing, including protocols and reagents, is available at <url>http://www.jgi.doe.gov/sequencing/protocols/prots_production.html</url>. Draft assemblies were based on 23766 total reads. All three libraries provided 13.3&#215; coverage of the genome. The Phred/Phrap/Consed software package <url>http://www.phrap.com</url> was used for sequence assembly and quality assessment <abbrgrp><abbr bid="B28">28</abbr><abbr bid="B29">29</abbr><abbr bid="B30">30</abbr></abbrgrp>. All mis-assemblies were corrected and all gaps between contigs were closed by custom primer walk using subclones or PCR products as templates. A total of 657 additional reactions were necessary to close gaps and to raise the quality of the finished sequence. The Phred quality score for this genome is Q50, which corresponds to one miscalled base per 100,000 bases. The genome sequence of <it>S. marinus </it>can be accessed in GenBank [GenBank: <ext-link ext-link-type="gen" ext-link-id="CP000575">CP000575</ext-link>]. The Genomes On Line Database (GOLD) accession number is <url>http://genomesonline.org/GOLD_CARDS/Gc00511.html</url>. Genes were identified using a combination of Critica <abbrgrp><abbr bid="B31">31</abbr></abbrgrp> and Glimmer <abbrgrp><abbr bid="B32">32</abbr></abbrgrp> followed by a round of manual curation.</p>
         <p>Analysis of the <it>S. marinus </it>genome was carried out with the Integrated Microbial Genomes (IMG) system <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>. Proteins unique to <it>S. marinus </it>or missing from <it>S. marinus </it>but present in other crenarchaeotes were identified with the phylogenetic profiler in IMG. Transposable elements were identified by BLAST against the ISFinder database <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>. CRISPR repeats were identified with the CRISPR Recognition Tool <abbrgrp><abbr bid="B35">35</abbr></abbrgrp>.</p>
         <p>Laterally transferred genes were identified with SIGI-HMM <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>. DNA and protein alignments were generated with CLUSTAL W <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>. The phylogenetic tree was generated with MrBayes 3.1.2 <abbrgrp><abbr bid="B37">37</abbr></abbrgrp> with 1,000,000 generations sampled every 100 generations. The first 250,000 generations were discarded as burn-in. The tree was viewed and manipulated with njplot <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>.</p>
         <p>To generate clusters for comparative genomics, we retrieved all amino acid sequences for <it>S. marinus</it>, <it>H. butylicus</it>, and <it>T. pendens </it>along with their blastp <abbrgrp><abbr bid="B39">39</abbr></abbrgrp> (e-value &lt; 10-6) similarity scores, from the Integrated Microbial Genomes database <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>. Thereafter, we divided the resulting network of protein similarities into distinct similarity matrices. Each matrix (cluster of proteins) was then successively partitioned into two child clusters using a spectral clustering procedure <abbrgrp><abbr bid="B40">40</abbr><abbr bid="B41">41</abbr></abbrgrp>. This procedure is analogous to a random walk of a particle moving over the proteins of the network. At each transition, the particle moves to an adjacent protein with probabilities corresponding to the similarity between proteins. The amount of time the particle spends in a given sub-network will determine whether this is indeed a cluster of its own or not. The magnitude of the second eigenvalue of the similarity matrix for a network will determine how fast the particle approaches its stationary distribution <abbrgrp><abbr bid="B42">42</abbr></abbrgrp>. Here, we chose to partition the network if the second eigenvalue was 0.8 or more. This approach resulted in 1041 clusters of a total of 2653 proteins with homologs within two or more of the organisms.</p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>HH isolated the DNA, SL and AC carried out the sequencing and assembly, HS and AL finished the genome, ML carried out gene calling and annotation. IA, LD, JR, IP, LEU, SH, JGE, KM, and BM contributed to the analysis. IA compiled the manuscript. HH, IBZ, WBW, BM, CW, JB, and NK supervised aspects of the project and critically reviewed the manuscript. All authors approved the final manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>This work was performed under the auspices of the US Department of Energy's Office of Science, Biological and Environmental Research Program, and by the University of California, Lawrence Berkeley National Laboratory under contract No. DE-AC02-05CH11231, Lawrence Livermore National Laboratory under Contract No. DE-AC52-07NA27344, and Los Alamos National Laboratory under contract No. DE-AC02-06NA25396. L. D., J. R., and B. M. were supported by a NASA Astrobiology: Exobiology and Evolutionary Biology grant NNG05GP24G to B. M. I. P. and W. B. W. were supported by DOE contract number DE-FG02-97ER20269. L. E. U. and I. B. Z. were supported by grant number GM72285 from the National Institutes of Health. J. G. E. was supported by the DOE Genomes to Life program. M. L. was supported by the Department of Energy under contract DE-AC05-000R22725.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p><it>Hyperthermus butylicus</it>, a hyperthermophilic sulfur-reducing archaebacterium that ferments peptides</p>
            </title>
            <aug>
               <au>
                  <snm>Zillig</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Holz</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Janekovic</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Klenk</snm>
                  <fnm>H-P</fnm>
               </au>
               <au>
                  <snm>Imsel</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Trent</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wunderl</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Forjaz</snm>
                  <fnm>VH</fnm>
               </au>
               <au>
                  <snm>Coutinho</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Ferreira</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1990</pubdate>
            <volume>172</volume>
            <fpage>3959</fpage>
            <lpage>3965</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">213380</pubid>
                  <pubid idtype="pmpid" link="fulltext">2113915</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>The archaebacterium <it>Thermofilum pendens </it>represents, a novel genus of the thermophilic, anaerobic sulfur respiring <it>Thermoproteales</it></p>
            </title>
            <aug>
               <au>
                  <snm>Zillig</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Gierl</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Schreiber</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Wunderl</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Janekovic</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Stetter</snm>
                  <fnm>KO</fnm>
               </au>
               <au>
                  <snm>Klenk</snm>
                  <fnm>H-P</fnm>
               </au>
            </aug>
            <source>Syst Appl Microbiol</source>
            <pubdate>1983</pubdate>
            <volume>4</volume>
            <fpage>79</fpage>
            <lpage>87</lpage>
         </bibl>
         <bibl id="B3">
            <title>
               <p><it>Staphylothermus marinus </it>sp. nov. represents a novel genus of extremely thermophilic submarine heterotrophic archaebacteria growing up to 98&#176;C</p>
            </title>
            <aug>
               <au>
                  <snm>Fiala</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Stetter</snm>
                  <fnm>KO</fnm>
               </au>
               <au>
                  <snm>Jannasch</snm>
                  <fnm>HW</fnm>
               </au>
               <au>
                  <snm>Langworthy</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Madon</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Syst Appl Microbiol</source>
            <pubdate>1986</pubdate>
            <volume>8</volume>
            <fpage>106</fpage>
            <lpage>113</lpage>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Minimal sulfur requirement for growth and sulfur-dependent metabolism of the hyperthermophilic archaeon <it>Staphylothermus marinus</it></p>
            </title>
            <aug>
               <au>
                  <snm>Hao</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Ma</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>Archaea</source>
            <pubdate>2003</pubdate>
            <volume>1</volume>
            <fpage>191</fpage>
            <lpage>197</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15803665</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Tetrabrachion: a filamentous archaebacterial surface protein assembly of unusual structure and extreme stability</p>
            </title>
            <aug>
               <au>
                  <snm>Peters</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Nitsch</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>K&#252;hlmorgen</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Golbik</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Lupas</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Kellermann</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Engelhardt</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Pfander</snm>
                  <fnm>J-P</fnm>
               </au>
               <au>
                  <snm>M&#252;ller</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Goldie</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Engel</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Stetter</snm>
                  <fnm>K-O</fnm>
               </au>
               <au>
                  <snm>Baumeister</snm>
                  <fnm>W</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>1995</pubdate>
            <volume>245</volume>
            <fpage>385</fpage>
            <lpage>401</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1006/jmbi.1994.0032</pubid>
                  <pubid idtype="pmpid" link="fulltext">7837271</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Novel molecular architecture of the multimeric archaeal PEP-synthase homologue (MAPS) from <it>Staphylothermus marinus</it></p>
            </title>
            <aug>
               <au>
                  <snm>Cicicopol</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Peter</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lupas</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Cejka</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>M&#252;ller</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Golbik</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Pfeifer</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Lilie</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Engel</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Baumeister</snm>
                  <fnm>W</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>1999</pubdate>
            <volume>290</volume>
            <fpage>347</fpage>
            <lpage>361</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1006/jmbi.1999.2878</pubid>
                  <pubid idtype="pmpid" link="fulltext">10388577</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>The genome of <it>Hyperthermus butylicus</it>: a sulfur-reducing, peptide fermenting, neutrophilic Crenarchaeote growing up to 108 degrees C</p>
            </title>
            <aug>
               <au>
                  <snm>Br&#252;gger</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Stark</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Zibat</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Redder</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Ruepp</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Awayez</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>She</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Garrett</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Klenk</snm>
                  <fnm>H-P</fnm>
               </au>
            </aug>
            <source>Archaea</source>
            <pubdate>2007</pubdate>
            <volume>2</volume>
            <issue>2</issue>
            <fpage>127</fpage>
            <lpage>135</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17350933</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Genome sequence of <it>Thermofilum pendens </it>reveals an exceptional loss of biosynthetic pathways without genome reduction</p>
            </title>
            <aug>
               <au>
                  <snm>Anderson</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Rodriguez</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Susanti</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Porat</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Reich</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Ulrich</snm>
                  <fnm>LE</fnm>
               </au>
               <au>
                  <snm>Elkins</snm>
                  <fnm>JG</fnm>
               </au>
               <au>
                  <snm>Mavromatis</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Lykidis</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Thompson</snm>
                  <fnm>LS</fnm>
               </au>
               <au>
                  <snm>Nolan</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Land</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Copeland</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lapidus</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lucas</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Detter</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Zhulin</snm>
                  <fnm>IB</fnm>
               </au>
               <au>
                  <snm>Olsen</snm>
                  <fnm>GJ</fnm>
               </au>
               <au>
                  <snm>Whitman</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Mukhopadhyay</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Bristow</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kyrpides</snm>
                  <fnm>N</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2008</pubdate>
            <volume>190</volume>
            <fpage>2957</fpage>
            <lpage>2965</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2293246</pubid>
                  <pubid idtype="pmpid" link="fulltext">18263724</pubid>
                  <pubid idtype="doi">10.1128/JB.01949-07</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>The COG database: an updated version includes eukaryotes</p>
            </title>
            <aug>
               <au>
                  <snm>Tatusov</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Fedorova</snm>
                  <fnm>ND</fnm>
               </au>
               <au>
                  <snm>Jackson</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Jacobs</snm>
                  <fnm>AR</fnm>
               </au>
               <au>
                  <snm>Kiryutin</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Koonin</snm>
                  <fnm>EV</fnm>
               </au>
               <au>
                  <snm>Krylov</snm>
                  <fnm>DM</fnm>
               </au>
               <au>
                  <snm>Mazumder</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Mekhedov</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Nikolskaya</snm>
                  <fnm>AN</fnm>
               </au>
               <au>
                  <snm>Rao</snm>
                  <fnm>BS</fnm>
               </au>
               <au>
                  <snm>Smirnov</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Sverdlov</snm>
                  <fnm>AV</fnm>
               </au>
               <au>
                  <snm>Vasudevan</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Wolf</snm>
                  <fnm>YI</fnm>
               </au>
               <au>
                  <snm>Yin</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Natale</snm>
                  <fnm>DA</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2003</pubdate>
            <volume>4</volume>
            <fpage>41</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">222959</pubid>
                  <pubid idtype="pmpid" link="fulltext">12969510</pubid>
                  <pubid idtype="doi">10.1186/1471-2105-4-41</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p><it>Methanococcus jannaschii </it>uses a pyruvoyl-dependent arginine decarboxylase in polyamine biosynthesis</p>
            </title>
            <aug>
               <au>
                  <snm>Graham</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>RH</fnm>
               </au>
            </aug>
            <source>J Biol Chem</source>
            <pubdate>2002</pubdate>
            <volume>277</volume>
            <fpage>23500</fpage>
            <lpage>23507</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1074/jbc.M203467200</pubid>
                  <pubid idtype="pmpid" link="fulltext">11980912</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>Insertion sequence diversity in archaea</p>
            </title>
            <aug>
               <au>
                  <snm>Fil&#233;e</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Siguier</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Chandler</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Microbiol Mol Biol Rev</source>
            <pubdate>2007</pubdate>
            <volume>71</volume>
            <fpage>121</fpage>
            <lpage>157</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1847376</pubid>
                  <pubid idtype="pmpid" link="fulltext">17347521</pubid>
                  <pubid idtype="doi">10.1128/MMBR.00031-06</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Score-based prediction of genomic islands in prokaryotic genomes using hidden Markov models</p>
            </title>
            <aug>
               <au>
                  <snm>Waack</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Keller</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Asper</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Brodag</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Damm</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Fricke</snm>
                  <fnm>WF</fnm>
               </au>
               <au>
                  <snm>Surovcik</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Meinicke</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Merkl</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <fpage>142</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1489950</pubid>
                  <pubid idtype="pmpid" link="fulltext">16542435</pubid>
                  <pubid idtype="doi">10.1186/1471-2105-7-142</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Hydrogenase of the hyperthermophile <it>Pyrococcus furiosus </it>is an elemental sulfur reductase or sulfhydrogenase: evidence for a sulfur-reducing hydrogenase ancestor</p>
            </title>
            <aug>
               <au>
                  <snm>Ma</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Schicho</snm>
                  <fnm>RN</fnm>
               </au>
               <au>
                  <snm>Kelly</snm>
                  <fnm>RM</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>MWW</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1993</pubdate>
            <volume>90</volume>
            <fpage>5341</fpage>
            <lpage>5344</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">46712</pubid>
                  <pubid idtype="pmpid">8389482</pubid>
                  <pubid idtype="doi">10.1073/pnas.90.11.5341</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Characterization of hydrogenase II from the hyperthermophilic archaeon <it>Pyrococcus furiosus </it>and assessment of its role in sulfur reduction</p>
            </title>
            <aug>
               <au>
                  <snm>Ma</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Weiss</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>MWW</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2000</pubdate>
            <volume>182</volume>
            <fpage>1864</fpage>
            <lpage>1871</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">101868</pubid>
                  <pubid idtype="pmpid" link="fulltext">10714990</pubid>
                  <pubid idtype="doi">10.1128/JB.182.7.1864-1871.2000</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Insights into the metabolism of elemental sulfur by the hyperthermophilic archaeon <it>Pyrococcus furiosus</it>: characterization of a coenzyme A-dependent NAD(P)H sulfur oxidoreductase</p>
            </title>
            <aug>
               <au>
                  <snm>Schut</snm>
                  <fnm>GJ</fnm>
               </au>
               <au>
                  <snm>Bridger</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>MWW</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2007</pubdate>
            <volume>189</volume>
            <fpage>4431</fpage>
            <lpage>4441</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1913366</pubid>
                  <pubid idtype="pmpid" link="fulltext">17449625</pubid>
                  <pubid idtype="doi">10.1128/JB.00031-07</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Cloning and nucleotide sequence of the <it>psrA </it>gene of <it>Wolinella succinogenes </it>polysulphide reductase</p>
            </title>
            <aug>
               <au>
                  <snm>Krafft</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Bokranz</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Klimmek</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Schr&#246;der</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Fahrenholz</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Kojro</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Kr&#246;ger</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Eur J Biochem</source>
            <pubdate>1992</pubdate>
            <volume>206</volume>
            <fpage>503</fpage>
            <lpage>510</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1432-1033.1992.tb16953.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">1597189</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Membrane-bound hydrogenase and sulfur reductase of the hyperthermophilic and acidophilic archaeon <it>Acidianus ambivalens</it></p>
            </title>
            <aug>
               <au>
                  <snm>Laska</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lottspeich</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Kletzin</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Microbiology</source>
            <pubdate>2003</pubdate>
            <volume>149</volume>
            <fpage>2357</fpage>
            <lpage>2371</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1099/mic.0.26455-0</pubid>
                  <pubid idtype="pmpid" link="fulltext">12949162</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>A membrane-bound multienzyme, hydrogen-oxidizing, and sulfur-reducing complex from the hyperthermophilic bacterium <it>Aquifex aeolicus</it></p>
            </title>
            <aug>
               <au>
                  <snm>Guiral</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Tron</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Aubert</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Gloter</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Iobbi-Nivol</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Giudici-Orticoni</snm>
                  <fnm>M-T</fnm>
               </au>
            </aug>
            <source>J Biol Chem</source>
            <pubdate>2005</pubdate>
            <volume>280</volume>
            <fpage>42004</fpage>
            <lpage>42015</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1074/jbc.M508034200</pubid>
                  <pubid idtype="pmpid" link="fulltext">16236714</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Specificity of respiratory pathways involved in the reduction of sulfur compounds by <it>Salmonella enterica</it></p>
            </title>
            <aug>
               <au>
                  <snm>Hinsley</snm>
                  <fnm>AP</fnm>
               </au>
               <au>
                  <snm>Berks</snm>
                  <fnm>BC</fnm>
               </au>
            </aug>
            <source>Microbiology</source>
            <pubdate>2002</pubdate>
            <volume>148</volume>
            <fpage>3631</fpage>
            <lpage>3638</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12427953</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Sulfide dehydrogenase from the hyperthermophilic archaeon <it>Pyrococcus furiosus</it>: a new multifunctional enzyme involved in the reduction of elemental sulfur</p>
            </title>
            <aug>
               <au>
                  <snm>Ma</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>MWW</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1994</pubdate>
            <volume>176</volume>
            <fpage>6509</fpage>
            <lpage>6517</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">197004</pubid>
                  <pubid idtype="pmpid" link="fulltext">7961401</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>Purification and characterization of a membrane-bound hydrogenase from the hyperthermophilic archaeon <it>Pyrococcus furiosus</it></p>
            </title>
            <aug>
               <au>
                  <snm>Sapra</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Verhagen</snm>
                  <fnm>MF</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>MWW</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2000</pubdate>
            <volume>182</volume>
            <fpage>3423</fpage>
            <lpage>3428</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">101913</pubid>
                  <pubid idtype="pmpid" link="fulltext">10852873</pubid>
                  <pubid idtype="doi">10.1128/JB.182.12.3423-3428.2000</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Clusters of orthologous genes for 41 archaeal genomes and implications for the evolutionary genomics of archaea</p>
            </title>
            <aug>
               <au>
                  <snm>Makarova</snm>
                  <fnm>KS</fnm>
               </au>
               <au>
                  <snm>Sorokin</snm>
                  <fnm>AV</fnm>
               </au>
               <au>
                  <snm>Novichkov</snm>
                  <fnm>PS</fnm>
               </au>
               <au>
                  <snm>Wolf</snm>
                  <fnm>YI</fnm>
               </au>
               <au>
                  <snm>Koonin</snm>
                  <fnm>EV</fnm>
               </au>
            </aug>
            <source>Biol Direct</source>
            <pubdate>2007</pubdate>
            <volume>2</volume>
            <fpage>33</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2222616</pubid>
                  <pubid idtype="pmpid" link="fulltext">18042280</pubid>
                  <pubid idtype="doi">10.1186/1745-6150-2-33</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>The Carbohydrate-Active EnZymes database (CAZy): an expert resource for Glycogenomics</p>
            </title>
            <aug>
               <au>
                  <snm>Cantarel</snm>
                  <fnm>BL</fnm>
               </au>
               <au>
                  <snm>Coutinho</snm>
                  <fnm>PM</fnm>
               </au>
               <au>
                  <snm>Rancurel</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Bernard</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Lombard</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Henrissat</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2009</pubdate>
            <volume>37</volume>
            <fpage>D233</fpage>
            <lpage>D238</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/nar/gkn663</pubid>
                  <pubid idtype="pmpid" link="fulltext">18838391</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Cloning, expression, and characterization of the first archaeal ATP-dependent glucokinase from aerobic hyperthermophilic archaeon <it>Aeropyrum pernix</it></p>
            </title>
            <aug>
               <au>
                  <snm>Sakuraba</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Mitani</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Goda</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Kawarabayasi</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Ohshima</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>J Biochem</source>
            <pubdate>2003</pubdate>
            <volume>133</volume>
            <fpage>219</fpage>
            <lpage>224</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/jb/mvg027</pubid>
                  <pubid idtype="pmpid" link="fulltext">12761185</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>Identification and characterization of an ATP-dependent hexokinase with broad substrate specificity from the hyperthermophilic archaeon <it>Sulfolobus tokodaii</it></p>
            </title>
            <aug>
               <au>
                  <snm>Nishimasu</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Fushinobu</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Shoun</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Wakagi</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2006</pubdate>
            <volume>188</volume>
            <fpage>2014</fpage>
            <lpage>2019</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1426560</pubid>
                  <pubid idtype="pmpid" link="fulltext">16484213</pubid>
                  <pubid idtype="doi">10.1128/JB.188.5.2014-2019.2006</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>A member of the second carbohydrate uptake family of ATP-binding cassette transporters is responsible for ribonucleoside uptake in <it>Streptococcus mutans</it></p>
            </title>
            <aug>
               <au>
                  <snm>Webb</snm>
                  <fnm>AJ</fnm>
               </au>
               <au>
                  <snm>Hosie</snm>
                  <fnm>AH</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2006</pubdate>
            <volume>188</volume>
            <fpage>8005</fpage>
            <lpage>8012</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1698198</pubid>
                  <pubid idtype="pmpid" link="fulltext">16997965</pubid>
                  <pubid idtype="doi">10.1128/JB.01101-06</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>DNA recovery from soils of diverse composition</p>
            </title>
            <aug>
               <au>
                  <snm>Zhou</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Bruns</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Tiedje</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Appl Environ Microbiol</source>
            <pubdate>1996</pubdate>
            <volume>62</volume>
            <fpage>316</fpage>
            <lpage>322</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">167800</pubid>
                  <pubid idtype="pmpid" link="fulltext">8593035</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Base-calling of automated sequencer traces using phred. II. Error probabilities</p>
            </title>
            <aug>
               <au>
                  <snm>Ewing</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>186</fpage>
            <lpage>194</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521922</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Base-calling of automated sequencer traces using phred. I. Accuracy assessment</p>
            </title>
            <aug>
               <au>
                  <snm>Ewing</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Hillier</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Wendl</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>175</fpage>
            <lpage>185</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521921</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Consed: a graphical tool for sequence finishing</p>
            </title>
            <aug>
               <au>
                  <snm>Gordon</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Abajian</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>195</fpage>
            <lpage>202</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521923</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>CRITICA: coding region identification tool invoking comparative analysis</p>
            </title>
            <aug>
               <au>
                  <snm>Badger</snm>
                  <fnm>JH</fnm>
               </au>
               <au>
                  <snm>Olsen</snm>
                  <fnm>GJ</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>1999</pubdate>
            <volume>16</volume>
            <fpage>512</fpage>
            <lpage>524</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10331277</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Improved microbial gene identification with GLIMMER</p>
            </title>
            <aug>
               <au>
                  <snm>Delcher</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Harmon</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Kasif</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1999</pubdate>
            <volume>27</volume>
            <fpage>4636</fpage>
            <lpage>4641</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">148753</pubid>
                  <pubid idtype="pmpid" link="fulltext">10556321</pubid>
                  <pubid idtype="doi">10.1093/nar/27.23.4636</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>The integrated microbial genomes (IMG) system in 2007: data content and analysis tool extensions</p>
            </title>
            <aug>
               <au>
                  <snm>Markowitz</snm>
                  <fnm>VM</fnm>
               </au>
               <au>
                  <snm>Szeto</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Palaniappan</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Grechkin</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Chu</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>I-MA</fnm>
               </au>
               <au>
                  <snm>Dubchak</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Anderson</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Lykidis</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mavromatis</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Ivanova</snm>
                  <fnm>NN</fnm>
               </au>
               <au>
                  <snm>Kyrpides</snm>
                  <fnm>NC</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2008</pubdate>
            <volume>36</volume>
            <fpage>D528</fpage>
            <lpage>D533</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2238897</pubid>
                  <pubid idtype="pmpid" link="fulltext">17933782</pubid>
                  <pubid idtype="doi">10.1093/nar/gkm846</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p>ISfinder: the reference centre for bacterial insertion sequences</p>
            </title>
            <aug>
               <au>
                  <snm>Siguier</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Perochon</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lestrade</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Mahillon</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Chandler</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2006</pubdate>
            <volume>34</volume>
            <fpage>D32</fpage>
            <lpage>D36</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1347377</pubid>
                  <pubid idtype="pmpid" link="fulltext">16381877</pubid>
                  <pubid idtype="doi">10.1093/nar/gkj014</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>CRISPR recognition tool (CRT): a tool for automatic detection of clustered regularly interspaced palindromic repeats</p>
            </title>
            <aug>
               <au>
                  <snm>Bland</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Ramsey</snm>
                  <fnm>TL</fnm>
               </au>
               <au>
                  <snm>Sabree</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Lowe</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Brown</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Kyrpides</snm>
                  <fnm>NC</fnm>
               </au>
               <au>
                  <snm>Hugenholtz</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <fpage>209</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1924867</pubid>
                  <pubid idtype="pmpid" link="fulltext">17577412</pubid>
                  <pubid idtype="doi">10.1186/1471-2105-8-209</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>CLUSTAL W: improving the sensitivity of progressive multiple sequence alignment through sequence weighting, position-specific gap penalties and weight matrix choice</p>
            </title>
            <aug>
               <au>
                  <snm>Thompson</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Higgins</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Gibson</snm>
                  <fnm>TJ</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1994</pubdate>
            <volume>22</volume>
            <fpage>4673</fpage>
            <lpage>4680</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">308517</pubid>
                  <pubid idtype="pmpid" link="fulltext">7984417</pubid>
                  <pubid idtype="doi">10.1093/nar/22.22.4673</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>MrBayes 3: Bayesian phylogenetic inference under mixed models</p>
            </title>
            <aug>
               <au>
                  <snm>Ronquist</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Huelsenbeck</snm>
                  <fnm>JP</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2003</pubdate>
            <volume>19</volume>
            <fpage>1572</fpage>
            <lpage>1574</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/btg180</pubid>
                  <pubid idtype="pmpid" link="fulltext">12912839</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>WWW-query: an on-line retrieval system for biological sequence banks</p>
            </title>
            <aug>
               <au>
                  <snm>Perri&#232;re</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Gouy</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Biochimie</source>
            <pubdate>1996</pubdate>
            <volume>78</volume>
            <fpage>364</fpage>
            <lpage>369</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0300-9084(96)84768-7</pubid>
                  <pubid idtype="pmpid" link="fulltext">8905155</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>Basic local alignment search tool</p>
            </title>
            <aug>
               <au>
                  <snm>Altschul</snm>
                  <fnm>SF</fnm>
               </au>
               <au>
                  <snm>Gish</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Myers</snm>
                  <fnm>EW</fnm>
               </au>
               <au>
                  <snm>Lipman</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>1990</pubdate>
            <volume>215</volume>
            <fpage>403</fpage>
            <lpage>410</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">2231712</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B40">
            <title>
               <p>Spectral clustering of protein sequences</p>
            </title>
            <aug>
               <au>
                  <snm>Paccanaro</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Casbon</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Saqi</snm>
                  <fnm>MA</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2006</pubdate>
            <volume>34</volume>
            <fpage>1571</fpage>
            <lpage>1580</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1409676</pubid>
                  <pubid idtype="pmpid" link="fulltext">16547200</pubid>
                  <pubid idtype="doi">10.1093/nar/gkj515</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>Development of a spectral clustering method for the analysis of molecular data sets</p>
            </title>
            <aug>
               <au>
                  <snm>Brewer</snm>
                  <fnm>ML</fnm>
               </au>
            </aug>
            <source>J Chem Inf Model</source>
            <pubdate>2007</pubdate>
            <volume>47</volume>
            <fpage>1727</fpage>
            <lpage>1733</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1021/ci600565r</pubid>
                  <pubid idtype="pmpid" link="fulltext">17636944</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B42">
            <title>
               <p>Bounds on the cover time</p>
            </title>
            <aug>
               <au>
                  <snm>Broder</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Karlin</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>J Theoret Probab</source>
            <pubdate>1989</pubdate>
            <volume>2</volume>
            <fpage>101</fpage>
            <lpage>120</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1007/BF01048273</pubid>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>
