<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>gb-2004-5-10-r77</ui>
   <ji>GBJ</ji>
   <fm>
      <dochead>Research</dochead>
      <bibl>
         <title>
            <p>Complete genome sequence of the industrial bacterium <it>Bacillus licheniformis </it>and comparisons with closely related <it>Bacillus </it>species</p>
         </title>
         <aug>
            <au id="A1">
               <snm>Rey</snm>
               <mi>W</mi>
               <fnm>Michael</fnm>
               <insr iid="I1"/>
               <email>mwr@novozymes.com</email>
            </au>
            <au id="A2">
               <snm>Ramaiya</snm>
               <fnm>Preethi</fnm>
               <insr iid="I1"/>
               <email>pira@novozymes.com</email>
            </au>
            <au id="A3">
               <snm>Nelson</snm>
               <mi>A</mi>
               <fnm>Beth</fnm>
               <insr iid="I1"/>
               <email>bane@novozymes.com</email>
            </au>
            <au id="A4">
               <snm>Brody-Karpin</snm>
               <mi>D</mi>
               <fnm>Shari</fnm>
               <insr iid="I1"/>
               <email>sbka@novozymes.com</email>
            </au>
            <au id="A5">
               <snm>Zaretsky</snm>
               <mi>J</mi>
               <fnm>Elizabeth</fnm>
               <insr iid="I1"/>
               <email>ejg@novozymes.com</email>
            </au>
            <au id="A6">
               <snm>Tang</snm>
               <fnm>Maria</fnm>
               <insr iid="I1"/>
               <email>mata@novozymes.com</email>
            </au>
            <au id="A7">
               <snm>de Leon</snm>
               <mnm>Lopez</mnm>
               <fnm>Alfredo</fnm>
               <insr iid="I1"/>
               <email>allo@novozymes.com</email>
            </au>
            <au id="A8">
               <snm>Xiang</snm>
               <fnm>Henry</fnm>
               <insr iid="I1"/>
               <email>hxi@novozymes.com</email>
            </au>
            <au id="A9">
               <snm>Gusti</snm>
               <fnm>Veronica</fnm>
               <insr iid="I1"/>
               <email>VGusti@coh.org</email>
            </au>
            <au id="A10">
               <snm>Clausen</snm>
               <fnm>Ib Groth</fnm>
               <insr iid="I2"/>
               <insr iid="I4"/>
               <email>Ib.GrothClausen@astrazeneca.com</email>
            </au>
            <au id="A11">
               <snm>Olsen</snm>
               <mi>B</mi>
               <fnm>Peter</fnm>
               <insr iid="I2"/>
               <email>pbo@novozymes.com</email>
            </au>
            <au id="A12">
               <snm>Rasmussen</snm>
               <mi>D</mi>
               <fnm>Michael</fnm>
               <insr iid="I2"/>
               <email>mdra@novozymes.com</email>
            </au>
            <au id="A13">
               <snm>Andersen</snm>
               <mi>T</mi>
               <fnm>Jens</fnm>
               <insr iid="I2"/>
               <email>jtan@novozymes.com</email>
            </au>
            <au id="A14">
               <snm>J&#248;rgensen</snm>
               <mi>L</mi>
               <fnm>Per</fnm>
               <insr iid="I2"/>
               <email>plj@novozymes.com</email>
            </au>
            <au id="A15">
               <snm>Larsen</snm>
               <mi>S</mi>
               <fnm>Thomas</fnm>
               <insr iid="I2"/>
               <email>thsl@novozymes.com</email>
            </au>
            <au id="A16">
               <snm>Sorokin</snm>
               <fnm>Alexei</fnm>
               <insr iid="I3"/>
               <email>sorokine@jouy.inra.fr</email>
            </au>
            <au id="A17">
               <snm>Bolotin</snm>
               <fnm>Alexander</fnm>
               <insr iid="I3"/>
               <email>bolotine@diamant.jouy.inra.fr</email>
            </au>
            <au id="A18">
               <snm>Lapidus</snm>
               <fnm>Alla</fnm>
               <insr iid="I3"/>
               <insr iid="I5"/>
               <email>alapidus@lbl.gov</email>
            </au>
            <au id="A19">
               <snm>Galleron</snm>
               <fnm>Nathalie</fnm>
               <insr iid="I3"/>
               <email>galleron@diamant.jouy.inra.fr</email>
            </au>
            <au id="A20">
               <snm>Ehrlich</snm>
               <fnm>S Dusko</fnm>
               <insr iid="I3"/>
               <email>ehrlich@diamant.jouy.inra.fr</email>
            </au>
            <au id="A21" ca="yes">
               <snm>Berka</snm>
               <mi>M</mi>
               <fnm>Randy</fnm>
               <insr iid="I1"/>
               <email>ramb@novozymes.com</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Novozymes Biotech Inc, 1445 Drew Ave, Davis, CA 95616, USA</p>
            </ins>
            <ins id="I2">
               <p>Novozymes A/S, Bagsv&#230;rd, DK-2880, Denmark</p>
            </ins>
            <ins id="I3">
               <p>Institut National de la Recherche Agronomique, Paris Cedex 75007, France</p>
            </ins>
            <ins id="I4">
               <p>AstraZeneca International, Lund SE221 87, Sweden</p>
            </ins>
            <ins id="I5">
               <p>Joint Genome Institute, Walnut Creek, CA 94598, USA</p>
            </ins>
         </insg>
         <source>Genome Biology</source>
         <issn>1465-6906</issn>
         <pubdate>2004</pubdate>
         <volume>5</volume>
         <issue>10</issue>
         <fpage>r77</fpage>
         <url>http://genomebiology.com/2004/5/10/R77</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">15461803</pubid>
               <pubid idtype="doi">10.1186/gb-2004-5-10-r77</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>20</day>
               <month>5</month>
               <year>2004</year>
            </date>
         </rec>
         <revrec>
            <date>
               <day>30</day>
               <month>6</month>
               <year>2004</year>
            </date>
         </revrec>
         <acc>
            <date>
               <day>3</day>
               <month>8</month>
               <year>2004</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>13</day>
               <month>9</month>
               <year>2004</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2004</year>
         <collab>Rey et al.; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <shorttitle>
         <p>Complete genome sequence of the industrial bacterium <it>Bacillus licheniformis </it>and comparisons with closely related <it>Bacillus </it>species</p>
      </shorttitle>
      <shortabs>
         <p>The complete sequence of the <it>Bacillus licheniformis </it>ATCC 14580 genome was determined, revealing 4,208 predicted protein-coding genes, 7 rRNA operons and 72 tRNA genes.</p>
      </shortabs>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p><it>Bacillus licheniformis </it>is a Gram-positive, spore-forming soil bacterium that is used in the biotechnology industry to manufacture enzymes, antibiotics, biochemicals and consumer products. This species is closely related to the well studied model organism <it>Bacillus subtilis</it>, and produces an assortment of extracellular enzymes that may contribute to nutrient cycling in nature.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>We determined the complete nucleotide sequence of the <it>B. licheniformis </it>ATCC 14580 genome which comprises a circular chromosome of 4,222,336 base-pairs (bp) containing 4,208 predicted protein-coding genes with an average size of 873 bp, seven rRNA operons, and 72 tRNA genes. The <it>B. licheniformis </it>chromosome contains large regions that are colinear with the genomes of <it>B. subtilis </it>and <it>Bacillus halodurans</it>, and approximately 80% of the predicted <it>B. licheniformis </it>coding sequences have <it>B. subtilis </it>orthologs.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusions</p>
               </st>
               <p>Despite the unmistakable organizational similarities between the <it>B. licheniformis </it>and <it>B. subtilis </it>genomes, there are notable differences in the numbers and locations of prophages, transposable elements and a number of extracellular enzymes and secondary metabolic pathway operons that distinguish these species. Differences include a region of more than 80 kilobases (kb) that comprises a cluster of polyketide synthase genes and a second operon of 38 kb encoding plipastatin synthase enzymes that are absent in the <it>B. licheniformis </it>genome. The availability of a completed genome sequence for <it>B. licheniformis </it>should facilitate the design and construction of improved industrial strains and allow for comparative genomics and evolutionary studies within this group of Bacillaceae.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="BMC" subtype="man_spc_id" id="30010014">Microbiology and parasitology</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010010">Genome studies</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010009">Genetics</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010001">Biochemistry and structural biology</classification>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p><it>Bacillus licheniformis </it>is a Gram-positive, spore-forming bacterium widely distributed as a saprophytic organism in the environment. This species is a close relative of <it>Bacillus subtilis</it>, an organism that is second only to <it>Escherichia coli </it>in the level of detail at which it has been studied. Unlike most other bacilli, which are predominantly aerobic, <it>B. licheniformis </it>is a facultative anaerobe, which may allow it to grow in additional ecological niches. Certain <it>B. licheniformis </it>isolates are capable of denitrification; the relevance of this characteristic to environmental denitrification may be small, however, as the species generally persists in soil as endospores <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>.</p>
         <p>There are numerous commercial and agricultural uses for <it>B. licheniformis </it>and its extracellular products. The species has been used for decades in the manufacture of industrial enzymes including several proteases, &#945;-amylase, penicillinase, pentosanase, cycloglucosyltransferase, &#946;-mannanase and several pectinolytic enzymes. The proteases from <it>B. licheniformis </it>are used in the detergent industry as well as for dehairing and bating of leather <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr></abbrgrp>. Amylases from <it>B. licheniformis </it>are deployed for the hydrolysis of starch, desizing of textiles and sizing of paper <abbrgrp><abbr bid="B3">3</abbr></abbrgrp>. Specific <it>B. licheniformis </it>strains are also used to produce peptide antibiotics such as bacitracin and proticin in addition to a number of specialty chemicals such as citric acid, inosine, inosinic acid and poly-&#947;-glutamic acid <abbrgrp><abbr bid="B4">4</abbr></abbrgrp>. Some <it>B. licheniformis </it>isolates can mitigate the affects of fungal pathogens on maize, grasses and vegetable crops <abbrgrp><abbr bid="B5">5</abbr></abbrgrp>. As an endospore-forming bacterium, the ability of the organism to survive under unfavorable environmental conditions may enhance its potential as a natural biocontrol agent.</p>
         <p><it>B. licheniformis </it>can be differentiated from other bacilli on the basis of metabolic and physiological tests <abbrgrp><abbr bid="B6">6</abbr><abbr bid="B7">7</abbr></abbrgrp>; however, biochemical and phenotypic characteristics may be ambiguous among closely related species. Recent taxonomic studies indicate that <it>B. licheniformis </it>is closely related to <it>B. subtilis </it>and <it>Bacillus amyloliquefaciens </it>on the basis of comparisons of 16S rDNA and 16S-23S internal transcribed spacer (ITS) nucleotide sequences <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. Lapidus <it>et al. </it><abbrgrp><abbr bid="B9">9</abbr></abbrgrp> recently constructed a physical map of the <it>B. licheniformis </it>chromosome using a PCR approach, and established a number of regions of colinearity where gene content and organization were conserved with the <it>B. subtilis </it>genome.</p>
         <p>Given that <it>B. licheniformis </it>is an industrial organism used for the manufacture of enzymes, antibiotics, and chemicals, important in nutrient cycling in the environment, and a species that is taxonomically related to <it>B. subtilis</it>, perhaps the best studied of all Gram-positive bacteria, we derived the complete nucleotide sequence of the <it>B. licheniformis </it>type strain (ATCC 14580) genome. With this data in hand, functional and comparative genomics studies can be initiated that may ultimately lead to new strategies for improving industrial strains as well as better understanding of genome evolution among the species within the <it>subtilis-licheniformis </it>group.</p>
      </sec>
      <sec>
         <st>
            <p>Results and discussion</p>
         </st>
         <sec>
            <st>
               <p>General features of the <it>B. licheniformis </it>genome</p>
            </st>
            <p>The genome of <it>B. licheniformis </it>ATCC 14580 consists of a circular chromosome of 4,222,336 base-pairs (bp) with an average G+C content of 46.2% (Table <tblr tid="T1">1</tblr>). No plasmids were found during the genome analysis, and none were found by agarose gel electrophoresis (data not shown). Using a combination of several gene-finding programs and manual inspection, 4,208 protein-coding sequences (CDSs) were predicted. These CDSs constitute 87% of the genome and have an average length of 873 bp (ranging from 78 to 10,767 bp). They are oriented on the chromosome primarily in the direction of replication (Figure <figr fid="F1">1</figr>) with 74.4% of the genes on the leading strand and 25.6% on the lagging strand. Among the 4,208 protein coding genes, 3,948 (94%) had significant similarity to proteins in PIR, 3,187 (76%) of these gene models contain Interpro motifs, and 2,895 (69%) contain protein motifs found in PFAM. The number of hypothetical and conserved hypothetical proteins in the <it>B. licheniformis </it>genome with hits in the PIR database was 1,318 (212 conserved hypothetical proteins). Among the list of hypothetical and conserved hypothetical gene products, 683 (52%) have protein motifs contained in PFAM (148 conserved hypothetical proteins). There are 72 tRNA genes representing all 20 amino acids and seven rRNA operons.</p>
            <tbl id="T1" hint_layout="double">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Features of the <it>B. licheniformis </it>genome and comparison with genomes of other <it>Bacillus </it>species</p>
               </caption>
               <tblbdy cols="7">
                  <r>
                     <c ca="left">
                        <p>Feature</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>B. licheniformis</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p><it>B. subtilis</it>*</p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>B. halodurans</it>
                           <sup>&#8224;</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>Oceanobacillus iheyensis</it>
                           <sup>&#8225;</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>B. anthracis</it>
                           <sup>&#167;</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>B. cereus</it>
                           <sup>&#182;</sup>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chromosome size (bp)</p>
                     </c>
                     <c ca="center">
                        <p>4,222,336</p>
                     </c>
                     <c ca="center">
                        <p>4,214,630</p>
                     </c>
                     <c ca="center">
                        <p>4,202,352</p>
                     </c>
                     <c ca="center">
                        <p>3,630,528</p>
                     </c>
                     <c ca="center">
                        <p>5,227,293</p>
                     </c>
                     <c ca="center">
                        <p>5,426,909</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>G+C content (mol%)</p>
                     </c>
                     <c ca="center">
                        <p>46.2</p>
                     </c>
                     <c ca="center">
                        <p>43.5</p>
                     </c>
                     <c ca="center">
                        <p>43.7</p>
                     </c>
                     <c ca="center">
                        <p>35.7</p>
                     </c>
                     <c ca="center">
                        <p>35.4</p>
                     </c>
                     <c ca="center">
                        <p>35.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Protein coding sequences</p>
                     </c>
                     <c ca="center">
                        <p>4,208</p>
                     </c>
                     <c ca="center">
                        <p>4,106</p>
                     </c>
                     <c ca="center">
                        <p>4,066</p>
                     </c>
                     <c ca="center">
                        <p>3,496</p>
                     </c>
                     <c ca="center">
                        <p>5,508</p>
                     </c>
                     <c ca="center">
                        <p>5,366</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Average length (bp)</p>
                     </c>
                     <c ca="center">
                        <p>873</p>
                     </c>
                     <c ca="center">
                        <p>896</p>
                     </c>
                     <c ca="center">
                        <p>879</p>
                     </c>
                     <c ca="center">
                        <p>883</p>
                     </c>
                     <c ca="center">
                        <p>800</p>
                     </c>
                     <c ca="center">
                        <p>835</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Percent of coding region</p>
                     </c>
                     <c ca="center">
                        <p>86</p>
                     </c>
                     <c ca="center">
                        <p>87</p>
                     </c>
                     <c ca="center">
                        <p>85</p>
                     </c>
                     <c ca="center">
                        <p>85</p>
                     </c>
                     <c ca="center">
                        <p>84</p>
                     </c>
                     <c ca="center">
                        <p>84</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Ribosomal RNA operons</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>10</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Number of tRNAs</p>
                     </c>
                     <c ca="center">
                        <p>72</p>
                     </c>
                     <c ca="center">
                        <p>86</p>
                     </c>
                     <c ca="center">
                        <p>78</p>
                     </c>
                     <c ca="center">
                        <p>69</p>
                     </c>
                     <c ca="center">
                        <p>95</p>
                     </c>
                     <c ca="center">
                        <p>108</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Phage-associated genes</p>
                     </c>
                     <c ca="center">
                        <p>71</p>
                     </c>
                     <c ca="center">
                        <p>268</p>
                     </c>
                     <c ca="center">
                        <p>42</p>
                     </c>
                     <c ca="center">
                        <p>27</p>
                     </c>
                     <c ca="center">
                        <p>62</p>
                     </c>
                     <c ca="center">
                        <p>124</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Transposase genes of IS elements</p>
                     </c>
                     <c ca="center">
                        <p>10</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>93</p>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                     <c ca="center">
                        <p>18</p>
                     </c>
                     <c ca="center">
                        <p>10</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*Kunst <it>et al. </it>[10]; <sup>&#8224;</sup>Takami <it>et al. </it>[13]; <sup>&#8225;</sup>Takami <it>et al. </it>[16]; <sup>&#167;</sup>Read <it>et al. </it>[61]; <sup>&#182;</sup>Ivanova <it>et al. </it>[62].</p>
               </tblfn>
            </tbl>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Circular representation of the <it>B. licheniformis </it>ATCC 14580 chromosome</p>
               </caption>
               <text>
                  <p>Circular representation of the <it>B. licheniformis </it>ATCC 14580 chromosome. Circles are numbered from 1 (outermost) to 7 (innermost). Circles 1 and 2 show the locations of predicted CDSs on the + and - strands, respectively; circle 3, %G+C; circle 4, GC skew ((G-C/G+C)); circle 5, homology with <it>B. subtilis </it>168; circle 6, homology with <it>B. halodurans</it>; circle 7 shows positions of nine copies of insertion sequence element <it>IS3Bli1 </it>and a putative transposase gene; small green bars inside circle 7 denote the positions of possible prophage elements.</p>
               </text>
               <graphic file="gb-2004-5-10-r77-1"/>
            </fig>
            <p>The likely origin of replication (Figure <figr fid="F1">1</figr>) was identified by similarities to several features of the corresponding regions in <it>B. subtilis </it>and other bacteria. These included co-localization of four genes (<it>rpmH</it>, <it>dnaA</it>, <it>dnaN</it>, and <it>recF</it>) near the origin, GC nucleotide skew ((G-C)/(G+C)) analysis, and the presence of multiple <it>dnaA</it>-boxes and AT-rich sequences immediately upstream of the <it>dnaA </it>gene <abbrgrp><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp>. On the basis of these observations we assigned a cytosine residue of the <it>Bst</it>BI restriction site between the <it>rpmH </it>and <it>dnaA </it>genes to be the first nucleotide of the <it>B. licheniformis </it>genome. The replication termination site was localized near 2.02 megabases (Mb) by GC skew analysis. This region lies roughly opposite the origin of replication (Figure <figr fid="F1">1</figr>). Unlike <it>B. subtilis</it>, there was no apparent gene encoding a replication terminator protein (<it>rtp</it>) in <it>B. licheniformis</it>. The <it>Bacillus halodurans </it>genome also lacks an obvious <it>rtp </it>function <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>; therefore, it seems likely that <it>B. subtilis </it>acquired the <it>rtp </it>gene following its divergence from <it>B. halodurans </it>and <it>B. licheniformis</it>.</p>
         </sec>
         <sec>
            <st>
               <p>Transposable elements, prophages and atypical regions</p>
            </st>
            <p>The genome of <it>B. licheniformis </it>ATCC 14580 contains nine identical copies of a 1,285 bp insertion sequence element termed <it>IS3Bli1 </it><abbrgrp><abbr bid="B9">9</abbr></abbrgrp>. This sequence shares a number of features with other <it>IS3 </it>family elements <abbrgrp><abbr bid="B9">9</abbr></abbrgrp> including direct repeats of 3-5 bp, a 10-bp left inverted repeat, and a 9 bp right inverted repeat (Figure <figr fid="F2">2</figr>). <it>IS3Bli1 </it>encodes two predicted overlapping CDSs, designated <it>orfA </it>and <it>orfB </it>in relative translational reading frames of 0 and -1. The presence of a 'slippery heptamer' motif, AAAAAAG, before the stop codon in <it>orfA </it>may indicate that programmed translational frameshifting occurs between these two coding sequences, resulting in a single gene product <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>. The <it>orfB </it>gene product harbors the DD(35)E(7)K motif, a highly conserved pattern among insertion sequences. Eight of these <it>IS3Bli1 </it>elements lie in intergenic regions, and one interrupts the <it>comP </it>gene as noted previously <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>. In addition to these insertion sequences, the genome encodes a putative transposase that is most closely related (E = 1.8 &#215; 10<sup>-11</sup>) to one identified in the <it>Thermoanaerobacter tengcongensis </it>genome <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>; however, similar transposase genes are also found in the chromosomes of <it>B. halodurans </it><abbrgrp><abbr bid="B13">13</abbr></abbrgrp>, <it>Oceanobacillus iheyensis </it><abbrgrp><abbr bid="B16">16</abbr></abbrgrp>, <it>Streptococcus agalactiae </it><abbrgrp><abbr bid="B17">17</abbr></abbrgrp> and <it>Streptococcus pyogenes </it><abbrgrp><abbr bid="B18">18</abbr></abbrgrp>.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Schematic map of the insertion sequence <it>IS3Bli1</it></p>
               </caption>
               <text>
                  <p>Schematic map of the insertion sequence <it>IS3Bli1</it>. Nine identical copies of this 1,285-bp element were found in the genome of <it>B. licheniformis </it>ATCC 14580. Features of the <it>IS3Bli1 </it>element are summarized in the text.</p>
               </text>
               <graphic file="gb-2004-5-10-r77-2"/>
            </fig>
            <p>The presence of several bacteriophage lysogens or prophage-like elements was revealed by Smith-Waterman comparisons to other bacterial genomes and by their AT-rich signatures (Figure <figr fid="F3">3</figr>, Table <tblr tid="T2">2</tblr>). Prophage sequences, designated NZP1 and NZP3 (similar to <it>B. subtilis </it>prophages PBSX and &#966;-105), were discovered by noting the presence of nearby genes that code for the large subunit of terminase, a signature protein that is highly conserved among prophages <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>. Interestingly, a terminase gene was not observed in the third putative prophage, termed NZP2 (similarity to <it>B. subtilis </it>phage SPP1); however, its absence may be the result of genome deterioration during evolution. Interestingly, we observed that regions in which the G+C content is less than 39% usually encoded proteins that have no <it>B. subtilis </it>ortholog and share identity only with hypothetical and conserved hypothetical genes. Two of these AT-rich segments correspond to the NZP2 and NZP3 prophages.</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Isochore plot of the <it>B. licheniformis </it>ATCC 14580 genome showing G+C content as a function of position</p>
               </caption>
               <text>
                  <p>Isochore plot of the <it>B. licheniformis </it>ATCC 14580 genome showing G+C content as a function of position. AT-rich peaks (numbered 1-24) are marked on the plot, and a single island that is atypically GC-rich is indicated by number 25. Table 2 lists the specific chromosomal features represented by each numbered peak.</p>
               </text>
               <graphic file="gb-2004-5-10-r77-3"/>
            </fig>
            <tbl id="T2" hint_layout="double">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Gene sequences corresponding to isochore peaks shown in Figure 3</p>
               </caption>
               <tblbdy cols="5">
                  <r>
                     <c ca="left">
                        <p>Peak</p>
                     </c>
                     <c ca="center">
                        <p>Size (kb)</p>
                     </c>
                     <c ca="center">
                        <p>% G+C</p>
                     </c>
                     <c ca="center">
                        <p><it>B. subtilis </it>orthologs</p>
                     </c>
                     <c ca="left">
                        <p>Annotation</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="5">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>3.2</p>
                     </c>
                     <c ca="center">
                        <p>28</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>ABC transporter, conserved hypothetical, and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>3.6</p>
                     </c>
                     <c ca="center">
                        <p>38</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Conserved hypothetical and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>2.1</p>
                     </c>
                     <c ca="center">
                        <p>37</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Conserved hypothetical and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>2.8</p>
                     </c>
                     <c ca="center">
                        <p>37</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>2.7</p>
                     </c>
                     <c ca="center">
                        <p>37</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Phosphotriesterase, conserved hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>7.4</p>
                     </c>
                     <c ca="center">
                        <p>37</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Type I restriction-modification system</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>3.5</p>
                     </c>
                     <c ca="center">
                        <p>38</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>8.4</p>
                     </c>
                     <c ca="center">
                        <p>38</p>
                     </c>
                     <c ca="center">
                        <p>Partial</p>
                     </c>
                     <c ca="left">
                        <p><it>yybO</it>, <it>pucR</it>, <it>pucH</it>, <it>yurH</it>, <it>ycbE</it>, <it>yjfA</it>, <it>rapG</it>, carbamate kinase, conserved hypothetical and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>10.1</p>
                     </c>
                     <c ca="center">
                        <p>36</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>SPP-1 like phage, conserved hypothetical and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>10</p>
                     </c>
                     <c ca="center">
                        <p>4.8</p>
                     </c>
                     <c ca="center">
                        <p>37</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                     <c ca="left">
                        <p>Hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>3.0</p>
                     </c>
                     <c ca="center">
                        <p>33</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Conserved hypothetical and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>12</p>
                     </c>
                     <c ca="center">
                        <p>4.3</p>
                     </c>
                     <c ca="center">
                        <p>34</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Conserved hypothetical and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>13</p>
                     </c>
                     <c ca="center">
                        <p>2.2</p>
                     </c>
                     <c ca="center">
                        <p>34</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Conserved hypothetical and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>14</p>
                     </c>
                     <c ca="center">
                        <p>5.4</p>
                     </c>
                     <c ca="center">
                        <p>36</p>
                     </c>
                     <c ca="center">
                        <p>Partial</p>
                     </c>
                     <c ca="left">
                        <p>Conserved hypothetical and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>15</p>
                     </c>
                     <c ca="center">
                        <p>4.4</p>
                     </c>
                     <c ca="center">
                        <p>35</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Conserved hypothetical and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>16</p>
                     </c>
                     <c ca="center">
                        <p>4.6</p>
                     </c>
                     <c ca="center">
                        <p>33</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>ABC transporter and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>17</p>
                     </c>
                     <c ca="center">
                        <p>3.5</p>
                     </c>
                     <c ca="center">
                        <p>35</p>
                     </c>
                     <c ca="center">
                        <p>Partial</p>
                     </c>
                     <c ca="left">
                        <p><it>comP</it>, <it>comX</it>, <it>comQ</it>, and <it>IS3Bli1</it></p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>18</p>
                     </c>
                     <c ca="center">
                        <p>6.8</p>
                     </c>
                     <c ca="center">
                        <p>37</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p><it>IS3Bli1</it>, conserved hypothetical and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>19</p>
                     </c>
                     <c ca="center">
                        <p>3.8</p>
                     </c>
                     <c ca="center">
                        <p>38</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Phage w-105-like genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>20</p>
                     </c>
                     <c ca="center">
                        <p>6.8</p>
                     </c>
                     <c ca="center">
                        <p>35</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                     <c ca="left">
                        <p><it>tagG </it>and <it>tagF </it>genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>21</p>
                     </c>
                     <c ca="center">
                        <p>3.2</p>
                     </c>
                     <c ca="center">
                        <p>34</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Conserved hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>22</p>
                     </c>
                     <c ca="center">
                        <p>1.7</p>
                     </c>
                     <c ca="center">
                        <p>34</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Conserved hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>23</p>
                     </c>
                     <c ca="center">
                        <p>1.6</p>
                     </c>
                     <c ca="center">
                        <p>37</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>24</p>
                     </c>
                     <c ca="center">
                        <p>16.2</p>
                     </c>
                     <c ca="center">
                        <p>35</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Type I restriction-modification system, conserved hypothetical and hypothetical genes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>25</p>
                     </c>
                     <c ca="center">
                        <p>3.3</p>
                     </c>
                     <c ca="center">
                        <p>62</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="left">
                        <p>Hypothetical gene</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <p>An isochore plot (Figure <figr fid="F3">3</figr>) also revealed the presence of a region with an atypically high (62%) G+C content. This segment contains two hypothetical genes whose sizes (3,831 and 2,865 bp) greatly exceed the size of an average CDS in <it>B. licheniformis</it>. The first gene encodes a protein of 1,277 amino acids for which Interpro predicts 16 collagen triple-helix repeats, and the amino acid pattern TGATGPT is repeated 75 times within the polypeptide. The second CDS is smaller, and encodes a protein with 11 collagen triple-helix repeats; the same TGATGPT motif recurs 56 times. The primary translation products from these genes do not contain canonical signal peptides for secretion, and they do not contain motifs for the twin-arginine or sortase-mediated translocation pathways. Therefore, it is not likely that they are exported to the cell surface or the extracellular medium. Interestingly, the chromosomal region (19 kb) adjacent to these genes is clearly non-colinear with the <it>B. subtilis </it>genome, and virtually all of the predicted genes encode hypothetical or conserved hypothetical proteins. There are a number of bacterial proteins listed in PIR that also contain collagen triple-helix repeat regions, including two from <it>Mesorhizobium loti </it>(accession numbers NF00607049 and NF00607035) and three from <it>B. cereus </it>(accession numbers NF01692528, NF01269899 and NF01694666). These putative orthologs share 53-76% amino-acid sequence identity with their counterparts in <it>B. licheniformis</it>, and their functions are unknown.</p>
         </sec>
         <sec>
            <st>
               <p>Extracellular enzymes and metabolic activities</p>
            </st>
            <p>In the <it>Bacillus licheniformis </it>genome, 689 of the 4,208 gene models have signal peptides forecast by SignalP <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>. Of these, 309 have no transmembrane domain predicted by TMHMM <abbrgrp><abbr bid="B21">21</abbr></abbrgrp> and 134 are hypothetical or conserved hypothetical genes. Based on a manual examination of the remaining 175 genes, at least 82 are likely to encode secreted proteins and enzymes. Moreover, there are 27 predicted extracellular proteins encoded by the <it>B. licheniformis </it>ATCC 14580 genome that are not found in <it>B. subtilis </it>168. In accordance with its saprophytic lifestyle, the secretome of <it>B. licheniformis </it>encodes numerous secreted enzymes that hydrolyze polysaccharides, proteins, lipids and other nutrients.</p>
            <p>Cellulose is the most abundant polysaccharide on Earth, and microorganisms that hydrolyze cellulose contribute to the global carbon cycle. Interestingly, two gene clusters involved in cellulose degradation and utilization were discovered in <it>B. licheniformis</it>, and there are no counterparts in <it>B. subtilis </it>168. The enzymes encoded by the first gene cluster include two putative endoglucanases belonging to glycoside hydrolase families GH9 and GH5, a probable cellulose-1,4-&#946;-cellobiosidase of family GH48, and a putative &#946;-mannanase of family GH5. The &#946;-mannanase (GH5) and endoglucanase (GH9) both harbor carbohydrate-binding motifs. With the exception of the cellulose-1,4-&#946;-cellobiosidase (GH48), all of the gene products encoded in this cluster have secretory signal peptides, and all have homologs in <it>Bacillus </it>species other than <it>B. subtilis</it>. The overall G+C content of this cluster (48%) does not appear to differ appreciably from that of the genome average (46%). The second gene cluster encodes a putative &#946;-glucosidase (GH1) and three components of a cellobiose-specific PTS transport complex. A second &#946;-glucosidase (GH3) gene is present at an unlinked locus in the genome. Collectively, the genes in these two clusters should enable <it>B. licheniformis </it>to utilize cellulose as a carbon and energy source, converting it to cellobiose and ultimately glucose. In this regard, we have confirmed that <it>B. licheniformis </it>ATCC 14580 is capable of growth on carboxymethyl cellulose as a sole carbon source (not shown). The chromosome of <it>B. licheniformis </it>ATCC 14580 encodes a number of additional carbohydrase activities that may allow the organism to grow on a broad range of polysaccharides. These include xylanase, endo-arabinase and pectate lyase that may be involved in degradation of hemicellulose, &#945;-amylase and &#945;-glucosidase for starch hydrolysis, chitinases for the breakdown of chitooligosaccharides from fungi and insects, and levanase for utilization of &#946;-D-fructans (levans). Several of these activities are marketed as industrial enzymes.</p>
            <p>Saprophytic organisms must utilize a variety of nitrogenous compounds as nutrients for growth and metabolism. On the basis of the information encoded in its genome, <it>B. licheniformis </it>ATCC 14580 possesses the ability to acquire nitrogen from exogenous proteins, peptides, amino acids, ammonia, nitrate and nitrite. Like <it>B. subtilis</it>, the repertoire of extracellular proteases produced by <it>B. licheniformis </it>includes serine proteases (<it>aprE</it>, <it>epr</it>, <it>vpr</it>), metalloprotease (<it>mpr</it>), and an assortment of endo- and exopeptidases (<it>yjbG</it>, <it>ydiC</it>, <it>gcp</it>, <it>ykvY</it>, <it>ampS</it>, <it>bpr </it>(two copies), <it>yfxM</it>, <it>yuiE</it>, <it>yusX</it>, <it>ywaD</it>, <it>pepT</it>). However, <it>B. licheniformis </it>also has the capacity to produce a number of additional proteases and peptidases that are not encoded in the <it>B. subtilis </it>genome. These include a clostripain-like protease, a zinc-metallopeptidase, a probable glutamyl endopeptidase, an aminopeptidase C homolog, two putative dipeptidases and a zinc-carboxypeptidase.</p>
            <p><it>B. licheniformis </it>also has the ability to utilize amino and imino nitrogen from arginine, asparagine and glutamine via arginine deiminase, arginase, asparaginase and glutaminase activities. Interestingly, there appear to be two genes each for arginase, asparaginase and glutaminase. Presumably, the arginine deiminase activity is expressed during anaerobic growth on arginine, whereas the arginase activities are predominant during aerobic growth. The occurrence of putative arginase genes is somewhat of an enigma in <it>B. licheniformis</it>, because there are no genes encoding urease activity for the hydrolysis of urea that is generated by the arginase reaction. In addition to the absence of urease gene homologs (<it>ureABC</it>) in <it>B. licheniformis</it>, the glutamine ABC transporters (<it>glnH</it>, <it>glnM</it>, <it>glnP</it>, <it>glnQ </it>gene products) are also lacking.</p>
            <p>It appears that nitrogen assimilation and transport pathways may be coordinated similarly in <it>B. licheniformis </it>and <it>B. subtilis </it>owing to the presence of key genes such as <it>glnA</it>, <it>glnR</it>, <it>tnrA </it>and <it>nrgA </it>in both species. Likewise, the pathways for nitrate/nitrite transport and metabolism in <it>B. licheniformis </it>appear to be analogous to the corresponding pathways in <it>B. subtilis </it>as suggested by the presence of <it>nasABC </it>(nitrate transport), <it>narGHIJ </it>(respiratory nitrate reductase), and <it>nasDEF </it>(NADH-dependent nitrite reductase) genes. Unlike <it>B. subtilis</it>, <it>B. licheniformis </it>evidently possesses the capability for anaerobic respiration using nitric oxide reductase. Moreover, the gene encoding this activity lies in a cluster that includes CDSs for <it>narK </it>(nitrite extrusion protein), two putative <it>fnr </it>proteins (transcriptional regulators of anaerobic growth), and a <it>dnrN</it>-like gene product (nitric oxide-dependent regulator). These observations are consistent with previous findings that certain <it>B. licheniformis </it>isolates are capable of denitrification <abbrgrp><abbr bid="B22">22</abbr></abbrgrp>. While denitrification is a process of major ecological importance, the contribution of <it>B. licheniformis </it>may be small as the species exists predominantly as endospores in soil <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>.</p>
            <p>Microbial D-hydantoinase enzymes have been applied to the industrial production of optically pure D-amino acids for synthesis of antibiotics, pesticides, sweeteners and therapeutic amino acids <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>. This enzyme catalyzes the hydrolysis of cyclic ureides such as dihydropyrimidines and 5-monosubstituted hydantoins to <it>N</it>-carbamoyl amino acids. Hydantoinase activities have been detected in a variety of bacterial genera, and a cluster of six genes in <it>B. licheniformis </it>appears to confer a similar capability. This gene cluster encodes <it>N</it>-methylhydantoinase (ATP-hydrolyzing), hydantoin utilization proteins A and B (<it>hyuAB </it>homologs), a possible transcriptional regulator (TetR/AcrR family), a putative pyrimidine permease, and a hypothetical protein that contains an Interpro domain (IPR004399) for phosphomethylpyrimidine kinase.</p>
         </sec>
         <sec>
            <st>
               <p>Protein export, sporulation and competence pathways</p>
            </st>
            <p>Kunst <it>et al</it>. <abbrgrp><abbr bid="B10">10</abbr></abbrgrp> listed 18 genes that have a major role in the secretion of extracellular enzymes by the classical (Sec) pathway in <it>B. subtilis </it>168. This list includes several chaperonins, signal peptidases, components of the signal recognition particle and protein translocase complexes. All members of this list have <it>B. licheniformis </it>counterparts. In addition to the Sec pathway, some <it>B. subtilis </it>proteins are directed into the twin-arginine (Tat) export pathway, possibly in a Sec-independent manner. Curiously, the <it>B. licheniformis </it>genome encodes three <it>tat </it>gene orthologs (<it>tatAY</it>, <it>tatCD</it>, and <it>tatCY</it>), but two others (<it>tatAC </it>and <it>tatAD</it>) are conspicuously absent. Furthermore, specific proteins may be exported to the cell surface via lipoprotein signal peptides or sortase factors. Lipoprotein signal peptides are cleaved with a specific signal peptidase (Lsp) encoded by the <it>lspA </it>gene in <it>B. subtilis</it>. An <it>lspA </it>homolog can be found in <it>B. licheniformis </it>as well, suggesting that this species may possess the ability to export lipoproteins via a similar mechanism. Lastly, surface proteins in Gram-positive bacteria are frequently attached to the cell wall by sortase enzymes, and genome analyses have revealed that more than one sortase is often produced by a given species. In this regard, three possible sortase gene homologs were detected in the genome of <it>B. licheniformis </it>ATCC 14580. Together these observations suggest that the central features of the protein export machinery are principally conserved in <it>B. subtilis </it>and <it>B. licheniformis</it>.</p>
            <p>From the list of 139 sporulation genes tabulated by Kunst <it>et al</it>. <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>, all but six have obvious counterparts in <it>B. licheniformis</it>. These six exceptions (<it>spsABCEFG</it>) comprise an operon involved in synthesis of a spore coat polysaccharide in <it>B. subtilis</it>. In addition, the response regulator gene family (<it>phrACEFGI</it>) appears to have a low level of sequence conservation between <it>B. subtilis </it>and <it>B. licheniformis</it>.</p>
            <p>Natural competence (the ability to take up and process exogenous DNA in specific growth conditions) is a feature of few <it>B. licheniformis </it>strains <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>. The reasons for variability in competence phenotype have not been explored at the genetic level, but the genome data offer several possible explanations. Although the <it>B. licheniformis </it>genome encodes all of the late competence functions ascribed in <it>B. subtilis </it>(for example, <it>comC</it>, <it>comEFG </it>operons, <it>comK</it>, <it>mecA</it>), it lacks an obvious <it>comS </it>gene, and the <it>comP </it>gene is punctuated by an insertion sequence element (<it>IS3Bli1</it>), suggesting that the early stages of competence development have been pre-empted in <it>B. licheniformis </it>ATCC 14580. Whether these early functions can be restored by introducing the corresponding genes from <it>B. subtilis </it>is unknown. In addition to an apparent deficiency in DNA uptake, two type I restriction-modification systems were discovered that may also contribute to diminished transformation efficiencies. These are distinct from the <it>ydiOPS </it>genes of <it>B. subtilis</it>, and could participate in degradation of improperly modified DNA from heterologous hosts used during construction of recombinant expression vectors. Each of these loci in <it>B. licheniformis </it>(designated as <it>BliI </it>and <it>BliII</it>) encode putative HsdS, HsdM and HsdR subunits that share significant amino-acid sequence identity to type I restriction-modification proteins in other bacteria. Curiously, the G+C-content for these loci (37%) is substantially lower than the overall genome average (46%) which may hint that they are the result of gene acquisitions. Lastly, the synthesis of a glutamyl polypeptide capsule has also been implicated as a potential barrier to transformation of <it>B. licheniformis </it>strains <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. While laboratory strains of <it>B. subtilis </it>usually do not produce significant capsular material, the genome sequence of <it>B. subtilis </it>168 indicates that they may harbor the genes required for synthesis of polyglutamic acid. In contrast, many <it>B. licheniformis </it>isolates produce copious amounts of capsular material, giving rise to colonies with a wet or slimy appearance. Six genes were predicted (<it>ywtABDEF </it>and <it>ywsC </it>orthologs) that may be involved in the synthesis of polyglutamic acid capsular material in <it>B. licheniformis</it>.</p>
         </sec>
         <sec>
            <st>
               <p>Antibiotics, secondary metabolites and siderophores</p>
            </st>
            <p>Bacitracin is a cyclic peptide antibiotic that is synthesized non-ribosomally by some <it>B. licheniformis </it>isolates <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>. While there is variation in the prevalence of bacitracin synthase genes among laboratory strains of this species, one study suggested that up to 50% may harbor the <it>bac </it>operon <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>. Interestingly, the <it>bac </it>operon is not present in the type strain (ATCC 14580) genome. Seemingly, the only non-ribosomal peptide synthase operon encoded by the <it>B. licheniformis </it>type strain genome is that responsible for lichenysin biosynthesis. Lichenysin structurally resembles surfactin from <it>B. subtilis </it><abbrgrp><abbr bid="B28">28</abbr></abbrgrp>, and their respective biosynthetic operons are highly similar. Surprisingly, we found no <it>B. licheniformis </it>counterparts for the <it>pps </it>(plipastatin synthase) and polyketide synthase (<it>pks</it>) operons of <it>B. subtilis</it>. Collectively, these two regions represent sizeable portions (80 kb and 38 kb, respectively) of the chromosome in <it>B. subtilis</it>, although they are reportedly dispensable <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>.</p>
            <p>Unexpectedly, a cluster of 11 genes was found encoding a lantibiotic, with its associated modification and transport functions. We designated this peptide of 75 amino acids as lichenicidin, and its closest homolog is mersacidin from <it>Bacillus </it>sp. strain HIL-Y85/54728 <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>. Lantibiotics are ribosomally synthesized peptides that are modified post-translationally so that the final molecules contain rare thioether amino acids such as lanthionine and/or methyl-lanthionine <abbrgrp><abbr bid="B31">31</abbr></abbrgrp>. Like mersacidin, lichenicidin appears to be a type B lantibiotic, comprising a rigid globular peptide with no net charge (7 acidic residues, 7 basic residues) and a leader peptide with a conserved double glycine cleavage site (GG-type leader peptide). These antimicrobial compounds have attracted much attention in recent years as models for the design and genetic engineering of improved antimicrobial agents <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>. However, since several post-translational modifications and product-specific export functions are required, a dedicated expression system is a prerequisite to provide all the factors necessary to synthesize, modify and transport the lantibiotic peptide. With its history of use in industrial microbiology, <it>B. licheniformis </it>may be an attractive candidate for the development of such an expression system.</p>
            <p>Like <it>B. subtilis </it>168, the <it>B. licheniformis </it>ATCC 14580 chromosome harbors a siderophore biosynthesis gene cluster (<it>dhbABCEF</it>), and the organization of the cluster is similar to the corresponding chromosomal segment in <it>B. subtilis</it>. In addition, the <it>B. licheniformis </it>genome contains a second gene cluster of four genes (<it>iucABCD</it>) that show significant similarity to proteins involved in aerobactin biosynthesis in <it>E. coli</it>. Surprisingly, a gene encoding the receptor protein (<it>iutA </it>homolog) was not found in <it>B. licheniformis</it>. The <it>B. halodurans </it>genome also contains genes that are homologous to <it>iucABCD</it>, but like <it>B. licheniformis</it>, no <it>iutA </it>homolog could be found using BLAST or Smith-Waterman searches.</p>
         </sec>
         <sec>
            <st>
               <p>Comparison of the <it>B. licheniformis </it>genome with those of other bacilli</p>
            </st>
            <p>The <it>B. licheniformis </it>ATCC 14580 gene models were compared to the list of essential genes in <it>B. subtilis </it><abbrgrp><abbr bid="B33">33</abbr></abbrgrp>. Predictably, all of the essential genes in <it>B. subtilis </it>have orthologs in <it>B. licheniformis</it>, and most are present in a wide range of bacterial taxa. In pairwise BLAST comparisons, 66% of the predicted <it>B. licheniformis </it>genes have orthologs in <it>B. subtilis</it>, and 55% of the gene models are represented by orthologous sequences in <it>B. halodurans </it>(E-value threshold of 1 &#215; 10<sup>-5</sup>; Figure <figr fid="F4">4</figr>). Using a reciprocal BLASTP analysis we found 1,719 orthologs that are common to all three species (E-value threshold of 1 &#215; 10<sup>-5</sup>).</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Venn diagram comparing the orthologous gene complements of <it>B. licheniformis </it>ATCC 14580, <it>B. subtilis </it>168 and <it>B. halodurans </it>C-125</p>
               </caption>
               <text>
                  <p>Venn diagram comparing the orthologous gene complements of <it>B. licheniformis </it>ATCC 14580, <it>B. subtilis </it>168 and <it>B. halodurans </it>C-125. Numbers in purple boxes indicate the number of pairwise orthologs between adjacent species (BLAST threshold E = 1 &#215; 10<sup>-5</sup>). Numbers in the outer circles represent the total number of CDSs predicted in each genome, numbers in areas of overlap indicate the number of orthologs predicted by reciprocal BLASTP analysis (threshold E = 1 &#215; 10<sup>-5</sup>), and the number in the center gives the number of orthologous sequences common to all three genomes.</p>
               </text>
               <graphic file="gb-2004-5-10-r77-4"/>
            </fig>
            <p>As noted by Lapidus <it>et al. </it><abbrgrp><abbr bid="B9">9</abbr></abbrgrp>, there are broad regions of colinearity between the genomes of <it>B. licheniformis </it>and <it>B. subtilis </it>(Figure <figr fid="F5">5</figr>). Less conservation of genome organization exists between <it>B. licheniformis </it>and <it>B. halodurans</it>, and substantial genomic segments have been inverted in <it>B. halodurans </it>with respect to <it>B. licheniformis </it>and <it>B. subtilis</it>. These observations clearly support previous hypotheses <abbrgrp><abbr bid="B8">8</abbr></abbrgrp> that <it>B. subtilis </it>and <it>B. licheniformis </it>are phylogenetically and evolutionarily closer to each other than to <it>B. halodurans</it>.</p>
            <fig id="F5">
               <title>
                  <p>Figure 5</p>
               </title>
               <caption>
                  <p>Two- and three-dimensional similarity plots comparing the distribution of orthologs on the chromosomes of <it>B. licheniformis</it>, <it>B. subtilis </it>and <it>B. halodurans</it></p>
               </caption>
               <text>
                  <p>Two- and three-dimensional similarity plots comparing the distribution of orthologs on the chromosomes of <it>B. licheniformis</it>, <it>B. subtilis </it>and <it>B. halodurans</it>. BLAST scores were generated and dots were positioned according to the locations in the genome where orthologs exist in order to view possible regions of possible colinearity. The minimum BLAST expectancy score for each dot in this example was 1 &#215; 10<sup>-50</sup>. <b>(a) </b>The plot for <it>B. licheniformis </it>versus <it>B. subtilis</it>; <b>(b) </b><it>B. halodurans </it>versus <it>B. subtilis</it>; <b>(c) </b><it>B. licheniformis </it>versus <it>B. halodurans</it>; <b>(d) </b>a three-dimensional scatter plot comparing the distribution of orthologs among all three species. Dots located on the diagonal are indicative of conserved location of orthologous genes between species, whereas a line of dots that lie perpendicular to the diagonal suggests an inversion of a genomic segment between species.</p>
               </text>
               <graphic file="gb-2004-5-10-r77-5"/>
            </fig>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusions</p>
         </st>
         <p>In comparisons of shared regions, the genomes of <it>B. licheniformis </it>ATCC 14580 and <it>B. subtilis </it>168 are approximately 84.6% identical at the nucleotide level and show extensive organizational similarity. Accordingly, their genome sequences represent potentially useful instruments for comparative and evolutionary studies among species within the <it>subtilis-licheniformis </it>group, and they may offer new information regarding the evolution and ecology of these closely related species.</p>
         <p>Despite the broad colinearity of <it>B. licheniformis </it>and <it>B. subtilis </it>genomes, there are local regions that are individually unique. These include chromosome segments that comprise prophage and insertion sequence elements, DNA restriction-modification systems, antibiotic synthases, and a number of extracellular enzymes and metabolic activities that are not present in <it>B. subtilis</it>. It is tempting to speculate that the presence of these genes forecasts the ability of <it>B. licheniformis </it>to grow on an expanded array of substrates and/or in additional ecological niches compared to <it>B. subtilis</it>. Together, the similarities and differences may hint at overlapping but non-identical environmental niches for these taxa.</p>
         <p>The <it>subtilis-licheniformis </it>group of bacilli includes many strains that are used to manufacture industrial enzymes, antibiotics and biochemicals. The availability of a complete genome from <it>B. licheniformis </it>should permit a thorough comparison of the biochemical pathways and regulatory networks in <it>B. subtilis </it>and <it>B. licheniformis</it>, thereby offering new opportunities and strategies for improvement of industrial strains. When considering the safety of <it>B. licheniformis </it>as an industrial organism it should be noted that the species is considered neither a human pathogen nor a toxigenic microorganism <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>; however, there are reports in the literature implicating it as a causal agent of food poisoning. In these isolated cases, specific strains were shown to produce a toxin similar to cereulide, the emetic toxin of <it>B. cereus </it><abbrgrp><abbr bid="B35">35</abbr></abbrgrp>. Cereulide is a cyclic depsipeptide synthesized non-ribosomally <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>. Importantly, the only non-ribosomal peptide synthase genes found in the <it>B. licheniformis </it>ATCC 14580 genome are those that involved in synthesis of lichenysin. Similarly, we detected no homologs of the <it>B. cereus </it>hemolytic and non-hemolytic enterotoxins (Swiss-Prot accession numbers P80567, P80568, P80172, and P81242).</p>
         <p>In a comparison of the genotypic and phenotypic characteristics among 182 soil isolates of <it>B. licheniformis</it>, Manachini <it>et al. </it><abbrgrp><abbr bid="B37">37</abbr></abbrgrp> observed that while this bacterial species appears to be phenotypically homogeneous, clear genotypic differences are evident between isolates. They postulated the existence of three genomovars for <it>B. licheniformis</it>. Similarly, De Clerck and De Vos <abbrgrp><abbr bid="B38">38</abbr></abbrgrp> proposed that this species consists of two lineages that can be distinguished using several molecular genotyping methods. The genome sequence data presented in this work should provide a solid foundation on which to conduct future studies to elucidate the genotypic variation among <it>B. licheniformis </it>isolates.</p>
      </sec>
      <sec>
         <st>
            <p>Materials and methods</p>
         </st>
         <sec>
            <st>
               <p>Shotgun DNA sequencing and genome assembly</p>
            </st>
            <p>The genome of <it>B. licheniformis </it>ATCC 14580 was sequenced by a combination of the whole-genome shotgun method <abbrgrp><abbr bid="B39">39</abbr></abbrgrp> and fosmid end sequencing <abbrgrp><abbr bid="B40">40</abbr></abbrgrp>. Plasmid libraries were constructed using randomly sheared and <it>Mbo</it>I-digested genomic DNA that was enriched for fragments of 2-3 kb by preparative agarose gel electrophoresis. Approximately 49,000 random clones were sequenced using dye-terminator chemistry (Applied Biosystems) with ABI 377 and ABI 3700 automated sequencers yielding approximately 6&#215; coverage of the genome. A combination of methods was used for gap closure, including sequencing on fosmids <abbrgrp><abbr bid="B40">40</abbr></abbrgrp> and primer-walking on selected clones and PCR-amplified DNA fragments. We also incorporated data from both ends of approximately 1,975 fosmid clones with an average insert size of 40 kb to aid in validating the final assembly. In total, the number of input reads was 62,685, with 78.6% of these incorporated into the assembled genome sequence. Individual nucleotides were called using TraceTuner 2.0 (Paracel), and sequence reads were assembled into contigs using the Paracel Genome Assembler using optimized parameters and the quality score set to >20. Phrap, Crossmatch and Consed were used for sequence finishing <abbrgrp><abbr bid="B41">41</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Prediction and annotation of CDSs</p>
            </st>
            <p>Protein-coding regions in the assembled genome sequence were identified using a combination of previously described software tools including EasyGene <abbrgrp><abbr bid="B42">42</abbr></abbrgrp>, Glimmer <abbrgrp><abbr bid="B43">43</abbr></abbrgrp> and FrameD <abbrgrp><abbr bid="B44">44</abbr></abbrgrp>. EasyGene was used as the primary gene finder in these studies. It searches for protein matches in the raw genome data to derive a good training set, and an HMM with states for coding regions as well as ribosome-binding sites (RBSs) is estimated from the dataset. This HMM is used to score all the predicted CDSs in the genome, and the score is converted to a measure of significance (R-value) which is the expected number of CDSs that would be predicted in 1 Mb of random DNA. Gene models with R-values lower than 10 and a log-odds score of greater than -10 were included/considered significant. The principal advantage of this significance measure is that it properly takes into account the length distribution of random CDSs. EasyGene has been shown to match or exceed other gene finders currently available <abbrgrp><abbr bid="B42">42</abbr></abbrgrp>. Glimmer was used as a secondary gene finder to aid in identification of small genes (&lt; 100 bp) that were sometimes missed by EasyGene. Glimmer models were post-processed with RBSFINDER <abbrgrp><abbr bid="B45">45</abbr></abbrgrp> to pinpoint the positions of start codons by searching for consensus Shine-Dalgarno sequences. According to the RBS states in the EasyGene HMM model, the bases with the highest probability were AA<b>AAGGAG </b>(the bases in bold type had distinctly higher probabilities compared to the initial AA). This motif concurs with the consensus Shine-Dalgarno sequence for <it>B. subtilis </it>(AAAGGAGG) <abbrgrp><abbr bid="B46">46</abbr></abbrgrp>. RBSFINDER identified the core AAGGAG motif in around 80% of the cases for Glimmer gene predictions and adjusted the start codon accordingly. Manual inspection and alignments to <it>B. subtilis </it>homologs were also used to determine the incidence of specific genes. During the gene-finding process, possible errors and frameshifts were detected by both visual inspection of the CDSs to look for interrupted or truncated genes and by deploying FrameD software <abbrgrp><abbr bid="B44">44</abbr></abbrgrp>. Frameshifts were resolved by re-sequencing of PCR-amplified segments or subclones. After re-sequencing and manual editing a total of 27 frameshifts remain in the genome assembly (excluding those contained in the <it>IS3Bli1 </it>elements). It is not known at present whether these represent pseudogenes or instances of programmed translational frameshifting. The positions of rRNA operons in the genome assembly were confirmed by long-range PCR amplification using primers that annealed to genes flanking the rRNA genes. These PCR fragments were sequenced to high redundancy and the consensus sequences were manually inserted into the assembly. Among the seven rRNA operons, the nucleotide sequences of 16S and 23S genes are at least 99% identical, differing by only one to three nucleotides in pairwise comparisons. Protein-coding sequences were annotated in an automated fashion with the following software applications. Predicted proteins were compared to the nonredundant database PIR-NREF <abbrgrp><abbr bid="B47">47</abbr></abbrgrp> and the <it>B. subtilis </it>genome <abbrgrp><abbr bid="B48">48</abbr></abbrgrp> using BLASTP with a E-value threshold of 1 &#215; 10<sup>-5</sup>. InterProScan was used to predict putative function <abbrgrp><abbr bid="B49">49</abbr></abbrgrp>. The InterPro analysis included comparison to PFAM <abbrgrp><abbr bid="B50">50</abbr></abbrgrp>, TIGRFAM <abbrgrp><abbr bid="B51">51</abbr></abbrgrp>, Interpro <abbrgrp><abbr bid="B52">52</abbr></abbrgrp> signal peptide prediction using SignalP <abbrgrp><abbr bid="B20">20</abbr></abbrgrp> and transmembrane domain prediction using TMHMM <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>. These CDSs were assigned to functional categories based on the Cluster of Orthologous Groups (COG) database <abbrgrp><abbr bid="B53">53</abbr></abbrgrp> with manual verification as described <abbrgrp><abbr bid="B54">54</abbr><abbr bid="B55">55</abbr></abbrgrp>. Phage gene boundaries were predicted using gene finding algorithms and by homology to known bacteriophage genes. Transfer RNA genes were identified using tRNAscan-SE <abbrgrp><abbr bid="B56">56</abbr></abbrgrp>. <it>B. licheniformis </it>genes that shared significant homology with <it>B. subtilis </it>counterparts were named using the nomenclature in the SubtiList database <abbrgrp><abbr bid="B48">48</abbr></abbrgrp> with updated gene names from the BSORF <abbrgrp><abbr bid="B57">57</abbr></abbrgrp> and UniProt <abbrgrp><abbr bid="B58">58</abbr></abbrgrp> databases.</p>
         </sec>
         <sec>
            <st>
               <p>Comparative analyses</p>
            </st>
            <p>VisualGenome software (Rational Genomics) was used for comparisons of ortholog distribution among <it>B. licheniformis</it>, <it>B. subtilis </it>and <it>B. halodurans </it>genomes with precomputed BLAST results stored in a local database.</p>
         </sec>
         <sec>
            <st>
               <p>Accession of genome sequence information</p>
            </st>
            <p>The GenBank accession number for the <it>B. licheniformis </it>ATCC 14580 genome is CP000002. An interactive web portal for viewing and searching the assembled genome based on the generic genome browser developed by Stein <it>et al. </it><abbrgrp><abbr bid="B59">59</abbr></abbrgrp> is available at <abbrgrp><abbr bid="B60">60</abbr></abbrgrp>.</p>
         </sec>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>We thank Alan Sloma, William Widner and Michael D. Thomas for helpful discussions.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <aug>
               <au>
                  <snm>Alexander</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Introduction to Soil Microbiology</source>
            <publisher>New York: John Wiley</publisher>
            <pubdate>1977</pubdate>
         </bibl>
         <bibl id="B2">
            <title>
               <p>The microbial production of industrial chemicals.</p>
            </title>
            <aug>
               <au>
                  <snm>Eveleigh</snm>
                  <fnm>DE</fnm>
               </au>
            </aug>
            <source>Sci Am</source>
            <pubdate>1981</pubdate>
            <volume>245</volume>
            <fpage>155</fpage>
            <lpage>178</lpage>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Industrial applications of the bacilli: a review and prospectus.</p>
            </title>
            <aug>
               <au>
                  <snm>Erickson</snm>
                  <fnm>RJ</fnm>
               </au>
            </aug>
            <source>In Microbiology</source>
            <publisher>Washington: American Society for Microbiology</publisher>
            <editor>Schlesinger D</editor>
            <pubdate>1976</pubdate>
            <fpage>406</fpage>
            <lpage>419</lpage>
         </bibl>
         <bibl id="B4">
            <aug>
               <au>
                  <snm>Gherna</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Pienta</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Cote</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>American Type Culture Collection Catalogue of Bacteria and Phages</source>
            <publisher>Rockville: American Type Culture Collection</publisher>
            <pubdate>1989</pubdate>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Novel microbial technologies for the enhancement of plant growth and biocontrol of fungal diseases in crops.</p>
            </title>
            <aug>
               <au>
                  <snm>Neyra</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Atkinson</snm>
                  <fnm>LA</fnm>
               </au>
               <au>
                  <snm>Olubayi</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Sadasivan</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Zaurov</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Zappi</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>Cahiers Opt M&#233;d</source>
            <pubdate>1996</pubdate>
            <volume>31</volume>
            <fpage>447</fpage>
            <lpage>456</lpage>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Classification and identification of the genus <it>Bacillus </it>using API tests.</p>
            </title>
            <aug>
               <au>
                  <snm>Logan</snm>
                  <fnm>NA</fnm>
               </au>
               <au>
                  <snm>Berkeley</snm>
                  <fnm>RCW</fnm>
               </au>
            </aug>
            <source>In The Aerobic Endospore-Forming Bacteria: Classification and Identification</source>
            <publisher>London: Academic Press</publisher>
            <editor>Berkeley RCW, Goodfellow M</editor>
            <pubdate>1981</pubdate>
            <fpage>106</fpage>
            <lpage>140</lpage>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Characterization of <it>Bacillus subtilis</it>, <it>Bacillus pumilus</it>, <it>Bacillus licheniformis</it>, and <it>Bacillus amyloliquefaciens </it>by pyrolysis gas-liquid chromatography, deoxyribonucleic acid - deoxyribonucleic acid hybridization, biochemical tests, and API systems.</p>
            </title>
            <aug>
               <au>
                  <snm>O'Donnell</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Norris</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Berkeley</snm>
                  <fnm>RCW</fnm>
               </au>
               <au>
                  <snm>Claus</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Kanero</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Logan</snm>
                  <fnm>NA</fnm>
               </au>
               <au>
                  <snm>Nozaki</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Int J Syst Bacteriol</source>
            <pubdate>1980</pubdate>
            <volume>30</volume>
            <fpage>448</fpage>
            <lpage>459</lpage>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Phylogenetic relationships between <it>Bacillus </it>species and related genera inferred from comparison of 3' end 16S rDNA and 5' end 16S-23S ITS nucleotide sequences.</p>
            </title>
            <aug>
               <au>
                  <snm>Xu</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>C&#244;t&#233;</snm>
                  <fnm>JC</fnm>
               </au>
            </aug>
            <source>Int J Syst Evol Microbiol</source>
            <pubdate>2003</pubdate>
            <volume>53</volume>
            <fpage>695</fpage>
            <lpage>704</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1099/ijs.0.02346-0</pubid>
                  <pubid idtype="pmpid" link="fulltext">12807189</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Co-linear scaffold of the <it>Bacillus licheniformis </it>and <it>Bacillus subtilis </it>genomes and its use to compare their competence genes.</p>
            </title>
            <aug>
               <au>
                  <snm>Lapidus</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Galleron</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Andersen</snm>
                  <fnm>JT</fnm>
               </au>
               <au>
                  <snm>J&#248;rgensen</snm>
                  <fnm>PL</fnm>
               </au>
               <au>
                  <snm>Ehrlich</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Sorokin</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>FEMS Microbiol Lett</source>
            <pubdate>2002</pubdate>
            <volume>209</volume>
            <fpage>23</fpage>
            <lpage>30</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0378-1097(02)00486-X</pubid>
                  <pubid idtype="pmpid" link="fulltext">12007649</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>The complete genome sequence of the gram-positive bacterium <it>Bacillus subtilis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Kunst</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Ogasawara</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Mozser</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Albertini</snm>
                  <fnm>AM</fnm>
               </au>
               <au>
                  <snm>Alloni</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Azebedo</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Bertero</snm>
                  <fnm>MG</fnm>
               </au>
               <au>
                  <snm>Bessieres</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Bolotin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Borchert</snm>
                  <fnm>S</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>1997</pubdate>
            <volume>390</volume>
            <fpage>249</fpage>
            <lpage>256</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/36786</pubid>
                  <pubid idtype="pmpid" link="fulltext">9384377</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>DnaA boxes are important elements in setting the initiation mass of <it>Escherichia coli</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Christensen</snm>
                  <fnm>BB</fnm>
               </au>
               <au>
                  <snm>Atlung</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Hansen</snm>
                  <fnm>FG</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1999</pubdate>
            <volume>181</volume>
            <fpage>2683</fpage>
            <lpage>2688</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">93705</pubid>
                  <pubid idtype="pmpid" link="fulltext">10217754</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Interactions of the <it>Streptomyces lividans </it>initiator protein DnaA with its target.</p>
            </title>
            <aug>
               <au>
                  <snm>Majka</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Jakimowicz</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Messer</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Schrempf</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Lisowski</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Zakrzewska-Czerwi&#241;ska</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Eur J Biochem</source>
            <pubdate>1999</pubdate>
            <volume>260</volume>
            <fpage>325</fpage>
            <lpage>335</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1046/j.1432-1327.1999.00168.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">10095766</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Complete genome sequence of the alkaliphilic bacterium <it>Bacillus halodurans </it>and genomic sequence comparison with <it>Bacillus subtilis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Takami</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Nakasone</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Takaki</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Maeno</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Sasaki</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Masui</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Fuji</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Hirama</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Nakamura</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Ogasawara</snm>
                  <fnm>N</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2000</pubdate>
            <volume>28</volume>
            <fpage>4317</fpage>
            <lpage>4331</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">113120</pubid>
                  <pubid idtype="pmpid" link="fulltext">11058132</pubid>
                  <pubid idtype="doi">10.1093/nar/28.21.4317</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Programmed translational frameshifting.</p>
            </title>
            <aug>
               <au>
                  <snm>Farabaugh</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Microbiol Rev</source>
            <pubdate>1996</pubdate>
            <volume>60</volume>
            <fpage>103</fpage>
            <lpage>134</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">239420</pubid>
                  <pubid idtype="pmpid">8852897</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>A complete sequence of the <it>T. tengcongensis </it>genome.</p>
            </title>
            <aug>
               <au>
                  <snm>Bao</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Tian</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Xuan</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Hu</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Dong</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Xue</snm>
                  <fnm>Y</fnm>
               </au>
               <etal/>
            </aug>
            <source>Genome Res</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <fpage>689</fpage>
            <lpage>700</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">186588</pubid>
                  <pubid idtype="pmpid" link="fulltext">11997336</pubid>
                  <pubid idtype="doi">10.1101/gr.219302</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Genome sequence of <it>Oceanobacillus iheyensis </it>isolated from the Iheya Ridge and its unexpected adaptive capabilities to extreme environments.</p>
            </title>
            <aug>
               <au>
                  <snm>Takami</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Takaki</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Uchiyama</snm>
                  <fnm>I</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2002</pubdate>
            <volume>30</volume>
            <fpage>3927</fpage>
            <lpage>3935</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">137110</pubid>
                  <pubid idtype="pmpid" link="fulltext">12235376</pubid>
                  <pubid idtype="doi">10.1093/nar/gkf526</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Correlation of phylogenetic lineages of group B streptococci, identified by analysis of restriction-digestion patterns of genomic DNA, with <it>infB </it>alleles and mobile genetic elements.</p>
            </title>
            <aug>
               <au>
                  <snm>Takahashi</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Detrick</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Whiting</snm>
                  <fnm>AA</fnm>
               </au>
               <au>
                  <snm>Blaschke-Bonkowksy</snm>
                  <fnm>AJ</fnm>
               </au>
               <au>
                  <snm>Aoyagi</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Adderson</snm>
                  <fnm>EE</fnm>
               </au>
               <au>
                  <snm>Bohnsack</snm>
                  <fnm>JF</fnm>
               </au>
            </aug>
            <source>J Infect Dis</source>
            <pubdate>2002</pubdate>
            <volume>186</volume>
            <fpage>1034</fpage>
            <lpage>1038</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1086/342950</pubid>
                  <pubid idtype="pmpid" link="fulltext">12232847</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Genome sequence and comparative microarray analysis of serotype M18 group A <it>Streptococcus </it>strains associated with acute rheumatic fever outbreaks.</p>
            </title>
            <aug>
               <au>
                  <snm>Smoot</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Barbian</snm>
                  <fnm>KD</fnm>
               </au>
               <au>
                  <snm>Van Gompel</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Smoot</snm>
                  <fnm>LM</fnm>
               </au>
               <au>
                  <snm>Chaussee</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Sylva</snm>
                  <fnm>GL</fnm>
               </au>
               <au>
                  <snm>Sturdevant</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Ricklefs</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Porcella</snm>
                  <fnm>SF</fnm>
               </au>
               <au>
                  <snm>Parkins</snm>
                  <fnm>LD</fnm>
               </au>
               <etal/>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2002</pubdate>
            <volume>99</volume>
            <fpage>4668</fpage>
            <lpage>4673</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">123705</pubid>
                  <pubid idtype="pmpid" link="fulltext">11917108</pubid>
                  <pubid idtype="doi">10.1073/pnas.062526099</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Prophages and bacterial genomics: What have we learned so far?</p>
            </title>
            <aug>
               <au>
                  <snm>Casjens</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>2003</pubdate>
            <volume>49</volume>
            <fpage>277</fpage>
            <lpage>300</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1046/j.1365-2958.2003.03580.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">12886937</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Identification of prokaryotic and eukaryotic signal peptides and prediction of their cleavage sites.</p>
            </title>
            <aug>
               <au>
                  <snm>Nielsen</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Engelbrecht</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Brunak</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>von Heijne</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Protein Eng</source>
            <pubdate>1997</pubdate>
            <volume>10</volume>
            <fpage>1</fpage>
            <lpage>6</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">9051728</pubid>
                  <pubid idtype="doi">10.1093/protein/10.1.1</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>Predicting transmembrane protein topology with a hidden Markov model: application to complete genomes.</p>
            </title>
            <aug>
               <au>
                  <snm>Krogh</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Larsson</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>von Heijne</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Sonnhammer</snm>
                  <fnm>ELL</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>2000</pubdate>
            <volume>305</volume>
            <fpage>567</fpage>
            <lpage>580</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1006/jmbi.2000.4315</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <aug>
               <au>
                  <snm>Sonnenshein</snm>
                  <fnm>AL</fnm>
               </au>
            </aug>
            <source>Bacillus subtilis and Other Gram-Positive Bacteria: Biochemistry, Physiology, and Molecular Genetics</source>
            <publisher>Washington: American Society for Microbiology</publisher>
            <pubdate>1993</pubdate>
         </bibl>
         <bibl id="B23">
            <title>
               <p>Cyclic-imide hydrolyzing activity of D-hydantoinase from <it>Blastobacter </it>sp. Strain A17p-4.</p>
            </title>
            <aug>
               <au>
                  <snm>Soong</snm>
                  <fnm>CL</fnm>
               </au>
               <au>
                  <snm>Ogawa</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Honda</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Shimizu</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Appl Environ Microbiol</source>
            <pubdate>1999</pubdate>
            <volume>65</volume>
            <fpage>1459</fpage>
            <lpage>1462</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10103237</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Transformation of <it>Bacillus licheniformis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Gwinn</snm>
                  <fnm>DD</fnm>
               </au>
               <au>
                  <snm>Thorne</snm>
                  <fnm>CB</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1964</pubdate>
            <volume>87</volume>
            <fpage>519</fpage>
            <lpage>526</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">277048</pubid>
                  <pubid idtype="pmpid">14127566</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>Factors affecting transformation of <it>Bacillus licheniformis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Thorne</snm>
                  <fnm>CB</fnm>
               </au>
               <au>
                  <snm>Stull</snm>
                  <fnm>HB</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1966</pubdate>
            <volume>91</volume>
            <fpage>1012</fpage>
            <lpage>1020</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">315992</pubid>
                  <pubid idtype="pmpid">5929742</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>The peptide antibiotics of <it>Bacillus</it>: chemistry, biogenesis, and possible functions.</p>
            </title>
            <aug>
               <au>
                  <snm>Katz</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Demain</snm>
                  <fnm>AL</fnm>
               </au>
            </aug>
            <source>Bacteriol Rev</source>
            <pubdate>1977</pubdate>
            <volume>41</volume>
            <fpage>449</fpage>
            <lpage>474</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">414008</pubid>
                  <pubid idtype="pmpid">70202</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>Distribution and variation of bacitracin synthetase gene sequences in laboratory stock strains of <it>Bacillus licheniformis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Ishihara</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Takoh</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Nishibayashi</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Sato</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Curr Microbiol</source>
            <pubdate>2002</pubdate>
            <volume>45</volume>
            <fpage>18</fpage>
            <lpage>23</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/s00284-001-0041-5</pubid>
                  <pubid idtype="pmpid" link="fulltext">12029522</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Lichenysin - a more efficient cation chelator than surfactin.</p>
            </title>
            <aug>
               <au>
                  <snm>Grangemard</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Wallach</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Maget-Dana</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Peypoux</snm>
                  <fnm>F</fnm>
               </au>
            </aug>
            <source>Appl Biochem Biotechnol</source>
            <pubdate>2001</pubdate>
            <volume>90</volume>
            <fpage>199</fpage>
            <lpage>210</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1385/ABAB:90:3:199</pubid>
                  <pubid idtype="pmpid" link="fulltext">11318033</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Genome engineering reveals large dispensable regions in <it>Bacillus subtilis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Westers</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Dorenbos</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>van Dijl</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Kable</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Flanagan</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Devine</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Jude</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>S&#233;ror</snm>
                  <fnm>SJ</fnm>
               </au>
               <au>
                  <snm>Beekman</snm>
                  <fnm>AC</fnm>
               </au>
               <au>
                  <snm>Darmon</snm>
                  <fnm>E</fnm>
               </au>
               <etal/>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2003</pubdate>
            <volume>20</volume>
            <fpage>2076</fpage>
            <lpage>2090</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msg219</pubid>
                  <pubid idtype="pmpid" link="fulltext">12949151</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Biosynthesis of the lantibiotic mersacidin: organization of a type B lantibiotic gene cluster.</p>
            </title>
            <aug>
               <au>
                  <snm>Altena</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Guder</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Cramer</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Bierbaum</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Appl Environ Microbiol</source>
            <pubdate>2000</pubdate>
            <volume>66</volume>
            <fpage>2565</fpage>
            <lpage>2571</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">110582</pubid>
                  <pubid idtype="pmpid" link="fulltext">10831439</pubid>
                  <pubid idtype="doi">10.1128/AEM.66.6.2565-2571.2000</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Multiple activities in lantibiotics - models for the design of novel antibiotics?</p>
            </title>
            <aug>
               <au>
                  <snm>Pag</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Sahl</snm>
                  <fnm>HG</fnm>
               </au>
            </aug>
            <source>Curr Pharm Des</source>
            <pubdate>2002</pubdate>
            <volume>8</volume>
            <fpage>815</fpage>
            <lpage>833</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.2174/1381612023395439</pubid>
                  <pubid idtype="pmpid" link="fulltext">11945173</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Combination of antibiotic mechanisms in lantibiotics.</p>
            </title>
            <aug>
               <au>
                  <snm>Hoffmann</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Pag</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Wiedemann</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Sahl</snm>
                  <fnm>HG</fnm>
               </au>
            </aug>
            <source>Farmaco</source>
            <pubdate>2002</pubdate>
            <volume>57</volume>
            <fpage>685</fpage>
            <lpage>691</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0014-827X(02)01208-9</pubid>
                  <pubid idtype="pmpid">12361237</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>Essential genes in <it>Bacillus subtilis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Kobayashi</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Ehrlich</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Albertini</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Amati</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Andersen</snm>
                  <fnm>KK</fnm>
               </au>
               <au>
                  <snm>Arnaud</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Asai</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Ashikaga</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Aymerch</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Bessieres</snm>
                  <fnm>P</fnm>
               </au>
               <etal/>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2003</pubdate>
            <volume>100</volume>
            <fpage>4678</fpage>
            <lpage>4683</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">153615</pubid>
                  <pubid idtype="pmpid" link="fulltext">12682299</pubid>
                  <pubid idtype="doi">10.1073/pnas.0730515100</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p>Cytotoxic potential of industrial strains of <it>Bacillus </it>sp.</p>
            </title>
            <aug>
               <au>
                  <snm>Pedersen</snm>
                  <fnm>PB</fnm>
               </au>
               <au>
                  <snm>Bj&#248;rnvad</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Rasmussen</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Petersen</snm>
                  <fnm>JN</fnm>
               </au>
            </aug>
            <source>Regul Toxicol Pharmacol</source>
            <pubdate>2002</pubdate>
            <volume>36</volume>
            <fpage>155</fpage>
            <lpage>161</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">12460750</pubid>
                  <pubid idtype="doi">10.1006/rtph.2002.1574</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>Toxigenic strains of <it>Bacillus licheniformis </it>related to food poisoning.</p>
            </title>
            <aug>
               <au>
                  <snm>Salkinoja-Salonen</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Vuorio</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Andersson</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>K&#228;mpfer</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Andersson</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Honkanen-Buzalski</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Scoging</snm>
                  <fnm>AC</fnm>
               </au>
            </aug>
            <source>Appl Environ Microbiol</source>
            <pubdate>1999</pubdate>
            <volume>65</volume>
            <fpage>4637</fpage>
            <lpage>4645</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">91618</pubid>
                  <pubid idtype="pmpid" link="fulltext">10508100</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>Identification and molecular characterization of the genetic locus for biosynthesis of the emetic toxin, cereulide, of <it>Bacillus cereus</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Agata</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Ohta</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Abstr Ann Meeting Am Soc Microbiol</source>
            <pubdate>2002</pubdate>
            <volume>102</volume>
            <fpage>374</fpage>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Contribution to phenotypic and genotypic characterization of <it>Bacillus licheniformis </it>and description of new genomovars.</p>
            </title>
            <aug>
               <au>
                  <snm>Manachini</snm>
                  <fnm>PL</fnm>
               </au>
               <au>
                  <snm>Fortina</snm>
                  <fnm>MG</fnm>
               </au>
               <au>
                  <snm>Levati</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Parini</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Syst Appl Microbiol</source>
            <pubdate>1998</pubdate>
            <volume>21</volume>
            <fpage>520</fpage>
            <lpage>529</lpage>
            <xrefbib>
               <pubid idtype="pmpid">9924820</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>Genotypic diversity among <it>Bacillus licheniformis </it>strains from various sources.</p>
            </title>
            <aug>
               <au>
                  <snm>De Clerck</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>De Vos</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>FEMS Microbiol Lett</source>
            <pubdate>2004</pubdate>
            <volume>231</volume>
            <fpage>91</fpage>
            <lpage>98</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0378-1097(03)00935-2</pubid>
                  <pubid idtype="pmpid" link="fulltext">14769472</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>Shotgun sequencing.</p>
            </title>
            <aug>
               <au>
                  <snm>Wilson</snm>
                  <fnm>RK</fnm>
               </au>
               <au>
                  <snm>Mardis</snm>
                  <fnm>ER</fnm>
               </au>
            </aug>
            <source>In Genome Analysis: A Laboratory Manual</source>
            <publisher>Cold Spring Harbor: Cold Spring Harbor Press</publisher>
            <editor>Birren B, Green ED, Meyers RM, Roskams J</editor>
            <pubdate>1997</pubdate>
            <volume>1</volume>
            <fpage>397</fpage>
            <lpage>454</lpage>
         </bibl>
         <bibl id="B40">
            <title>
               <p>Stable propagation of cosmid sized human DNA inserts in an F factor based vector.</p>
            </title>
            <aug>
               <au>
                  <snm>Kim</snm>
                  <fnm>UJ</fnm>
               </au>
               <au>
                  <snm>Shizuya</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>de Jong</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Birren</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Simon</snm>
                  <fnm>MI</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1992</pubdate>
            <volume>20</volume>
            <fpage>1083</fpage>
            <lpage>1085</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">312094</pubid>
                  <pubid idtype="pmpid">1549470</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>Phred, Phrap, and Consed</p>
            </title>
            <url>http://www.phrap.org/phredphrapconsed.html</url>
         </bibl>
         <bibl id="B42">
            <title>
               <p>EasyGene - a prokaryotic gene finder that ranks ORFs by statistical significance.</p>
            </title>
            <aug>
               <au>
                  <snm>Larsen</snm>
                  <fnm>TS</fnm>
               </au>
               <au>
                  <snm>Krogh</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2003</pubdate>
            <volume>4</volume>
            <fpage>21</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1186/1471-2105-4-21</pubid>
                  <pubid idtype="pmpid" link="fulltext">12783628</pubid>
                  <pubid idtype="pmcid">521197</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B43">
            <title>
               <p>Improved microbial gene identification with GLIMMER.</p>
            </title>
            <aug>
               <au>
                  <snm>Delcher</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Harmon</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Kasif</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1999</pubdate>
            <volume>27</volume>
            <fpage>4636</fpage>
            <lpage>4641</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">148753</pubid>
                  <pubid idtype="pmpid" link="fulltext">10556321</pubid>
                  <pubid idtype="doi">10.1093/nar/27.23.4636</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B44">
            <title>
               <p>FrameD: a flexible program for quality check and gene prediction in prokaryotic genomes and noisy matured eukaryotic sequences.</p>
            </title>
            <aug>
               <au>
                  <snm>Schiex</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Gouzy</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Moisan</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>de Oliveira</snm>
                  <fnm>Y</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2003</pubdate>
            <volume>31</volume>
            <fpage>3738</fpage>
            <lpage>3741</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">169016</pubid>
                  <pubid idtype="pmpid" link="fulltext">12824407</pubid>
                  <pubid idtype="doi">10.1093/nar/gkg610</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>A probabilistic, method for identifying start codons in bacterial genomes.</p>
            </title>
            <aug>
               <au>
                  <snm>Suzek</snm>
                  <fnm>BE</fnm>
               </au>
               <au>
                  <snm>Ermolaeva</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Schreiber</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2001</pubdate>
            <volume>17</volume>
            <fpage>1123</fpage>
            <lpage>1130</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/17.12.1123</pubid>
                  <pubid idtype="pmpid" link="fulltext">11751220</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B46">
            <title>
               <p>Translation in <it>Bacillus subtilis</it>: roles and trends of initiation and termination, insights from a genome analysis.</p>
            </title>
            <aug>
               <au>
                  <snm>Rocha</snm>
                  <fnm>EPC</fnm>
               </au>
               <au>
                  <snm>Danchin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Viari</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1999</pubdate>
            <volume>27</volume>
            <fpage>3567</fpage>
            <lpage>3576</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">148602</pubid>
                  <pubid idtype="pmpid" link="fulltext">10446248</pubid>
                  <pubid idtype="doi">10.1093/nar/27.17.3567</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B47">
            <title>
               <p>The Protein Information Resource: an integrated public resource of functional annotation of proteins.</p>
            </title>
            <aug>
               <au>
                  <snm>Wu</snm>
                  <fnm>CH</fnm>
               </au>
               <au>
                  <snm>Huang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Arminski</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Castro-Alvear</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Hu</snm>
                  <fnm>ZZ</fnm>
               </au>
               <au>
                  <snm>Ledley</snm>
                  <fnm>RS</fnm>
               </au>
               <au>
                  <snm>Lewis</snm>
                  <fnm>KC</fnm>
               </au>
               <au>
                  <snm>Mewes</snm>
                  <fnm>HW</fnm>
               </au>
               <au>
                  <snm>Orcutt</snm>
                  <fnm>BC</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2002</pubdate>
            <volume>30</volume>
            <fpage>35</fpage>
            <lpage>37</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">99125</pubid>
                  <pubid idtype="pmpid" link="fulltext">11752247</pubid>
                  <pubid idtype="doi">10.1093/nar/30.1.35</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B48">
            <title>
               <p>SubtiList</p>
            </title>
            <url>http://genolist.pasteur.fr/SubtiList/genome.cgi</url>
         </bibl>
         <bibl id="B49">
            <title>
               <p>InterProScan - an integration platform for the signature-recognition methods in InterPro.</p>
            </title>
            <aug>
               <au>
                  <snm>Zdobnov</snm>
                  <fnm>EM</fnm>
               </au>
               <au>
                  <snm>Apweiler</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2001</pubdate>
            <volume>17</volume>
            <fpage>847</fpage>
            <lpage>848</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/17.9.847</pubid>
                  <pubid idtype="pmpid" link="fulltext">11590104</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B50">
            <title>
               <p>The Pfam protein families database.</p>
            </title>
            <aug>
               <au>
                  <snm>Bateman</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Coin</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Durbin</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Finn</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Hollich</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Griffiths-Jones</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Khanna</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Sonnhammer</snm>
                  <fnm>EL</fnm>
               </au>
               <au>
                  <snm>Studholme</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Yeats</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Eddy</snm>
                  <fnm>SR</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2004</pubdate>
            <volume>32 Database issue</volume>
            <fpage>D138</fpage>
            <lpage>D141</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid" link="fulltext">14681378</pubid>
                  <pubid idtype="doi">10.1093/nar/gkh121</pubid>
                  <pubid idtype="pmcid">308855</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B51">
            <title>
               <p>The TIGRFAMs database of protein families.</p>
            </title>
            <aug>
               <au>
                  <snm>Haft</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Selengut</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>O</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2003</pubdate>
            <volume>31</volume>
            <fpage>371</fpage>
            <lpage>373</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">165575</pubid>
                  <pubid idtype="pmpid" link="fulltext">12520025</pubid>
                  <pubid idtype="doi">10.1093/nar/gkg128</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B52">
            <title>
               <p>The InterPro database, an integrated documentation resource for protein families, domains and functional sites.</p>
            </title>
            <aug>
               <au>
                  <snm>Apweiler</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Attwood</snm>
                  <fnm>TK</fnm>
               </au>
               <au>
                  <snm>Bairock</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Bateman</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Birney</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Biswas</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Bucher</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Cerutti</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Corpet</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Croning</snm>
                  <fnm>MD</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2001</pubdate>
            <volume>29</volume>
            <fpage>37</fpage>
            <lpage>40</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">29841</pubid>
                  <pubid idtype="pmpid" link="fulltext">11125043</pubid>
                  <pubid idtype="doi">10.1093/nar/29.1.37</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B53">
            <title>
               <p>COG</p>
            </title>
            <url>http://www.ncbi.nlm.nih.gov/COG</url>
         </bibl>
         <bibl id="B54">
            <title>
               <p>A genomic perspective on protein families.</p>
            </title>
            <aug>
               <au>
                  <snm>Tatusov</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Koonin</snm>
                  <fnm>EV</fnm>
               </au>
               <au>
                  <snm>Lipman</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>1997</pubdate>
            <volume>278</volume>
            <fpage>631</fpage>
            <lpage>637</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.278.5338.631</pubid>
                  <pubid idtype="pmpid" link="fulltext">9381173</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B55">
            <aug>
               <au>
                  <snm>Koonin</snm>
                  <fnm>EV</fnm>
               </au>
               <au>
                  <snm>Galperin</snm>
                  <fnm>MY</fnm>
               </au>
            </aug>
            <source>Sequence - Evolution - Function: Computational Approaches in Comparative Genomics</source>
            <publisher>Boston: Kluwer</publisher>
            <pubdate>2002</pubdate>
         </bibl>
         <bibl id="B56">
            <title>
               <p>tRNAscan-SE: a program for improved detection of transfer RNA genes in genomic sequence.</p>
            </title>
            <aug>
               <au>
                  <snm>Lowe</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>Eddy</snm>
                  <fnm>SR</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1997</pubdate>
            <volume>25</volume>
            <fpage>955</fpage>
            <lpage>964</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">146525</pubid>
                  <pubid idtype="pmpid" link="fulltext">9023104</pubid>
                  <pubid idtype="doi">10.1093/nar/25.5.955</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B57">
            <title>
               <p>BSORF top page</p>
            </title>
            <url>http://bacillus.genome.jp</url>
         </bibl>
         <bibl id="B58">
            <title>
               <p>bacsu</p>
            </title>
            <url>http://www.expasy.org/cgi-bin/lists?bacsu.txt</url>
         </bibl>
         <bibl id="B59">
            <title>
               <p>The generic genome browser: a building block for a model organism system database.</p>
            </title>
            <aug>
               <au>
                  <snm>Stein</snm>
                  <fnm>LD</fnm>
               </au>
               <au>
                  <snm>Mungall</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Shu</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Caudy</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Mangone</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Day</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Nickerson</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Stajich</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Harris</snm>
                  <fnm>TW</fnm>
               </au>
               <au>
                  <snm>Arva</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lewis</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <fpage>1599</fpage>
            <lpage>1610</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">187535</pubid>
                  <pubid idtype="pmpid" link="fulltext">12368253</pubid>
                  <pubid idtype="doi">10.1101/gr.403602</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B60">
            <title>
               <p>BACSAP home</p>
            </title>
            <url>http://63.198.8.200</url>
         </bibl>
         <bibl id="B61">
            <title>
               <p>The genome sequence of <it>Bacillus anthracis </it>Ames and comparison to closely related bacteria.</p>
            </title>
            <aug>
               <au>
                  <snm>Read</snm>
                  <fnm>TD</fnm>
               </au>
               <au>
                  <snm>Peterson</snm>
                  <fnm>SN</fnm>
               </au>
               <au>
                  <snm>Tourasse</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Baillie</snm>
                  <fnm>LW</fnm>
               </au>
               <au>
                  <snm>Paulsen</snm>
                  <fnm>IT</fnm>
               </au>
               <au>
                  <snm>Nelson</snm>
                  <fnm>KE</fnm>
               </au>
               <au>
                  <snm>Tettelin</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Fouts</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Eisen</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Gill</snm>
                  <fnm>SR</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>2003</pubdate>
            <volume>423</volume>
            <fpage>81</fpage>
            <lpage>86</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature01586</pubid>
                  <pubid idtype="pmpid" link="fulltext">12721629</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B62">
            <title>
               <p>Genome sequence of <it>Bacillus cereus </it>and comparative analysis with <it>Bacillus anthracis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Ivanova</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Sorokin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Anderson</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Galleron</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Candelon</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Kapatral</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Bhattacharyya</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Reznik</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Mikhailova</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Lapidus</snm>
                  <fnm>A</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>2003</pubdate>
            <volume>423</volume>
            <fpage>87</fpage>
            <lpage>91</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature01582</pubid>
                  <pubid idtype="pmpid" link="fulltext">12721630</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>
