<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1471-2164-9-271</ui>
   <ji>1471-2164</ji>
   <fm>
      <dochead>Research article</dochead>
      <bibl>
         <title>
            <p>The genome of the versatile nitrogen fixer <it>Azorhizobium caulinodans </it>ORS571</p>
         </title>
         <aug>
            <au id="A1" ce="yes">
               <snm>Lee</snm>
               <fnm>Kyung-Bum</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>kyulee@genes.nig.ac.jp</email>
            </au>
            <au id="A2" ce="yes">
               <snm>De Backer</snm>
               <fnm>Philippe</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>phbac@psb.ugent.be</email>
            </au>
            <au id="A3">
               <snm>Aono</snm>
               <fnm>Toshihiro</fnm>
               <insr iid="I1"/>
               <email>uaono@mail.ecc.u-tokyo.ac.jp</email>
            </au>
            <au id="A4">
               <snm>Liu</snm>
               <fnm>Chi-Te</fnm>
               <insr iid="I1"/>
               <email>aericliu@mail.ecc.u-tokyo.ac.jp</email>
            </au>
            <au id="A5">
               <snm>Suzuki</snm>
               <fnm>Shino</fnm>
               <insr iid="I1"/>
               <email>ushino@mail.ecc.u-tokyo.ac.jp</email>
            </au>
            <au id="A6">
               <snm>Suzuki</snm>
               <fnm>Tadahiro</fnm>
               <insr iid="I1"/>
               <email>taboengine@yahoo.co.jp</email>
            </au>
            <au id="A7">
               <snm>Kaneko</snm>
               <fnm>Takakazu</fnm>
               <insr iid="I5"/>
               <email>kaneko@kazusa.or.jp</email>
            </au>
            <au id="A8">
               <snm>Yamada</snm>
               <fnm>Manabu</fnm>
               <insr iid="I5"/>
               <email>myamada@kazusa.or.jp</email>
            </au>
            <au id="A9">
               <snm>Tabata</snm>
               <fnm>Satoshi</fnm>
               <insr iid="I5"/>
               <email>tabata@kazusa.or.jp</email>
            </au>
            <au id="A10">
               <snm>Kupfer</snm>
               <mi>M</mi>
               <fnm>Doris</fnm>
               <insr iid="I6"/>
               <email>doris.kupfer@faa.gov</email>
            </au>
            <au id="A11">
               <snm>Najar</snm>
               <mi>Z</mi>
               <fnm>Fares</fnm>
               <insr iid="I6"/>
               <email>fznajar@ou.edu</email>
            </au>
            <au id="A12">
               <snm>Wiley</snm>
               <mi>B</mi>
               <fnm>Graham</fnm>
               <insr iid="I6"/>
               <email>graham.b.wileyl-1@ou.edu</email>
            </au>
            <au id="A13">
               <snm>Roe</snm>
               <fnm>Bruce</fnm>
               <insr iid="I6"/>
               <email>broe@ou.edu</email>
            </au>
            <au id="A14">
               <snm>Binnewies</snm>
               <mi>T</mi>
               <fnm>Tim</fnm>
               <insr iid="I7"/>
               <email>tim@cbs.dtu.dk</email>
            </au>
            <au id="A15">
               <snm>Ussery</snm>
               <mi>W</mi>
               <fnm>David</fnm>
               <insr iid="I7"/>
               <email>dave@cbs.dtu.dk</email>
            </au>
            <au id="A16">
               <snm>D'Haeze</snm>
               <fnm>Wim</fnm>
               <insr iid="I4"/>
               <email>dhaeze.wim@gmail.com</email>
            </au>
            <au id="A17">
               <snm>Den Herder</snm>
               <fnm>Jeroen</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>jeroendh11@gmail.com</email>
            </au>
            <au id="A18">
               <snm>Gevers</snm>
               <fnm>Dirk</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <insr iid="I8"/>
               <email>digev@mit.edu</email>
            </au>
            <au id="A19">
               <snm>Vereecke</snm>
               <fnm>Danny</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>danny.vereecke@psb.ugent.be</email>
            </au>
            <au id="A20">
               <snm>Holsters</snm>
               <fnm>Marcelle</fnm>
               <insr iid="I3"/>
               <insr iid="I4"/>
               <email>marcelle.holsters@psb.ugent.be</email>
            </au>
            <au id="A21" ca="yes">
               <snm>Oyaizu</snm>
               <fnm>Hiroshi</fnm>
               <insr iid="I1"/>
               <email>aoyaizu@mail.ecc.u-tokyo.ac.jp</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Laboratory of Plant Biotechnology, Biotechnology Research Center, University of Tokyo, Tokyo 113-8657, Japan</p>
            </ins>
            <ins id="I2">
               <p>Center for Information Biology and DNA Data Bank of Japan, National Institute of Genetics, Mishima 411-8540, Japan</p>
            </ins>
            <ins id="I3">
               <p>Department of Plant Systems Biology, Flanders Institute for Biotechnology (VIB), 9052 Gent, Belgium</p>
            </ins>
            <ins id="I4">
               <p>Department of Molecular Genetics, Ghent University, 9052 Gent, Belgium</p>
            </ins>
            <ins id="I5">
               <p>Kazusa DNA Research Institute, Chiba 292-0818, Japan</p>
            </ins>
            <ins id="I6">
               <p>Department of Chemistry and Biochemistry, University of Oklahoma, Norman, OK 73019-3051, USA</p>
            </ins>
            <ins id="I7">
               <p>Center for Biological Sequence Analysis, Technical University of Denmark, 2800 Lyngby, Denmark</p>
            </ins>
            <ins id="I8">
               <p>Department of Civil and Environmental Engineering, Massachusetts Institute of Technology, Cambridge, MA 02139-4307, USA</p>
            </ins>
         </insg>
         <source>BMC Genomics</source>
         <issn>1471-2164</issn>
         <pubdate>2008</pubdate>
         <volume>9</volume>
         <issue>1</issue>
         <fpage>271</fpage>
         <url>http://www.biomedcentral.com/1471-2164/9/271</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">18522759</pubid>
               <pubid idtype="doi">10.1186/1471-2164-9-271</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>28</day>
               <month>1</month>
               <year>2008</year>
            </date>
         </rec>
         <acc>
            <date>
               <day>04</day>
               <month>6</month>
               <year>2008</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>04</day>
               <month>6</month>
               <year>2008</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2008</year>
         <collab>Lee et al; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>Biological nitrogen fixation is a prokaryotic process that plays an essential role in the global nitrogen cycle. <it>Azorhizobium caulinodans </it>ORS571 has the dual capacity to fix nitrogen both as free-living organism and in a symbiotic interaction with <it>Sesbania rostrata</it>. The host is a fast-growing, submergence-tolerant tropical legume on which <it>A. caulinodans </it>can efficiently induce nodule formation on the root system and on adventitious rootlets located on the stem.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>The 5.37-Mb genome consists of a single circular chromosome with an overall average GC of 67% and numerous islands with varying GC contents. Most nodulation functions as well as a putative type-IV secretion system are found in a distinct symbiosis region. The genome contains a plethora of regulatory and transporter genes and many functions possibly involved in contacting a host. It potentially encodes 4717 proteins of which 96.3% have homologs and 3.7% are unique for <it>A. caulinodans</it>. Phylogenetic analyses show that the diazotroph <it>Xanthobacter autotrophicus </it>is the closest relative among the sequenced genomes, but the synteny between both genomes is very poor.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>The genome analysis reveals that <it>A. caulinodans </it>is a diazotroph that acquired the capacity to nodulate most probably through horizontal gene transfer of a complex symbiosis island. The genome contains numerous genes that reflect a strong adaptive and metabolic potential. These combined features and the availability of the annotated genome make <it>A. caulinodans </it>an attractive organism to explore symbiotic biological nitrogen fixation beyond leguminous plants.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>Biological nitrogen fixation is carried out by a limited number of prokaryotes that all possess a nitrogenase enzyme complex that reduces molecular dinitrogen to ammonia. Nitrogen-fixing bacteria can be divided in two major groups: free-living nitrogen fixers or diazotrophs that directly assimilate ammonia for growth and symbiotic nitrogen fixers that pass ammonia to a eukaryotic host and indirectly profit from nitrogen fixation by occupying a particular ecological niche or by supporting the population through better feeding. In the latter group, the symbiosis between leguminous crop plants and rhizobia is of great importance for agriculture. The term "rhizobia" is used for bacteria that induce the formation of new organs, nodules, on the roots of a specific legume host. Inside the nodule, rhizobia are internalized in plant cells where they differentiate into nitrogen-fixing bacteroids [for a recent review on legume nodulation, see <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>].</p>
         <p>Nitrogen-fixing nodules typically occur on roots; however, some members of the subfamilies Papilionoideae (<it>Aeschenomyne </it>sp., <it>Sesbania </it>sp., and <it>Discolobium pulchellum</it>) and Mimosoideae (<it>Neptunia oleracea</it>) form stem-located, aerial nodules <abbrgrp><abbr bid="B2">2</abbr></abbrgrp>. These legumes grow in waterlogged soils of tropical regions and are characterized by dormant, stem-located adventitious root primordia that can develop into stem nodules upon inoculation with an appropriate microbial partner. Although stem and root nodulation are similar, in the latter the nodular vascular system is connected to that of the stem via the vascular bundles of the adventitious root primordium <abbrgrp><abbr bid="B3">3</abbr></abbrgrp>.</p>
         <p>A particularly well-studied case of stem nodulation occurs in <it>Sesbania rostrata </it>Brem. upon inoculation with the microsymbiont <it>Azorhizobium caulinodans </it><abbrgrp><abbr bid="B4">4</abbr></abbrgrp>. <it>S. rostrata</it>, a fast-growing annual shrub from the Sahel region of West-Africa, carries numerous adventitious root primordia that protrude through the stem cortex and epidermis, creating a circular fissure, where bacteria can invade and proliferate <abbrgrp><abbr bid="B5">5</abbr></abbrgrp>. The growth properties and the high rate of nitrogen fixation of stem-nodulated plants make <it>S. rostrata </it>well fit as green manure in rice cultivation and, possibly, as a pioneer plant for wetland improvement <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>.</p>
         <p>The bacterium, isolated from stem nodules <abbrgrp><abbr bid="B4">4</abbr></abbrgrp> and originally designated <it>Rhizobium </it>sp. strain ORS571, was renamed <it>Azorhizobium caulinodans </it>inspired by the stem (cauli-)nodulating capacity and by the diazotrophic properties of the strain (azo-rhizobium). Its host range for effective nodulation is very narrow: although nodulation of several <it>Sesbania </it>sp. has been reported, nitrogen-fixing nodules are formed only on <it>S. rostrata </it>and <it>S. punctata </it><abbrgrp><abbr bid="B7">7</abbr></abbrgrp>. <it>A. caulinodans </it>also induces Fix nodules on <it>Phaseolus vulgaris </it>and <it>Leucaena leucocephala </it><abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. Two features distinguish <it>A. caulinodans </it>from other rhizobia: its taxonomic position and its dual capacity for free-living and symbiotic nitrogen fixation. The latter is exceptional <abbrgrp><abbr bid="B9">9</abbr></abbrgrp> and implies a regulatory mechanism to either assimilate the ammonia or donate it to the plant in the symbiotic interaction. The first taxonomic study of <it>A. caulinodans </it>strain ORS571 <abbrgrp><abbr bid="B10">10</abbr></abbrgrp> showed that it belongs to the <it>Rhodopseudomonas palustris </it>rRNA branch of purple bacteria, but that it is quite distinct from both <it>Rhodopseudomonas </it>and <it>Bradyrhizobium </it>spp. Based on numerical analysis of phenotypes, protein patterns, and DNA-DNA and DNA-rRNA hybridizations, <it>A. caulinodans </it>was considered as a separate genus with <it>Xanthobacter </it>as closest relative <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>. <it>Xanthobacter </it>sp. are diazotrophic bacteria found in diverse soil habitats and in association with rice (<it>Oryza sativa</it>) roots <abbrgrp><abbr bid="B12">12</abbr><abbr bid="B13">13</abbr></abbrgrp>. Comparison of 16S rRNA sequences indicated that <it>X. flavus </it>and <it>A. caulinodans </it>are strongly related <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>.</p>
         <p>Here, we present the genome sequence of the <it>A. caulinodans </it>strain ORS571 and discuss the annotation in function of the organism's biology with reference to comparative genomics. This information will stimulate the research on an organism that has real potential for novel applications in agriculture.</p>
      </sec>
      <sec>
         <st>
            <p>Results</p>
         </st>
         <sec>
            <st>
               <p>Genome organization</p>
            </st>
            <p>Sequencing of the genome of <it>A. caulinodans </it>strain ORS571 (hereafter designated <it>A. caulinodans</it>) revealed a single circular chromosome of 5,369,772 base pairs <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. Relevant genome features generated with the BLASTatlas tool <abbrgrp><abbr bid="B16">16</abbr></abbrgrp> are presented in Figure <figr fid="F1">1</figr> and can be viewed in detail as a web-based resource <abbrgrp><abbr bid="B17">17</abbr></abbrgrp>. The putative origin of replication was predicted based on the position of a GC skew shift (Figure <figr fid="F1">1</figr>) <abbrgrp><abbr bid="B18">18</abbr></abbrgrp> and coincided with the occurrence of a gene cluster typically associated with origins of replication in circular chromosomes of &#945;-proteobacteria (Figure <figr fid="F2">2A</figr>) <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>. The specific distribution and orientation of the FtsK Orienting Polar Sequences (KOPS) motif 5'-GGGNAGGG-3', which is involved in loading the FtsK DNA translocase and directing it to the replication terminus in &#945;-proteobacteria <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>, confirmed the predicted location of the origin between AZC_4717 and AZC_0001 (Figure <figr fid="F2">2B</figr>).</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Snapshot of the output generated after analysis of the <it>A. caulinodans </it>genome with the Genome Atlas tool</p>
               </caption>
               <text>
                  <p><b>Snapshot of the output generated after analysis of the <it>A. caulinodans </it>genome with the Genome Atlas tool</b>. The output is accessible as a web-based resource [17] that can can be used as a tool to zoom in on specific regions of interest. Hits within the UNIPROT database, a comparison at the protein level between 14 &#945;-proteobacteria and <it>A. caulinodans</it>, and the synteny between these genomes, the genome annotation, and structural features are represented. The origin and terminus of replication are indicated and the symbiotic region is boxed. From the outer to the inner circle: circle 1, protein hits in the UNIPROT database; circle 2, synteny between 15 &#945;-proteobacterial genomes; circle 3, <it>Agrobacterium tumefaciens </it>C58; circle 4, <it>Xanthobacter autotrophicus </it>Py2; circle 5, <it>Sinorhizobium meliloti </it>1021; circle 6, <it>Bradyrhizobium japonicum </it>USDA 110; circle 7, <it>Rhizobium leguminosarum </it>3841; circle 8, <it>Rhizobium etli </it>CFN42; circles 9 and 10, <it>Mesorhizobium loti </it>strains BNC1 and MAFF303099, respectively; circle 11, <it>Nitrobacter winogradskyi </it>Nb225; circles 12, 13, 14, 15, and 16, <it>Rhodopseudomonas palustris </it>strains CGA009, HaA2, BisA53, BisB18, and BisB5, respectively; circle 17, intrinsic curvature; circle 18, stacking energy; circle 19, position preference; circle 20, genome annotation; circle 21, global repeats; circle 22, inverted repeats; circle 23, GC skew; circle 24, percent AT. The structural DNA parameters in circles 21 and 22 relate to the occurrence of repeats that might indicate inserted sequences, and circles 18 and 19 designate the accessibility and flexibility of the DNA as a measure for the capacity to interact with proteins.</p>
               </text>
               <graphic file="1471-2164-9-271-1"/>
            </fig>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Predicted position of the origin of replication</p>
               </caption>
               <text>
                  <p><b>Predicted position of the origin of replication</b>. A. Conservation of a cluster of 12 genes located around the origin of replication in several &#945;-proteobacteria: (1) <it>Azorhizobium caulinodans</it>, (2) <it>Agrobacterium tumefaciens</it>, <it>Sinorhizobium meliloti</it>, <it>Rhizobium leguminosarum</it>, and <it>Rhizobium etli</it>, (3) <it>Mesorhizobium loti</it>, <it>Brucella abortus</it>, and <it>Brucella suis</it>, (4) <it>Bradyrhizobium japonicum </it>and <it>Rhodopseudomonas palustris</it>, (5) <it>Caulobacter crescentus</it>, and (6) <it>Xanthobacter autotrophicus</it>. The putative proteins and the origin of replication are indicated. B. Cumulative distribution in forward and reverse orientation of the 8-base KOPS motif 5'-GGGNAGGG-3' in the genome of <it>A. caulinodans</it>. The orientation of this motif is strongly biased toward <it>dif </it>sites at the terminus of replication (Terminus).</p>
               </text>
               <graphic file="1471-2164-9-271-2"/>
            </fig>
            <p>Although the overall GC content of the <it>A. caulinodans </it>genome is 67% and the average GC incidence at the third position of the codon (GC3) is 85%, the chromosome has many islands of varying size with different GC (Figure <figr fid="F3">3A</figr>) and GC3 contents (Figure <figr fid="F3">3B</figr>). In accordance with the overall high GC content, the codon usage is shifted toward GC-rich codons (Figure <figr fid="F4">4A</figr>) and, consequently, GC-coded amino acids are overrepresented (Figure <figr fid="F4">4B</figr>).</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Nucleotide composition of the <it>A. caulinodans </it>genome</p>
               </caption>
               <text>
                  <p><b>Nucleotide composition of the <it>A. caulinodans </it>genome</b>. The GC and GC3 contents for each open reading frame were calculated and positioned on the genome. Every gene was classified in one of four classes: orphans, genes of the <it>A. caulinodans </it>genome without homolog in other bacteria of the data set (44 genomes) (red squares); singletons, genes with one representative in <it>A. caulinodans </it>and homologs in the data set (green stars); phage- or integrase-related genes (yellow triangles); duplicated genes with more than one paralog in the <it>A. caulinodans </it>genome (blue diamonds). GC (A) and GC3 (B) distribution across the genome; GC (C) and GC3 (D) distribution across the symbiotic region. Circles (C and D) indicate the location of the three <it>nod </it>loci.</p>
               </text>
               <graphic file="1471-2164-9-271-3"/>
            </fig>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Codon (A) and amino acid (B) usage in the <it>A. caulinodans </it>genome (red) and the symbiotic region (blue)</p>
               </caption>
               <text>
                  <p>
                     <b>Codon (A) and amino acid (B) usage in the <it>A. caulinodans </it>genome (red) and the symbiotic region (blue).</b>
                  </p>
               </text>
               <graphic file="1471-2164-9-271-4"/>
            </fig>
            <p>Combined computer prediction and similarity searches (Methods) revealed 4717 protein-encoding genes with an average coding density of one gene in every 1123 bp (89%). With the BLASTP program (Methods), the amino acid sequences were compared with the sequences in the nonredundant protein database at NCBI. A putative function could be assigned to 3588 genes (76.1%), 954 genes (20.2%) were similar to hypothetical genes, and the remaining 175 (3.7%) had no significant similarity to any registered gene (Figure <figr fid="F1">1</figr>; Table <tblr tid="T1">1</tblr>; Additional file <supplr sid="S1">1</supplr>).</p>
            <suppl id="S1">
               <title>
                  <p>Additional file 1</p>
               </title>
               <text>
                  <p><b>Overview of the genes, their properties, and translation products present in the genome of <it>A. caulinodans</it></b>. From left to right: unique ID for each <it>A. caulinodans </it>gene; indication of the gene function based on homology; functional classification of genes according to Riley <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>; GC content at the third position of codons in percent; GC content of a gene in percent; start/stop, position of start codon or stop codon of a gene on the plus or minus strand, respectively; stop/start, position of stop codon or start codon of a gene on the plus or minus strand, respectively; strand, coding sequence on the plus or minus strand; protein sequence.</p>
               </text>
               <file name="1471-2164-9-271-S1.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Overview of the functional categories of proteins present in the <it>A. caulinodans </it>genome according to the classification of Riley [26].</p>
               </caption>
               <tblbdy cols="3">
                  <r>
                     <c ca="left">
                        <p>Functional classification</p>
                     </c>
                     <c ca="left">
                        <p>No.<sup>a</sup></p>
                     </c>
                     <c ca="left">
                        <p>%<sup>b</sup></p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Amino acid biosynthesis</p>
                     </c>
                     <c ca="left">
                        <p>132</p>
                     </c>
                     <c ca="left">
                        <p>2.8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Biosynthesis of cofactors, prosthetic groups and carriers</p>
                     </c>
                     <c ca="left">
                        <p>159</p>
                     </c>
                     <c ca="left">
                        <p>3.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cell envelope</p>
                     </c>
                     <c ca="left">
                        <p>174</p>
                     </c>
                     <c ca="left">
                        <p>3.7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cellular processes</p>
                     </c>
                     <c ca="left">
                        <p>200</p>
                     </c>
                     <c ca="left">
                        <p>4.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Central intermediary metabolism</p>
                     </c>
                     <c ca="left">
                        <p>161</p>
                     </c>
                     <c ca="left">
                        <p>3.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Energy metabolism</p>
                     </c>
                     <c ca="left">
                        <p>303</p>
                     </c>
                     <c ca="left">
                        <p>6.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Fatty acid, phopholipid, and sterol metabolism</p>
                     </c>
                     <c ca="left">
                        <p>136</p>
                     </c>
                     <c ca="left">
                        <p>2.9</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Purines, pyrimidines, nucleosides, and nucleotides</p>
                     </c>
                     <c ca="left">
                        <p>66</p>
                     </c>
                     <c ca="left">
                        <p>1.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Regulatory function</p>
                     </c>
                     <c ca="left">
                        <p>384</p>
                     </c>
                     <c ca="left">
                        <p>8.1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>DNA replication, recombination and repair</p>
                     </c>
                     <c ca="left">
                        <p>79</p>
                     </c>
                     <c ca="left">
                        <p>1.7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Transcription</p>
                     </c>
                     <c ca="left">
                        <p>49</p>
                     </c>
                     <c ca="left">
                        <p>1.0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Signal transduction</p>
                     </c>
                     <c ca="left">
                        <p>39</p>
                     </c>
                     <c ca="left">
                        <p>0.8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Translation</p>
                     </c>
                     <c ca="left">
                        <p>227</p>
                     </c>
                     <c ca="left">
                        <p>4.8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Transport and binding proteins</p>
                     </c>
                     <c ca="left">
                        <p>714</p>
                     </c>
                     <c ca="left">
                        <p>15.2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Other categories</p>
                     </c>
                     <c ca="left">
                        <p>765</p>
                     </c>
                     <c ca="left">
                        <p>16.2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Hypothetical protein</p>
                     </c>
                     <c ca="left">
                        <p>954</p>
                     </c>
                     <c ca="left">
                        <p>20.2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Unknown protein</p>
                     </c>
                     <c ca="left">
                        <p>175</p>
                     </c>
                     <c ca="left">
                        <p>3.7</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total</p>
                     </c>
                     <c ca="left">
                        <p>4717</p>
                     </c>
                     <c ca="left">
                        <p>100.0</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p><sup>a </sup>Number of proteins that belong to a specific class.</p>
                  <p><sup>b </sup>Percentage of total proteins that belong to a specific class.</p>
               </tblfn>
            </tbl>
            <p>Three rRNA clusters are ordered as 5S-23S-16S (located between the protein-coding genes AZC_0613-AZC_0614, AZC_4195-AZC_4196, and AZC_4435-AZC_4436) and all have an insertion of a tRNA-Ile and a tRNA-Ala between the 16S and 23S genes. A total of 53 tRNA genes representing 44 tRNA species for all 20 amino acids were assigned by sequence similarity and computer prediction with the tRNAscan-SE program <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>. Most of the tRNA genes are dispersed on the genome and are probably transcribed as single units. Thirty out of 57 ribosomal protein genes occur in a cluster (AZC_2529-AZC_2559), whereas the others are scattered over the genome (Additional file <supplr sid="S1">1</supplr>).</p>
         </sec>
         <sec>
            <st>
               <p>Phylogeny and comparative genomics</p>
            </st>
            <p>For phylogenetic analysis (Methods), the genomes of <it>A. caulinodans </it>and of 44 &#945;-proteobacteria were compared (Additional file <supplr sid="S2">2</supplr>). The data set was assembled based on the available complete genome sequences (closure date August 15, 2007) and ecological or phylogenetic relatedness. The resulting maximum-likelihood tree (Figure <figr fid="F5">5A</figr>) showed a great concordance with &#945;-proteobacterial trees based on complete 16S rRNA genes <abbrgrp><abbr bid="B22">22</abbr></abbrgrp> or sets of protein families <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>. Our analysis placed <it>A. caulinodans </it>closest to <it>X. autotrophicus</it>, <it>Nitrobacter winogradskyi</it>, <it>Rhodopseudomonas palustris</it>, and <it>Bradyrhizobium japonicum</it>, consistent with previous taxonomic studies <abbrgrp><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr><abbr bid="B13">13</abbr></abbrgrp>. With <it>A. caulinodans </it>as a reference genome, a graphical representation of the BLAST hits of the proteins encoded by the genomes of the 13 closest relatives was generated with the BLASTatlas tool (Figure <figr fid="F1">1</figr>) <abbrgrp><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr></abbrgrp>.</p>
            <suppl id="S2">
               <title>
                  <p>Additional file 2</p>
               </title>
               <text>
                  <p><b>Overview of the properties of the 45 &#945;-proteobacterial genomes of the data set</b>. From left to right: bacterial strain; type of replicon; NCBI database identification code; size in Mbp; GC content of the replicon; number of proteins encoded by the replicon; number of structural RNA elements on the replicon.</p>
               </text>
               <file name="1471-2164-9-271-S2.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <fig id="F5">
               <title>
                  <p>Figure 5</p>
               </title>
               <caption>
                  <p>Maximum-likelihood tree and prevalence of duplicated, singleton, and orphan genes within 45 complete &#945;-proteobacterial genome sequences</p>
               </caption>
               <text>
                  <p><b>Maximum-likelihood tree and prevalence of duplicated, singleton, and orphan genes within 45 complete &#945;-proteobacterial genome sequences</b>. A. Unrooted maximum-likelihood tree based on 108 conserved protein sequences (for construction of the tree and references to the genomes, see Methods and Additional file <supplr sid="S2">2</supplr>, respectively). Bootstraps are 100, unless indicated otherwise. B. Percentual presence of the four gene categories: orphans (dark blue); singletons (cyan); phage- or integrase-related genes (red); and duplicated genes or paralogs (light blue). Genome sizes are indicated on the right.</p>
               </text>
               <graphic file="1471-2164-9-271-5"/>
            </fig>
            <p>For a broader view of the gene relationships, the occurrence and organization of the proteins encoded by these 45 genomes were evaluated (Methods). Each gene of a total data set of 146,315 was classified in one of four groups: orphans, genes without homologs in other bacteria of the data set; singletons, genes with one representative in the genome and homologs in other genomes; phage or integrase-related genes; and duplicated genes or paralogs with more than one paralog in the genome. The distribution of each of these categories differed in the surveyed genomes (Figure <figr fid="F5">5B</figr>). Paralog representation ranged from 5% for the <it>Neorickettsia sennetsu </it>strain <it>Miyayama </it>(genome size 0.86 Mb) to 44% for <it>Rhizobium leguminosarum </it>bv. <it>vicae </it>(strain 3841) (genome size 7.79 Mb), whereas <it>A. caulinodans </it>had 36% paralogs (genome size 5.37 Mb). The data confirmed the observation that the number of paralogs strongly correlates with the genome size in a linear regression <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>.</p>
            <p>Altogether, these analyses demonstrate that currently <it>X. autotrophicus </it>is the closest sequenced relative of <it>A. caulinodans</it>. However, a comparison of the genomes with the ARTEMIS comparison tool <abbrgrp><abbr bid="B25">25</abbr></abbrgrp> revealed a very low degree of synteny (Additional file <supplr sid="S3">3</supplr>). Although short sequence stretches are conserved, extensive rearrangements have taken place. The occurrence of four prophages and numerous transposases in the <it>A. caulinodans </it>genome suggests a high genome plasticity. In <it>A. caulinodans</it>, 1412 proteins have no counterpart in <it>X. autotrophicus </it>of which 544 (38%) are catalogued as unknown or hypothetical (Additional file <supplr sid="S4">4</supplr>). In the remaining group of functionally classified proteins, 46% have GC and GC3 contents different from the genome averages, suggesting recent acquisition.</p>
            <suppl id="S3">
               <title>
                  <p>Additional file 3</p>
               </title>
               <text>
                  <p><b>Whole genome comparison of <it>A. caulinodans </it>ORS571 and <it>Xanthobacter autotrophicus </it>Py2 using the ARTEMIS Comparison Tool </b><abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. Red and blue lines connect similar sequences and similar sequences that are inverted between strains, respectively.</p>
               </text>
               <file name="1471-2164-9-271-S3.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S4">
               <title>
                  <p>Additional file 4</p>
               </title>
               <text>
                  <p><b>Overview of genes present in the <it>A. caulinodans </it>ORS571 genome and absent in the <it>Xanthobacter autotrophicus </it>Py2 genome</b>. From left to right: unique ID for each <it>A. caulinodans </it>gene; indication of the gene function based on homology; GC content at the third position of codons in percent; GC content of a gene in percent.</p>
               </text>
               <file name="1471-2164-9-271-S4.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Functional protein classes and metabolic pathways</p>
            </st>
            <p>The putative protein-encoding genes were ordered into 17 classes <abbrgrp><abbr bid="B26">26</abbr></abbrgrp> (Table <tblr tid="T1">1</tblr>) and the metabolic potential of <it>A. caulinodans </it>was analyzed with the PathoLogic tool of the BioCyC/MetaCYC suite <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>.</p>
            <p>These analyses revealed the presence of many regulatory genes (8%) and several RNA polymerase &#963; factors, among which two household &#963;<sup>70 </sup>factors (AZC_3643 and AZC_4253), two &#963;<sup>54 </sup>factors (AZC_2924 and AZC_3925; see below), and five &#963; factors of the extracytoplasmic subclass (AZC_0389, AZC_1202, AZC_2427, AZC_2453, and AZC_3238), implying responsiveness to many environmental triggers. As <it>A. caulinodans </it>is a motile bacterium, a large gene cluster is present (AZC_0615-AZC_0666) for the formation of a type-III flagellum. A significant number of chemotaxis genes predicts the capacity to respond to a wide array of molecules (Additional file <supplr sid="S5">5</supplr>). While no complete quorum sensing system could be detected, the presence of no less than five LuxR-type response regulators suggests that <it>A. caulinodans </it>has the potential to listen in on acyl-homoserine lactone-mediated communication in its surroundings.</p>
            <suppl id="S5">
               <title>
                  <p>Additional file 5</p>
               </title>
               <text>
                  <p><b>Chemotaxis and motility genes in the <it>A. caulinodans </it>genome</b>. From left to right: unique ID for each <it>A. caulinodans </it>gene; indication of the gene function based on homology; functional classification of genes according to Riley <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>; GC content at the silent third base of codons in percent; GC content of a gene in percent.</p>
               </text>
               <file name="1471-2164-9-271-S5.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>A variety of encoded proteins might offer protection against toxic compounds in the environment (Additional file <supplr sid="S6">6</supplr>). Examples are two cytochrome P450 monooxygenases and pathways to degrade or modify plant-derived molecules, such as protocatechuate, and xenobiotics, such as cyanate, 1,4-dichlorobenzene, octane, and gallate. Several multidrug efflux pumps, antibiotic-modifying enzymes, and heavy metal translocation systems probably confer resistance to deleterious compounds. The production of the siderophores enterobactin and aerobactin might guarantee iron acquisition from the surroundings.</p>
            <suppl id="S6">
               <title>
                  <p>Additional file 6</p>
               </title>
               <text>
                  <p><b>Putative detoxification genes in <it>A. caulinodans</it></b>. From left to right: unique ID for each <it>A. caulinodans </it>gene; indication of the gene function based on homology; functional classification of genes according to Riley <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>; GC content at the third position of codons in percent; GC content of a gene in percent.</p>
               </text>
               <file name="1471-2164-9-271-S6.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>The surface of bacteria is important for recognition, attachment, and colonization during the interaction with a host. Exopolysaccharides and lipopolysaccharides are involved in nodulation as protective compounds against defense molecules generated by the plant and as communication signals <abbrgrp><abbr bid="B28">28</abbr><abbr bid="B29">29</abbr><abbr bid="B30">30</abbr></abbrgrp>. Other functions could relate to surface structures, important for interaction with the host (Additional file <supplr sid="S7">7</supplr>), e.g. putative adhesion proteins, antigens, and 29 genes that code for proteins with GGDEF/EAL domains. The latter typically play a role in the transition from a motile planktonic form to a sessile biofilm by controlling the formation and degradation of the secondary messenger cyclic di-GMP <abbrgrp><abbr bid="B31">31</abbr></abbrgrp>. Hormones also play an important role in plant-microbe interactions. Both a structural (AZC_0267) and a regulatory gene (AZC_0266) mediating degradation of the ethylene precursor 1-aminocyclopropane-1-carboxylate, are present in the genome.</p>
            <suppl id="S7">
               <title>
                  <p>Additional file 7</p>
               </title>
               <text>
                  <p><b>Genes encoding surface-associated components in the <it>A. caulinodans </it>genome</b>. From left to right: unique ID for each <it>A. caulinodans </it>gene; indication of the gene function based on homology; GC content at the third position of codons in percent; GC content of a gene in percent.</p>
               </text>
               <file name="1471-2164-9-271-S7.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>Over 15% of the genes are dedicated to "transport and binding", of which more than 50% belong to the ATP-binding-cassette (ABC) transporter class. With 118 complete systems (consisting of a solute-binding protein, a permease, and an ABC component for the uptake systems, or an ABC component and a permease for the export systems), and numerous orphan subunits scattered over the genome, the transporter complement of <it>A. caulinodans </it>equals that of many other soil bacteria. These high-affinity transport systems are dedicated to the uptake of peptides, amino acids, sugars, polyamines, siderophores, nitrate/sulfonate/bicarbonate, or C4-dicarboxylate and many unknown substrates (Additional file <supplr sid="S8">8</supplr>). Accordingly, catabolic pathways are predicted for compounds, such as amino acids (including citrulline and ornithine), glucuronate, galactonate, galactarate, gluconate, quinate, L-idonate, creatinine, and 4-hydroxymandelate. Sugars, such as glucose, fructose, sucrose, ribose, xylose, xylulose, and lactose are not metabolized by <it>A. caulinodans</it>; instead, dicarboxylic acids are used as primary carbon source <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>, as reflected by the presence of multiple C4-dicarboxylic acid transport systems. The occurrence of 16 putative alcohol dehydrogenase genes suggests that ethanol could be a major carbon source under flooded conditions. <it>A. caulinodans </it>is also capable of oxidizing hydrogen, an obligatory by-product of the nitrogenase, and the required <it>hup, hyp</it>, and <it>hox</it>A genes are located in a large gene cluster (AZC_0594-AZC_0613) <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>. Encoded energy metabolism pathways include glycolysis, Entner-Doudoroff, and TCA cycle. The absence of a gene encoding phosphofructokinase indicates the lack of a functional Emden-Meyerhof pathway.</p>
            <suppl id="S8">
               <title>
                  <p>Additional file 8</p>
               </title>
               <text>
                  <p><b>Genes in the <it>A. caulinodans </it>genome dedicated to transport</b>. From left to right: unique ID for each <it>A. caulinodans </it>gene; indication of the gene function based on homology; functional classification of genes according to Riley <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>; position of start codon or stop codon of a gene on the plus or minus strand, respectively; position of stop codon or start codon of a gene on the plus or minus strand, respectively; coding sequence on the plus or minus strand.</p>
               </text>
               <file name="1471-2164-9-271-S8.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Nitrogen fixation and related functions</p>
            </st>
            <p>Table <tblr tid="T2">2</tblr> lists the genomic position of <it>A. caulinodans </it>genes related to free-living and symbiotic nitrogen fixation. These genes code for known functions, such as formation of the nitrogenase, assembly and stabilization of the complex, synthesis of the MoFe cofactor and the FeS clusters, electron transport, ammonium assimilation, and regulation of gene expression by nitrogen and oxygen, but also for proteins whose exact role await experimental confirmation. Several <it>nif </it>genes occur in more than one copy and are scattered over the genome as solitary loci or clusters of varying size with GC and GC3 contents matching the averages of the genome (Additional file <supplr sid="S1">1</supplr>). The NifH phylogeny was congruent with the phylogenetic relationships based on 16S rRNA <abbrgrp><abbr bid="B33">33</abbr></abbrgrp> or on core protein families [Figure <figr fid="F5">5A</figr>]. The same holds true for the other genes listed in Table <tblr tid="T2">2</tblr> (data not shown).</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Nitrogen fixation-related genes</p>
               </caption>
               <tblbdy cols="3">
                  <r>
                     <c ca="left">
                        <p>Identifier</p>
                     </c>
                     <c ca="left">
                        <p>Gene</p>
                     </c>
                     <c ca="left">
                        <p>Description</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_0344</p>
                     </c>
                     <c ca="left">
                        <p><it>pts</it>N</p>
                     </c>
                     <c ca="left">
                        <p>PTS IIA-like nitrogen-regulatory protein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_1036</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>X</p>
                     </c>
                     <c ca="left">
                        <p>Nitrogenase MoFe cofactor biosynthesis</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_1037</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>N</p>
                     </c>
                     <c ca="left">
                        <p>Nitrogenase MoFe cofactor biosynthesis</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_1038</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>E</p>
                     </c>
                     <c ca="left">
                        <p>Nitrogenase MoFe cofactor biosynthesis</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_1039</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>K</p>
                     </c>
                     <c ca="left">
                        <p>Nitrogenase MoFe protein &#946;-chain</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_1040</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>D</p>
                     </c>
                     <c ca="left">
                        <p>Nitrogenase MoFe protein &#945;-chain</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_1041</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>H</p>
                     </c>
                     <c ca="left">
                        <p>Dinitrogenase reductase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_1049</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>A</p>
                     </c>
                     <c ca="left">
                        <p>Transcriptional activator</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_1601</p>
                     </c>
                     <c ca="left">
                        <p><it>gln</it>A</p>
                     </c>
                     <c ca="left">
                        <p>Glutamine synthetase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_1602</p>
                     </c>
                     <c ca="left">
                        <p><it>gln</it>B</p>
                     </c>
                     <c ca="left">
                        <p>Nitrogen regulatory protein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_2280</p>
                     </c>
                     <c ca="left">
                        <p><it>ntr</it>B<it>/ntr</it>Y</p>
                     </c>
                     <c ca="left">
                        <p>Signal transduction histidine kinase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_2924</p>
                     </c>
                     <c ca="left">
                        <p><it>rpo</it>F</p>
                     </c>
                     <c ca="left">
                        <p>RNA polymerase &#963;<sup>54 </sup>factor</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3080</p>
                     </c>
                     <c ca="left">
                        <p><it>nfr</it>A</p>
                     </c>
                     <c ca="left">
                        <p>Translation regulator of <it>nif</it>A</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3083</p>
                     </c>
                     <c ca="left">
                        <p><it>ntr</it>X</p>
                     </c>
                     <c ca="left">
                        <p>Transcriptional regulator</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3084</p>
                     </c>
                     <c ca="left">
                        <p><it>ntr</it>Y</p>
                     </c>
                     <c ca="left">
                        <p>Signal transduction histidine kinase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3086</p>
                     </c>
                     <c ca="left">
                        <p><it>ntr</it>C</p>
                     </c>
                     <c ca="left">
                        <p>Transcriptional regulator</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3087</p>
                     </c>
                     <c ca="left">
                        <p><it>ntr</it>B</p>
                     </c>
                     <c ca="left">
                        <p>Signal transduction histidine kinase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3088</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>R3</p>
                     </c>
                     <c ca="left">
                        <p>Nitrogen assimilation-regulatory protein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3410</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>U</p>
                     </c>
                     <c ca="left">
                        <p>Mobilization of Fe for Fe-S cluster synthesis and repair</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3411</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>S</p>
                     </c>
                     <c ca="left">
                        <p>Nitrogenase cofactor synthesis protein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3412</p>
                     </c>
                     <c ca="left">
                        <p><it>fix</it>U</p>
                     </c>
                     <c ca="left">
                        <p>Unknown function</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3414</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>B</p>
                     </c>
                     <c ca="left">
                        <p>Fe and S donor for MoFe cofactor biosynthesis</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3420</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>Z</p>
                     </c>
                     <c ca="left">
                        <p>Unknown function</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3443</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>H</p>
                     </c>
                     <c ca="left">
                        <p>Dinitrogenase reductase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3444</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>Q</p>
                     </c>
                     <c ca="left">
                        <p>Nitrogenase MoFe cofactor biosynthesis</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3446</p>
                     </c>
                     <c ca="left">
                        <p><it>nif</it>W</p>
                     </c>
                     <c ca="left">
                        <p>Nitrogenase-stabilizing/protective protein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3447</p>
                     </c>
                     <c ca="left">
                        <p><it>fix</it>A</p>
                     </c>
                     <c ca="left">
                        <p>Electron-transferring flavoprotein oxidoreductase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3448</p>
                     </c>
                     <c ca="left">
                        <p><it>fix</it>B</p>
                     </c>
                     <c ca="left">
                        <p>Electron-transferring flavoprotein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3449</p>
                     </c>
                     <c ca="left">
                        <p><it>fix</it>C</p>
                     </c>
                     <c ca="left">
                        <p>Electron-transferring flavoprotein oxidoreductase</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3450</p>
                     </c>
                     <c ca="left">
                        <p><it>fix</it>X</p>
                     </c>
                     <c ca="left">
                        <p>Ferredoxin protein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_3925</p>
                     </c>
                     <c ca="left">
                        <p><it>rpo</it>N</p>
                     </c>
                     <c ca="left">
                        <p>RNA polymerase &#963;<sup>54 </sup>factor</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_4523</p>
                     </c>
                     <c ca="left">
                        <p><it>cyt</it>N<it>/fix</it>N</p>
                     </c>
                     <c ca="left">
                        <p>Cytochrome c oxidase subunit 1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_4524</p>
                     </c>
                     <c ca="left">
                        <p><it>cyt</it>O<it>/fix</it>O</p>
                     </c>
                     <c ca="left">
                        <p>Cytochrome c oxidase subunit 2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_4525</p>
                     </c>
                     <c ca="left">
                        <p><it>cyt</it>Q<it>/fix</it>Q</p>
                     </c>
                     <c ca="left">
                        <p>Cytochrome c oxidase subunit 3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_4526</p>
                     </c>
                     <c ca="left">
                        <p><it>cyt</it>P<it>/fix</it>P</p>
                     </c>
                     <c ca="left">
                        <p>Cytochrome c oxidase subunit 4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_4527</p>
                     </c>
                     <c ca="left">
                        <p><it>fix</it>G</p>
                     </c>
                     <c ca="left">
                        <p>Assembly and stability of the FixNOQP complex</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_4528</p>
                     </c>
                     <c ca="left">
                        <p><it>fix</it>H</p>
                     </c>
                     <c ca="left">
                        <p>Assembly and stability of the FixNOQP complex</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_4653</p>
                     </c>
                     <c ca="left">
                        <p><it>fix</it>K</p>
                     </c>
                     <c ca="left">
                        <p>Transcriptional activator</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_4654</p>
                     </c>
                     <c ca="left">
                        <p><it>fix</it>L</p>
                     </c>
                     <c ca="left">
                        <p>Sensor protein</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>AZC_4655</p>
                     </c>
                     <c ca="left">
                        <p><it>fix</it>J</p>
                     </c>
                     <c ca="left">
                        <p>Transcriptional regulatory protein</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <p>The transcriptional activator NifA (AZC_1049) acts together with a &#963;<sup>54 </sup>factor RpoN (AZC_3925) to control the <it>nif/fix </it>gene expression <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>. Nitrogen regulation of <it>nifA </it>expression is under control of the NtrBC (AZC_3086-AZC_3087) and NtrYX (AZC_3083-AZC_3084) two-component systems <abbrgrp><abbr bid="B35">35</abbr><abbr bid="B36">36</abbr></abbrgrp> that respond to the intracellular and extracellular nitrogen status, respectively. The expression of these two loci depends on a hypothetical &#963;<sup>54 </sup>factor RpoF <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>, which presumably corresponds to AZC_2924. Oxygen control of <it>nif</it>A expression is mediated by FixLJ (AZC_4654 and AZC_4655) <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>, and the transcription factor FixK (AZC_4653) <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. The <it>nif</it>A gene is further controlled at the transcriptional level by a LysR-type regulator <abbrgrp><abbr bid="B39">39</abbr></abbrgrp> and at the translational level by the <it>nrf</it>A gene product (AZC_3080) <abbrgrp><abbr bid="B40">40</abbr></abbrgrp>. FixK also activates transcription of the <it>cyt</it>NOQP operon (AZC_4523-AZC_4526), encoding the high-affinity terminal oxidase cytochrome <it>cbb3 </it>that is induced under microaerobiosis <abbrgrp><abbr bid="B41">41</abbr><abbr bid="B42">42</abbr></abbrgrp>. Mutants in <it>cyt</it>NOQP still fix nitrogen under free-living conditions, suggesting the occurrence of another terminal oxidase <abbrgrp><abbr bid="B41">41</abbr><abbr bid="B43">43</abbr></abbrgrp>. The survey of the genome excluded the presence of a second cytochrome <it>cbb3 </it>complex, but revealed two cytochrome <it>bd </it>complexes (AZC_1353-AZC_1354 and AZC_3759-AZC_3760).</p>
         </sec>
         <sec>
            <st>
               <p>A symbiosis region</p>
            </st>
            <p>A region of 87.6 kb, delimited by a Gly-tRNA (position 4346061) and an integrase (AZC_3882) and flanked by direct repeats (Figure <figr fid="F6">6</figr>), is characterized by an overall lower GC (Figure <figr fid="F3">3C</figr>) and GC3 contents (Figure <figr fid="F3">3D</figr>) than the genome averages, and a different preferential codon usage (Figure <figr fid="F4">4A</figr>). No less than 18 putative transposases and three integrases are present, suggesting a complex history of horizontal gene transfer events. The region contains the three <it>nod </it>loci that are involved in the synthesis and secretion of the lipochitooligosaccharide Nod factors (NFs) <abbrgrp><abbr bid="B44">44</abbr></abbrgrp>, but also genes related to chemotaxis, amino acid uptake, and a putative type-IV secretion system (Additional file <supplr sid="S1">1</supplr>).</p>
            <fig id="F6">
               <title>
                  <p>Figure 6</p>
               </title>
               <caption>
                  <p>Schematic representation of the symbiosis region</p>
               </caption>
               <text>
                  <p><b>Schematic representation of the symbiosis region</b>. Genes described in the text are indicated by arrows; the others are not individually represented, but their number is specified in the pentagons. The symbiotic region is flanked by tRNA-Gly (triangles) and interspersed by multiple transposases and integrases (blue lines). Genes in the <it>nod</it>A operon are <it>nod</it>ABCSUIJZ<it>noe</it>CHOP and genes in the <it>trb </it>operon are <it>trb</it>BCDEJLFGI.</p>
               </text>
               <graphic file="1471-2164-9-271-6"/>
            </fig>
            <p>The three <it>nod </it>loci are not adjacent and have a GC content lower than that of the surrounding sequences (Figure <figr fid="F3">3C</figr>). The shifts in GC content correspond to the location of repeated elements that are flanked by insertion sequences or tRNAs (Figures <figr fid="F1">1</figr> and <figr fid="F6">6</figr>). The constitutively expressed <it>nod</it>D gene (AZC_3792) <abbrgrp><abbr bid="B45">45</abbr><abbr bid="B46">46</abbr></abbrgrp> codes for a LysR-type regulator that activates transcription of the two other flavonoid-inducible <it>nod </it>loci. The inducible operon <it>nod</it>ABCSUIJZ<it>noe</it>CHOP (AZC_3818-AZC_3807) <abbrgrp><abbr bid="B47">47</abbr><abbr bid="B48">48</abbr><abbr bid="B49">49</abbr></abbrgrp> encodes most of the enzymatic machinery for NF backbone synthesis, decoration, and secretion. The biochemical role of these proteins has been extensively described, except for the last four open reading frames <it>noe</it>CHOP that are involved in NF arabinosylation and are still under study. Based on similarity with proteins involved in arabinosylation of the cell wall in <it>Mycobacterium tuberculosis</it>, <it>noe</it>C (AZC_3810), <it>noe</it>H (AZC_3809), and <it>noe</it>O (AZC_3808) might encode the synthesis of a D-arabinose precursor <abbrgrp><abbr bid="B50">50</abbr><abbr bid="B51">51</abbr><abbr bid="B52">52</abbr></abbrgrp>. The third locus encodes the inducible <it>nol</it>K gene responsible for GDP-fucose synthesis for NF decoration (AZC_3850) <abbrgrp><abbr bid="B53">53</abbr><abbr bid="B54">54</abbr></abbrgrp>.</p>
            <p>The symbiosis region also contains two conjugation-related gene clusters with GC and GC3 contents comparable to the genome averages. The cluster AZC_3844-AZC_3826 &#8211; flanked by two transposases &#8211; consists of <it>repA </it>and genes encoding conjugal transfer, partition, and plasmid stabilization proteins (Additional file <supplr sid="S1">1</supplr>). In the cluster AZC_3856&#8211;3877, flanked by a transposase and an integrase, genes are found that are homologous to the <it>trb</it>BCDEJLFGI genes, a type-IV secretion system involved in conjugative transfer of the tumor-inducing plasmid in <it>Agrobacterium tumefaciens </it><abbrgrp><abbr bid="B55">55</abbr></abbrgrp> (Figure <figr fid="F6">6</figr>).</p>
            <p>The genome annotation indicates the presence of a few additional nodulation-related genes outside of the symbiosis region (Additional file <supplr sid="S1">1</supplr>). Two response regulators (AZC_1361 and AZC_2281) homologous to <it>nod</it>W genes of <it>Bradyrhizobium japonicum </it>and part of a two-component signal transduction system might be involved in the response to host-exuded flavonoids <abbrgrp><abbr bid="B56">56</abbr></abbrgrp>. A <it>nod</it>T-related gene (AZC_3288) <abbrgrp><abbr bid="B57">57</abbr></abbrgrp> might act as the outer-membrane component in NF secretion together with the inner-membrane NodIJ proteins. None of these four potential nodulation genes has a different GC or GC3 content, in contrast to the <it>nod </it>genes of the symbiosis region.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Discussion</p>
         </st>
         <p><it>Azorhizobium caulinodans </it>is a member of the &#945;-proteobacteria, a group with diverse genome architectures. Several plant-associated representatives, such as <it>Agrobacterium </it>and <it>Sinorhizobium</it>, have quite considerable genomes and large circular or linear plasmids. In contrast, <it>A. caulinodans </it>has a single circular chromosome of 5.37 Mb and no auxiliary replicons. The GC content and the coding density are in range with other rhizobia and soil bacteria. <it>A. caulinodans </it>is a motile, nitrogen-fixing, hydrogen-oxidizing, aerobic bacterium with a preference for organic acids as carbon source. This lifestyle is reflected in the metabolic pathways and in clusters for flagellum synthesis, motility, and chemotaxis. A high number of genes are dedicated to transport and regulation, indicating that a wide range of substrates can be taken up, but that the pathways are tightly regulated to limit the metabolic burden. Besides the well-described role of surface polysaccharides during plant-microbe interactions, the genome of <it>A. caulinodans </it>encodes functions that might be involved in biofilm formation, possibly facilitating the interaction with a host. Ongoing functional analysis will undoubtedly reveal new players in the ecology of the dual lifestyle of <it>A. caulinodans </it><abbrgrp><abbr bid="B58">58</abbr><abbr bid="B59">59</abbr></abbrgrp>.</p>
         <p>Genome analysis combined with phylogenetic studies has shed new light on bacterial evolution and taxonomy. Core functions can be identified that are highly conserved between related groups, but that may acquire individual characteristics through accessory genes <abbrgrp><abbr bid="B60">60</abbr></abbrgrp>. Analysis of a family of core proteins and 16S rDNA sequence comparison revealed that the closest relative of <it>A. caulinodans </it>is <it>Xanthobacter autotrophicus</it>. <it>Xanthobacter </it>sp. are free-living nitrogen fixers and the <it>nif </it>and <it>fix </it>genes can thus be considered part of the core functions of the <it>Azorhizobium-Xanthobacter </it>group. The major difference in the lifestyle of both organisms is that <it>A. caulinodans </it>has acquired the ability to establish a symbiosis with <it>S. rostrata</it>.</p>
         <p>The nodulation capacities are related to the presence of a symbiosis region with distinct GC and GC3 contents and codon usage. The association with tRNA loci, which presumably act as targets for the integration of foreign DNA, and multiple transposons suggest a high plasticity of this region, as reflected in its composition. The symbiosis region contains three subclusters related to nodulation, <it>nod</it>ABCSUIJZ<it>noe</it>CHOP, <it>nod</it>D, and <it>nol</it>K that are flanked by sequences suggestive of independent horizontal acquisition. The repeated elements could be the relics of insertion elements that once played a role in the evolution of the <it>A. caulinodans </it>nodulation genes that have all the characteristics of archetypal accessory genes.</p>
         <p>To study the evolution of <it>nod </it>genes, <it>A. caulinodans </it>forms an interesting case. The azorhizobial <it>nod </it>genes are only distantly related to their counterparts in other rhizobia. Phylogenetic comparisons demonstrated that the <it>nod</it>A and <it>nod</it>C genes from rhizobia that nodulate temperate legumes (e.g. <it>S. meliloti</it>, <it>R. leguminosarum </it>bv. <it>viciae </it>and bv. <it>trifolii</it>, and <it>R. galegae</it>) are grouped together and the genes from rhizobia that nodulate tropical legumes (e.g. <it>B. japonicum</it>, <it>B. elkanii</it>, <it>R. loti</it>, <it>R. tropici</it>, and <it>R. etli</it>) form a second cluster <abbrgrp><abbr bid="B61">61</abbr><abbr bid="B62">62</abbr></abbrgrp>. However, the <it>nod</it>A, <it>nod</it>B, and <it>nod</it>C genes of <it>A. caulinodans </it>belong neither to the tropical nor the temperate clusters <abbrgrp><abbr bid="B62">62</abbr><abbr bid="B63">63</abbr></abbrgrp>. Also, the genetic distance between the <it>nod</it>SU genes of <it>A. caulinodans </it>and their counterparts in other rhizobia is much greater than the mutual genetic distance between the <it>nod</it>SU genes of these rhizobia <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. The organization of the <it>nod</it>ABCSUIJ genes in <it>A. caulinodans </it>resembles the situation in <it>B. japonicum</it>, but the upstream and downstream regions are different <abbrgrp><abbr bid="B64">64</abbr><abbr bid="B65">65</abbr></abbrgrp>.</p>
         <p>At present we do not know the origin of the symbiotic genes of <it>A. caulinodans</it>. The Rhizobiaceae, which have been historically considered a true family in phylogenetic terms, now seem a rather diverse group of bacteria, including <it>Methylobacterium</it>, <it>Ralstonia</it>, and <it>Burkholderia </it>that share variant, relatively recently acquired, symbiotic gene clusters. Possibly, the <it>A. caulinodans nod </it>genes are derived from unexplored rhizobia or even from obligate endophytes. Undoubtedly, the recent and ongoing explosion in meta-genomic projects will provide more insight into the origin of the nodulation functions.</p>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>Extension of symbiotic nitrogen fixation to non-legume cereal plants is a challenging long-standing goal. Especially, there is a growing interest in nitrogen-fixing organisms that could establish an endophytic, beneficial relation with important crops, such as rice and wheat (<it>Triticum aestivum</it>). Interestingly in this context, the occurrence of <it>A. caulinodans </it>has been reported in intercellular infection pockets located in the cortex of roots of <it>Arabidopsis thaliana </it>and wheat <abbrgrp><abbr bid="B66">66</abbr></abbrgrp>. In fields where <it>S. rostrata </it>and rice are grown as rotation crops, <it>A. caulinodans </it>seems to survive very well in the rhizosphere of the rice plants and in the soil <abbrgrp><abbr bid="B67">67</abbr></abbrgrp>. Moreover, the bacterium invades emerging lateral roots of rice, and rice seedlings inoculated with <it>A. caulinodans </it>have a high nitrogenase activity <abbrgrp><abbr bid="B68">68</abbr></abbrgrp>. Finally, <it>A. caulinodans </it>fixes nitrogen under relatively high oxygen tension as a free-living organism, invades the host via cracks, and establishes intercellular colonies. Altogether, these features might be advantageous for primary infection of nitrogen-starved root systems and highlight the potential of <it>A. caulinodans </it>as a candidate model organism. The genome sequence data provide new opportunities for exploring the regulatory aspects of <it>Azorhizobium </it>nitrogen fixation and the essential features that implement the ability for endosymbiosis.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <sec>
            <st>
               <p>DNA sequencing</p>
            </st>
            <p>The nucleotide sequence of the entire genome of <it>A. caulinodans </it>ORS571 was determined by the whole-genome shotgun strategy method. For shotgun cloning, DNA fragments of 2 to 3 kb were cloned into the <it>Hin</it>cII site of pUC118. For gap closing, the pCC1Fos vector (Epicentre, Madison, WI, USA) was used, and approximately 35-kb clones were prepared. The accumulated sequence files were assembled with the Phrap program <abbrgrp><abbr bid="B69">69</abbr></abbrgrp>. A total of 71,424 random sequence files corresponding to approximately 7.7 genome equivalents were assembled to generate draft sequences. Finishing was carried out by visual editing of the sequences, followed by gap closing, and additional sequencing to obtain sequence data with a Phred score of 20 or higher <abbrgrp><abbr bid="B70">70</abbr><abbr bid="B71">71</abbr></abbrgrp>. The integrity of the final genome sequence was assessed by comparing the insert length of each fosmid clone with the computed distance between the end sequences of the clones. The end sequence data facilitated gap closure as well as accurate reconstruction of the entire genome. The final gaps in the sequences were filled by the primer walking method. A lower threshold of acceptability for the generation of consensus sequences was set at a Phred score of 20 for each base. The nucleotide sequence is available in the DDBJ/EMBL/GenBank databases under the accession number <ext-link ext-link-type="gen" ext-link-id="AP009384">AP009384</ext-link>.</p>
         </sec>
         <sec>
            <st>
               <p>Structural and functional annotation</p>
            </st>
            <p>Coding regions were assigned by a combination of computer prediction and similarity search. Briefly, the protein-coding regions were predicted with the Glimmer 2.02 program <abbrgrp><abbr bid="B72">72</abbr></abbrgrp> and all regions equal to or longer than 90 bp were translated into amino acid sequences that were subjected to similarity searches against the nonredundant protein database at NCBI with the BLASTP program <abbrgrp><abbr bid="B73">73</abbr></abbrgrp>. In parallel, the entire genomic sequence was compared with those in the nonredundant protein database with the BLASTX program <abbrgrp><abbr bid="B73">73</abbr></abbrgrp> to identify genes that had escaped prediction and/or were smaller than 90 bp, especially in the predicted intergenic regions. For predicted genes without sequence similarity to known genes, only those equal to or longer than 150 bp were considered as candidates. Functions were assigned to the predicted genes based on sequence similarity of their deduced products to that of genes of known function. For genes that encode proteins of 100 amino acid residues or more, an E-value of 10<sup>-20 </sup>was considered significant, whereas a higher E-value was significant for genes encoding smaller proteins (E-value treshold of 10<sup>-10</sup>). Genes for structural RNAs were assigned by similarity search against the in-house structural RNA database that had been generated based on the GenBank data. tRNA-encoding regions were predicted by the tRNAscan-SE 1.21 program <abbrgrp><abbr bid="B21">21</abbr></abbrgrp> in combination with the similarity search.</p>
            <p>MetaCyc analysis <abbrgrp><abbr bid="B27">27</abbr><abbr bid="B74">74</abbr></abbrgrp> detected 229 metabolic pathways, containing 1037 reaction steps. To assess the presence or absence of a metabolic pathway and to decrease the likelihood of being misled by the many enzymes that are shared among multiple pathways, the analysis was emphasized on the presence of enzymes that are unique to a pathway.</p>
         </sec>
         <sec>
            <st>
               <p>Construction of a phylogenetic tree</p>
            </st>
            <p>The Maximum-likelihood tree was based on 108 core proteins of 45 &#945;-proteobacteria <abbrgrp><abbr bid="B23">23</abbr></abbrgrp> whose sequence data and annotation files were available and downloaded from the NCBI Microbial Genome Resource database <abbrgrp><abbr bid="B75">75</abbr></abbrgrp>. The set of core genes was determined by an all-against-all BLAST at protein level. Best reciprocal hits were selected, taking into account a cut-off value defined as 20% similarity and an overlap of at least 150 amino acids. Only proteins present in all 45 genomes as single copy were considered as "core proteins" and used to construct the phylogenetic tree. The total alignment contained 32,327 amino acids. The tree was constructed with the Phyml program <abbrgrp><abbr bid="B76">76</abbr></abbrgrp> and a WAG substitution model <abbrgrp><abbr bid="B77">77</abbr></abbrgrp> and 100 bootstrap replicates were run. Unless indicated otherwise, bootstraps are 100 (Figure <figr fid="F5">5A</figr>).</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>K-BL contributed to the sequence determination and carried out the annotation of the genes. PDB analyzed the data generating the figures and the manuscript. TA, C-TL, SS, and TS contributed to the sequence determination. TK, MY, and ST annotated the gene sequences. DMK, FZN and GBW sequenced the DNA and assembled and interpreted the DNA sequence data. BR participated in the design and coordination of the study, in particular the original conception, the DNA sequencing, and subsequent DNA analysis. TTB and DWU constructed and analyzed the BLASTatlas of <it>Azorhizobium</it>. WD'H assisted in the preparation of the <it>Azorhizobium </it>genomic DNA and analysis of genetic data. JDH contributed to the MetaCyc analysis. DG carried out the evolutionary analysis of the genome. DV and MH interpreted the data and figures and wrote the article. HO contributed to sequence determination and gene annotation. All authors have read and approved the final version of the manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>This work was supported by grants from the Bio-oriented Technology Research Advancement Institution (BRAIN) of Japan and the "Geconcerteerde Onderzoeksacties" (GOA 01GA0105) of the Ghent University.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>How rhizobial symbionts invade plants: the <it>Sinorhizobium </it>&#8211; <it>Medicago </it>model</p>
            </title>
            <aug>
               <au>
                  <snm>Jones</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Kobayashi</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Davies</snm>
                  <fnm>BW</fnm>
               </au>
               <au>
                  <snm>Taga</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Walker</snm>
                  <fnm>GC</fnm>
               </au>
            </aug>
            <source>Nat Rev Microbiol</source>
            <pubdate>2007</pubdate>
            <volume>5</volume>
            <fpage>619</fpage>
            <lpage>633</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nrmicro1705</pubid>
                  <pubid idtype="pmpid" link="fulltext">17632573</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>Stem nodulation in legumes: diversity, mechanisms and unusual characters</p>
            </title>
            <aug>
               <au>
                  <snm>Boivin</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Ndoye</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Molouba</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>de Lajudie</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Dupuy</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Dreyfus</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Crit Rev Plant Sci</source>
            <pubdate>1997</pubdate>
            <volume>16</volume>
            <fpage>1</fpage>
            <lpage>30</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1080/713608143</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Nodulation in Legumes</p>
            </title>
            <aug>
               <au>
                  <snm>Sprent</snm>
                  <fnm>JI</fnm>
               </au>
            </aug>
            <publisher>Kew: Royal Botanical Gardens</publisher>
            <pubdate>2002</pubdate>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Nitrogen-fixing nodules induced by <it>Rhizobium </it>on the stem of the tropical legume <it>Sesbania rostrata</it></p>
            </title>
            <aug>
               <au>
                  <snm>Dreyfus</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Dommergues</snm>
                  <fnm>YR</fnm>
               </au>
            </aug>
            <source>FEMS Microbiol Lett</source>
            <pubdate>1981</pubdate>
            <volume>10</volume>
            <fpage>313</fpage>
            <lpage>317</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1111/j.1574-6968.1981.tb06262.x</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Nature des sites d'infection par le <it>Rhizobium </it>de la tige de la l&#233;gumineuse <it>Sesbania rostrata </it>Brem</p>
            </title>
            <aug>
               <au>
                  <snm>Duhoux</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Dreyfus</snm>
                  <fnm>BL</fnm>
               </au>
            </aug>
            <source>C R Hebd S&#233;ances Acad Sci Paris</source>
            <pubdate>1982</pubdate>
            <volume>294</volume>
            <fpage>407</fpage>
            <lpage>411</lpage>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Signaling and gene expression for water-tolerant legume nodulation</p>
            </title>
            <aug>
               <au>
                  <snm>Den Herder</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Schroeyers</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Goormachtig</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Crit Rev Plant Sci</source>
            <pubdate>2006</pubdate>
            <volume>25</volume>
            <fpage>367</fpage>
            <lpage>380</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1080/07352680600794257</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>The <it>Sesbania </it>root symbionts <it>Sinorhizobium saheli </it>and <it>S. teranga </it>bv. sesbaniae can form stem nodules on <it>Sesbania rostrata</it>, although they are less adapted to stem nodulation than <it>Azorhizobium caulinodans</it></p>
            </title>
            <aug>
               <au>
                  <snm>Boivin</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Ndoye</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Lortet</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Ndiaye</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>de Lajudie</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Dreyfus</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Appl Environ Microbiol</source>
            <pubdate>1997</pubdate>
            <volume>63</volume>
            <fpage>1040</fpage>
            <lpage>1047</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1389132</pubid>
                  <pubid idtype="pmpid" link="fulltext">16535538</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>The <it>nodS </it>gene of <it>Rhizobium tropici </it>strain CIAT899 is necessary for nodulation on <it>Phaseolus vulgaris </it>and on <it>Leucaena leucocephala</it></p>
            </title>
            <aug>
               <au>
                  <snm>Waelkens</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Voets</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Vlassak</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Vanderleyden</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>van Rhijn</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Mol Plant-Microbe Interact</source>
            <pubdate>1995</pubdate>
            <volume>8</volume>
            <fpage>147</fpage>
            <lpage>154</lpage>
            <xrefbib>
               <pubid idtype="pmpid">7772799</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Genetic analysis of nitrogen fixation in a tropical fast-growing <it>Rhizobium</it></p>
            </title>
            <aug>
               <au>
                  <snm>Elmerich</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Dreyfus</snm>
                  <fnm>BL</fnm>
               </au>
               <au>
                  <snm>Reysset</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Aubert</snm>
                  <fnm>J-P</fnm>
               </au>
            </aug>
            <source>EMBO J</source>
            <pubdate>1982</pubdate>
            <volume>1</volume>
            <fpage>499</fpage>
            <lpage>503</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">553074</pubid>
                  <pubid idtype="pmpid">16453420</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>Intra- and intergeneric similarities between the ribosomal ribonucleic acid cistrons of <it>Rhizobium </it>and <it>Bradyrhizobium </it>species and some related bacteria</p>
            </title>
            <aug>
               <au>
                  <snm>Jarvis</snm>
                  <fnm>BDW</fnm>
               </au>
               <au>
                  <snm>Gillis</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>De Ley</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Int J Syst Bacteriol</source>
            <pubdate>1986</pubdate>
            <volume>36</volume>
            <fpage>129</fpage>
            <lpage>138</lpage>
         </bibl>
         <bibl id="B11">
            <title>
               <p>Characterization of <it>Azorhizobium caulinodans </it>gen. nov, sp. nov, a stem-nodulating nitrogen-fixing bacterium isolated from <it>Sesbania rostrata</it></p>
            </title>
            <aug>
               <au>
                  <snm>Dreyfus</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Garcia</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Gillis</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Int J Syst Bacteriol</source>
            <pubdate>1988</pubdate>
            <volume>38</volume>
            <fpage>89</fpage>
            <lpage>98</lpage>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Effect of Xanthobacter, isolated and characterized from rice roots, on growth on wetland rice</p>
            </title>
            <aug>
               <au>
                  <snm>Reding</snm>
                  <fnm>HK</fnm>
               </au>
               <au>
                  <snm>Hartel</snm>
                  <fnm>PG</fnm>
               </au>
               <au>
                  <snm>Wiegel</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Plant Soil</source>
            <pubdate>1991</pubdate>
            <volume>138</volume>
            <fpage>221</fpage>
            <lpage>229</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1007/BF00012249</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>The genus <it>Xanthobacter</it></p>
            </title>
            <aug>
               <au>
                  <snm>Wiegel</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>The Prokaryotes. A Handbook on the Biology of Bacteria: Ecophysiology, Isolation, Identification, Applications</source>
            <publisher>Berlin: Springer-Verlag</publisher>
            <editor>Balows A, Tr&#252;per HG, Dworkin M, Harder W, Schleifer K-H</editor>
            <edition>2</edition>
            <pubdate>1992</pubdate>
            <volume>III</volume>
            <fpage>2365</fpage>
            <lpage>2383</lpage>
         </bibl>
         <bibl id="B14">
            <title>
               <p>16S ribosomal DNA sequence analysis confirms the close relationship between the genera <it>Xanthobacter, Azorhizobium</it>, and <it>Aquabacter </it>and reveals a lack of phylogenetic coherence among <it>Xanthobacter </it>species</p>
            </title>
            <aug>
               <au>
                  <snm>Rainey</snm>
                  <fnm>FA</fnm>
               </au>
               <au>
                  <snm>Wiegel</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Int J Syst Bacteriol</source>
            <pubdate>1996</pubdate>
            <volume>46</volume>
            <fpage>607</fpage>
            <lpage>610</lpage>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Rhizobase: The Genome Database for Rhizobia</p>
            </title>
            <url>http://bacteria.kazusa.or.jp/rhizobase</url>
         </bibl>
         <bibl id="B16">
            <title>
               <p>The genome BLASTatlas &#8211; a GeneWiz extension for visualization of whole-genome homology</p>
            </title>
            <aug>
               <au>
                  <snm>Hallin</snm>
                  <fnm>PF</fnm>
               </au>
               <au>
                  <snm>Binnewies</snm>
                  <fnm>TT</fnm>
               </au>
               <au>
                  <snm>Ussery</snm>
                  <fnm>DW</fnm>
               </au>
            </aug>
            <source>Mol BioSyst</source>
            <pubdate>2008</pubdate>
            <volume>4</volume>
            <fpage>363</fpage>
            <lpage>371</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1039/b717118h</pubid>
                  <pubid idtype="pmpid" link="fulltext">18414733</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>The Genome Atlas Tool Output for the <it>Azorhizobium caulinodans </it>ORS571 Genome</p>
            </title>
            <url>http://www.cbs.dtu.dk/~tim/Azorhizobium.html</url>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Origin of replication in circular prokaryotic chromosomes</p>
            </title>
            <aug>
               <au>
                  <snm>Worning</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Jensen</snm>
                  <fnm>LJ</fnm>
               </au>
               <au>
                  <snm>Hallin</snm>
                  <fnm>PF</fnm>
               </au>
               <au>
                  <snm>St&#230;rfeldt</snm>
                  <fnm>H-H</fnm>
               </au>
               <au>
                  <snm>Ussery</snm>
                  <fnm>DW</fnm>
               </au>
            </aug>
            <source>Environ Microbiol</source>
            <pubdate>2006</pubdate>
            <volume>8</volume>
            <fpage>353</fpage>
            <lpage>361</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1462-2920.2005.00917.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">16423021</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Conserved gene cluster at replication origins of the &#945;-proteobacteria <it>Caulobacter crescentus </it>and <it>Rickettsia prowazekii</it></p>
            </title>
            <aug>
               <au>
                  <snm>Brassinga</snm>
                  <fnm>AKC</fnm>
               </au>
               <au>
                  <snm>Siam</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Marczynski</snm>
                  <fnm>GT</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2001</pubdate>
            <volume>183</volume>
            <fpage>1824</fpage>
            <lpage>1829</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">95075</pubid>
                  <pubid idtype="pmpid" link="fulltext">11160121</pubid>
                  <pubid idtype="doi">10.1128/JB.183.5.1824-1829.2001</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>FtsK, a literate chromosome segregation machine</p>
            </title>
            <aug>
               <au>
                  <snm>Bigot</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Sivanathan</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Possoz</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Barre</snm>
                  <fnm>F-X</fnm>
               </au>
               <au>
                  <snm>Cornet</snm>
                  <fnm>F</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>2007</pubdate>
            <volume>64</volume>
            <fpage>1434</fpage>
            <lpage>1441</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1365-2958.2007.05755.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">17511809</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>tRNAscan-SE: a program for improved detection of transfer RNA genes in genomic sequence</p>
            </title>
            <aug>
               <au>
                  <snm>Lowe</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>Eddy</snm>
                  <fnm>SR</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1997</pubdate>
            <volume>25</volume>
            <fpage>955</fpage>
            <lpage>964</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">146525</pubid>
                  <pubid idtype="pmpid" link="fulltext">9023104</pubid>
                  <pubid idtype="doi">10.1093/nar/25.5.955</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>The hierarchical system of the 'Alphaproteobacteria': description of <it>Hyphomonadaceae </it>fam. nov, <it>Xanthobacteraceae </it>fam. nov. and <it>Erythrobacteraceae </it>fam. nov</p>
            </title>
            <aug>
               <au>
                  <snm>Lee</snm>
                  <fnm>K-B</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>C-T</fnm>
               </au>
               <au>
                  <snm>Anzai</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Aono</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Oyaizu</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Int J Syst Evol Microbiol</source>
            <pubdate>2005</pubdate>
            <volume>55</volume>
            <fpage>1907</fpage>
            <lpage>1919</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1099/ijs.0.63663-0</pubid>
                  <pubid idtype="pmpid" link="fulltext">16166687</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>A robust species tree for the <it>Alphaproteobacteria</it></p>
            </title>
            <aug>
               <au>
                  <snm>Williams</snm>
                  <fnm>KP</fnm>
               </au>
               <au>
                  <snm>Sobral</snm>
                  <fnm>BW</fnm>
               </au>
               <au>
                  <snm>Dickerman</snm>
                  <fnm>AW</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2007</pubdate>
            <volume>189</volume>
            <fpage>4578</fpage>
            <lpage>4586</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1913456</pubid>
                  <pubid idtype="pmpid" link="fulltext">17483224</pubid>
                  <pubid idtype="doi">10.1128/JB.00269-07</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Gene duplication and biased functional retention of paralogs in bacterial genomes</p>
            </title>
            <aug>
               <au>
                  <snm>Gevers</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Vandepoele</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Simillion</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Van de Peer</snm>
                  <fnm>Y</fnm>
               </au>
            </aug>
            <source>Trends Microbiol</source>
            <pubdate>2004</pubdate>
            <volume>12</volume>
            <fpage>148</fpage>
            <lpage>154</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tim.2004.02.007</pubid>
                  <pubid idtype="pmpid" link="fulltext">15116722</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>ACT: the Artemis comparison tool</p>
            </title>
            <aug>
               <au>
                  <snm>Carver</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Rutherford</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Berriman</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Rajandream</snm>
                  <fnm>M-A</fnm>
               </au>
               <au>
                  <snm>Barrell</snm>
                  <fnm>BG</fnm>
               </au>
               <au>
                  <snm>Parkhill</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2005</pubdate>
            <volume>21</volume>
            <fpage>3422</fpage>
            <lpage>3423</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/bti553</pubid>
                  <pubid idtype="pmpid" link="fulltext">15976072</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Systems for categorizing functions of gene products</p>
            </title>
            <aug>
               <au>
                  <snm>Riley</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Curr Opin Struct Biol</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>388</fpage>
            <lpage>392</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0959-440X(98)80074-2</pubid>
                  <pubid idtype="pmpid" link="fulltext">9666336</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>MetaCyc: a multiorganism database of metabolic pathways and enzymes</p>
            </title>
            <aug>
               <au>
                  <snm>Caspi</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Foerster</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Fulcher</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Hopkinson</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Ingraham</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kaipa</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Krummenacker</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Paley</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Pick</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Rhee</snm>
                  <fnm>SY</fnm>
               </au>
               <au>
                  <snm>Tissier</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Karp</snm>
                  <fnm>PD</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2006</pubdate>
            <volume>34</volume>
            <fpage>D511</fpage>
            <lpage>D516</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1347490</pubid>
                  <pubid idtype="pmpid" link="fulltext">16381923</pubid>
                  <pubid idtype="doi">10.1093/nar/gkj128</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Roles for azorhizobial Nod factors and surface polysaccharides in intercellular invasion and nodule penetration, respectively</p>
            </title>
            <aug>
               <au>
                  <snm>D'Haeze</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Gao</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>De Rycke</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Van Montagu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Engler</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Mol Plant-Microbe Interact</source>
            <pubdate>1998</pubdate>
            <volume>11</volume>
            <fpage>999</fpage>
            <lpage>1008</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1094/MPMI.1998.11.10.999</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Structural characterization of extracellular polysaccharides of <it>Azorhizobium caulinodans </it>and importance for nodule initiation on <it>Sesbania rostrata</it></p>
            </title>
            <aug>
               <au>
                  <snm>D'Haeze</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Glushka</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>De Rycke</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Carlson</snm>
                  <fnm>RW</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>2004</pubdate>
            <volume>52</volume>
            <fpage>485</fpage>
            <lpage>500</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1365-2958.2004.03989.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">15066035</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Lipopolysaccharides as a communication signal for progression of legume endosymbiosis</p>
            </title>
            <aug>
               <au>
                  <snm>Mathis</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Van Gijsegem</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>De Rycke</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>D'Haeze</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Van Maelsaeke</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Anthonio</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Van Montagu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Vereecke</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2005</pubdate>
            <volume>102</volume>
            <fpage>2655</fpage>
            <lpage>2660</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">549025</pubid>
                  <pubid idtype="pmpid" link="fulltext">15699329</pubid>
                  <pubid idtype="doi">10.1073/pnas.0409816102</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Mechanisms of cyclic-di-GMP signaling in bacteria</p>
            </title>
            <aug>
               <au>
                  <snm>Jenal</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Malone</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Annu Rev Genet</source>
            <pubdate>2006</pubdate>
            <volume>40</volume>
            <fpage>385</fpage>
            <lpage>407</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1146/annurev.genet.40.110405.090423</pubid>
                  <pubid idtype="pmpid" link="fulltext">16895465</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Diversity and evolution of hydrogenase systems in rhizobia</p>
            </title>
            <aug>
               <au>
                  <snm>Baginsky</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Brito</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Imperial</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Palacios</snm>
                  <fnm>J-M</fnm>
               </au>
               <au>
                  <snm>Ruiz-Arg&#252;eso</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Appl Environ Microbiol</source>
            <pubdate>2002</pubdate>
            <volume>68</volume>
            <fpage>4915</fpage>
            <lpage>4924</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">126442</pubid>
                  <pubid idtype="pmpid" link="fulltext">12324339</pubid>
                  <pubid idtype="doi">10.1128/AEM.68.10.4915-4924.2002</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>Classification of rhizobia based on <it>nodC </it>and <it>nifH </it>gene analysis reveals a close phylogenetic relationship among <it>Phaseolus vulgaris </it>symbionts</p>
            </title>
            <aug>
               <au>
                  <snm>Laguerre</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Nour</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Macheret</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Sanjuan</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Drouin</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Amarger</snm>
                  <fnm>N</fnm>
               </au>
            </aug>
            <source>Microbiology</source>
            <pubdate>2001</pubdate>
            <volume>147</volume>
            <fpage>981</fpage>
            <lpage>993</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11283294</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p><it>Azorhizobium caulinodans </it>nitrogen fixation (<it>nif/fix</it>) gene regulation: mutagenesis of the <it>nifA</it>-24/-12 promoter element, characterization of a <it>nrtA(rpoN</it>) gene, and derivation of a model</p>
            </title>
            <aug>
               <au>
                  <snm>Stigter</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Schneider</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>de Bruijn</snm>
                  <fnm>FJ</fnm>
               </au>
            </aug>
            <source>Mol Plant-Microbe Interact</source>
            <pubdate>1993</pubdate>
            <volume>6</volume>
            <fpage>238</fpage>
            <lpage>252</lpage>
            <xrefbib>
               <pubid idtype="pmpid">8471796</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>Cloning and characterization of <it>nifA </it>and <it>ntrC </it>genes of the stem nodulating bacterium ORS571, the nitrogen fixing symbiont of <it>Sesbania rostrata</it>: regulation of nitrogen fixation (<it>nif</it>) genes in the free living versus symbiotic state</p>
            </title>
            <aug>
               <au>
                  <snm>Pawlowski</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Ratet</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Schell</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>de Bruijn</snm>
                  <fnm>FJ</fnm>
               </au>
            </aug>
            <source>Mol Gen Genet</source>
            <pubdate>1987</pubdate>
            <volume>206</volume>
            <fpage>207</fpage>
            <lpage>219</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1007/BF00333576</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>Characterization of a novel <it>Azorhizobium caulinodans </it>ORS571 two-component regulatory system, NtrY/NtrX, involved in nitrogen fixation and metabolism</p>
            </title>
            <aug>
               <au>
                  <snm>Pawlowski</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Klosse</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>de Bruijn</snm>
                  <fnm>FJ</fnm>
               </au>
            </aug>
            <source>Mol Gen Genet</source>
            <pubdate>1991</pubdate>
            <volume>231</volume>
            <fpage>124</fpage>
            <lpage>138</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/BF00293830</pubid>
                  <pubid idtype="pmpid">1661370</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Involvement of <it>fixLJ </it>in the regulation of nitrogen fixation in <it>Azorhizobium caulinodans</it></p>
            </title>
            <aug>
               <au>
                  <snm>Kaminski</snm>
                  <fnm>PA</fnm>
               </au>
               <au>
                  <snm>Elmerich</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>1991</pubdate>
            <volume>5</volume>
            <fpage>665</fpage>
            <lpage>673</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1365-2958.1991.tb00738.x</pubid>
                  <pubid idtype="pmpid">2046550</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>Regulation of nitrogen fixation in <it>Azorhizobium caulinodans </it>: identification of a <it>fixK</it>-like gene, a positive regulator of <it>nifA</it></p>
            </title>
            <aug>
               <au>
                  <snm>Kaminski</snm>
                  <fnm>PA</fnm>
               </au>
               <au>
                  <snm>Mandon</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Arigoni</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Desnoues</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Elmerich</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>1991</pubdate>
            <volume>5</volume>
            <fpage>1983</fpage>
            <lpage>1991</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1365-2958.1991.tb00820.x</pubid>
                  <pubid idtype="pmpid">1766374</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>Regulation of free-living and symbiotic nitrogen fixation in <it>Azorhizobium caulinodans</it></p>
            </title>
            <aug>
               <au>
                  <snm>Kaminski</snm>
                  <fnm>PA</fnm>
               </au>
               <au>
                  <snm>Michel-Reydellet</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Desnoues</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Elmerich</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Nitrogen Fixation: Fundamentals and Applications, Current Plant Science and Biotechnology in Agriculture</source>
            <publisher>Dordrecht: Kluwer Academic Publishers</publisher>
            <editor>Tikhonovich IA, Provorov NA, Romanov VI, Newton WE</editor>
            <pubdate>1995</pubdate>
            <volume>27</volume>
            <fpage>183</fpage>
            <lpage>187</lpage>
         </bibl>
         <bibl id="B40">
            <title>
               <p>The expression of <it>nifA </it>in <it>Azorhizobium caulinodans </it>requires a gene product homologous to <it>Escherichia coli </it>HF-I, an RNA-binding protein involved in the replication of phage Q&#946; RNA</p>
            </title>
            <aug>
               <au>
                  <snm>Kaminski</snm>
                  <fnm>PA</fnm>
               </au>
               <au>
                  <snm>Desnoues</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Elmerich</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1994</pubdate>
            <volume>91</volume>
            <fpage>4663</fpage>
            <lpage>4667</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">43848</pubid>
                  <pubid idtype="pmpid" link="fulltext">8197116</pubid>
                  <pubid idtype="doi">10.1073/pnas.91.11.4663</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>Functional analysis of the <it>fixNOQP </it>region of <it>Azorhizobium caulinodans</it></p>
            </title>
            <aug>
               <au>
                  <snm>Mandon</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Kaminski</snm>
                  <fnm>PA</fnm>
               </au>
               <au>
                  <snm>Elmerich</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1994</pubdate>
            <volume>176</volume>
            <fpage>2560</fpage>
            <lpage>2568</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">205393</pubid>
                  <pubid idtype="pmpid" link="fulltext">8169204</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B42">
            <title>
               <p><it>Azorhizobium caulinodans </it>uses both cytochrome <it>bd </it>(quinol) and cytochrome <it>cbb </it><sub>3</sub> (cytochrome <it>c</it>) terminal oxidases for symbiotic N<sub>2 </sub>fixation</p>
            </title>
            <aug>
               <au>
                  <snm>Kaminski</snm>
                  <fnm>PA</fnm>
               </au>
               <au>
                  <snm>Kitts</snm>
                  <fnm>CL</fnm>
               </au>
               <au>
                  <snm>Zimmerman</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Ludwig</snm>
                  <fnm>RA</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1996</pubdate>
            <volume>178</volume>
            <fpage>5989</fpage>
            <lpage>5994</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">178456</pubid>
                  <pubid idtype="pmpid" link="fulltext">8830696</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B43">
            <title>
               <p><it>Azorhizobium caulinodans </it>respires with at least four terminal oxidases</p>
            </title>
            <aug>
               <au>
                  <snm>Kitts</snm>
                  <fnm>CL</fnm>
               </au>
               <au>
                  <snm>Ludwig</snm>
                  <fnm>RA</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1994</pubdate>
            <volume>176</volume>
            <fpage>886</fpage>
            <lpage>895</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">205126</pubid>
                  <pubid idtype="pmpid" link="fulltext">8300541</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B44">
            <title>
               <p>Nod factor structures, responses, and perception during initiation of nodule development</p>
            </title>
            <aug>
               <au>
                  <snm>D'Haeze</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Glycobiology</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <fpage>79R</fpage>
            <lpage>105R</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/glycob/12.6.79R</pubid>
                  <pubid idtype="pmpid" link="fulltext">12107077</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>Identification and characterization of a functional <it>nodD </it>gene in <it>Azorhizobium caulinodans </it>strain ORS571</p>
            </title>
            <aug>
               <au>
                  <snm>Goethals</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Van den Eede</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Van Montagu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1990</pubdate>
            <volume>172</volume>
            <fpage>2658</fpage>
            <lpage>2666</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">208910</pubid>
                  <pubid idtype="pmpid" link="fulltext">2158977</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B46">
            <title>
               <p>The <it>nodD </it>locus from <it>Azorhizobium caulinodans </it>is flanked by two repetitive elements</p>
            </title>
            <aug>
               <au>
                  <snm>Geelen</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Goethals</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Van Montagu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>1995</pubdate>
            <volume>164</volume>
            <fpage>107</fpage>
            <lpage>111</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0378-1119(95)00456-G</pubid>
                  <pubid idtype="pmpid" link="fulltext">7590297</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B47">
            <title>
               <p>Common <it>nodABC </it>genes in <it>Nod </it>locus 1 of <it>Azorhizobium caulinodans</it>: nucleotide sequence and plant-inducible expression</p>
            </title>
            <aug>
               <au>
                  <snm>Goethals</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Gao</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Tomekpe</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Van Montagu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Mol Gen Genet</source>
            <pubdate>1989</pubdate>
            <volume>219</volume>
            <fpage>289</fpage>
            <lpage>298</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/BF00261190</pubid>
                  <pubid idtype="pmpid">2615763</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B48">
            <title>
               <p>Identification of <it>nodSUIJ </it>genes in Nod locus <it>1 </it>of <it>Azorhizobium caulinodans</it>: evidence that <it>nodS </it>encodes a methyltransferase involved in Nod factor modification</p>
            </title>
            <aug>
               <au>
                  <snm>Geelen</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Mergaert</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Geremia</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Goormachtig</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Van Montagu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>1993</pubdate>
            <volume>9</volume>
            <fpage>145</fpage>
            <lpage>154</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1365-2958.1993.tb01676.x</pubid>
                  <pubid idtype="pmpid">8412659</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B49">
            <title>
               <p>Fucosylation and arabinosylation of Nod factors in <it>Azorhizobium caulinodans</it>: involvement of <it>nolK</it>, <it>nodZ</it>, and <it>noeC</it>, and/or downstream genes</p>
            </title>
            <aug>
               <au>
                  <snm>Mergaert</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>D'Haeze</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Fern&#225;ndez-L&#243;pez</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Geelen</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Goethals</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Prom&#233;</snm>
                  <fnm>J-C</fnm>
               </au>
               <au>
                  <snm>Van Montagu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>1996</pubdate>
            <volume>21</volume>
            <fpage>409</fpage>
            <lpage>419</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1046/j.1365-2958.1996.6451366.x</pubid>
                  <pubid idtype="pmpid">8858594</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B50">
            <title>
               <p>Identification and active expression of the <it>Mycobacterium tuberculosis </it>gene encoding 5-phospho-&#945;-D-ribose-1-diphosphate:decaprenyl-phosphate 5-phosphoribosyltransferase, the first enzyme committed to decaprenylphosphoryl-D-arabinose synthesis</p>
            </title>
            <aug>
               <au>
                  <snm>Huang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Scherman</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>D'Haeze</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Vereecke</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Crick</snm>
                  <fnm>DC</fnm>
               </au>
               <au>
                  <snm>McNeil</snm>
                  <fnm>MR</fnm>
               </au>
            </aug>
            <source>J Biol Chem</source>
            <pubdate>2005</pubdate>
            <volume>208</volume>
            <fpage>24539</fpage>
            <lpage>24543</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1074/jbc.M504068200</pubid>
                  <pubid idtype="pmpid">15878857</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B51">
            <title>
               <p>Decaprenylphosphoryl arabinofuranose, the donor of the D-arabinofuranosyl residues of mycobacterial arabinan, is formed via a two-step epimerization of decaprenylphosphoryl ribose</p>
            </title>
            <aug>
               <au>
                  <snm>Miku&#353;ov&#225;</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Huang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Yagi</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Vereecke</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>D'Haeze</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Scherman</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Brennan</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>McNeil</snm>
                  <fnm>MR</fnm>
               </au>
               <au>
                  <snm>Crick</snm>
                  <fnm>DC</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2005</pubdate>
            <volume>187</volume>
            <fpage>8020</fpage>
            <lpage>8025</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1291263</pubid>
                  <pubid idtype="pmpid" link="fulltext">16291675</pubid>
                  <pubid idtype="doi">10.1128/JB.187.23.8020-8025.2005</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B52">
            <title>
               <p>Identification of amino acids and domains required for catalytic activity of DPPR synthase, a cell wall biosynthetic enzyme of <it>Mycobacterium tuberculosis</it></p>
            </title>
            <aug>
               <au>
                  <snm>Huang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Berg</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Spencer</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Vereecke</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>D'Haeze</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>McNeil</snm>
                  <fnm>MR</fnm>
               </au>
            </aug>
            <source>Microbiology</source>
            <pubdate>2008</pubdate>
            <volume>154</volume>
            <fpage>736</fpage>
            <lpage>743</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1099/mic.0.2007/013532-0</pubid>
                  <pubid idtype="pmpid" link="fulltext">18310020</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B53">
            <title>
               <p>Identification of a new inducible nodulation gene in <it>Azorhizobium caulinodans</it></p>
            </title>
            <aug>
               <au>
                  <snm>Goethals</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Mergaert</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Gao</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Geelen</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Van Montagu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Mol Plant-Microbe Interact</source>
            <pubdate>1992</pubdate>
            <volume>5</volume>
            <fpage>405</fpage>
            <lpage>411</lpage>
            <xrefbib>
               <pubid idtype="pmpid">1472718</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B54">
            <title>
               <p>Nod factors of <it>Azorhizobium caulinodans </it>strain ORS571 can be glycosylated with an arabinosyl group, a fucosyl group, or both</p>
            </title>
            <aug>
               <au>
                  <snm>Mergaert</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Ferro</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>D'Haeze</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Van Montagu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Holsters</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Prom&#233;</snm>
                  <fnm>J-C</fnm>
               </au>
            </aug>
            <source>Mol Plant-Microbe Interact</source>
            <pubdate>1997</pubdate>
            <volume>10</volume>
            <fpage>683</fpage>
            <lpage>687</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1094/MPMI.1997.10.5.683</pubid>
                  <pubid idtype="pmpid" link="fulltext">9204572</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B55">
            <title>
               <p>Biogenesis, architecture, and function of bacterial type IV secretion systems</p>
            </title>
            <aug>
               <au>
                  <snm>Christie</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Atmakuri</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Krishnamoorthy</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Jakubowski</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Cascales</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>Annu Rev Microbiol</source>
            <pubdate>2005</pubdate>
            <volume>59</volume>
            <fpage>451</fpage>
            <lpage>485</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1146/annurev.micro.58.030603.123630</pubid>
                  <pubid idtype="pmpid" link="fulltext">16153176</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B56">
            <title>
               <p>Proposed regulatory pathway encoded by the <it>nodV </it>and <it>nodW </it>genes, determinants of host specificity in <it>Bradyrhizobium japonicum</it></p>
            </title>
            <aug>
               <au>
                  <snm>G&#246;ttfert</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Grob</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Hennecke</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1990</pubdate>
            <volume>87</volume>
            <fpage>2680</fpage>
            <lpage>2684</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">53754</pubid>
                  <pubid idtype="pmpid" link="fulltext">2320582</pubid>
                  <pubid idtype="doi">10.1073/pnas.87.7.2680</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B57">
            <title>
               <p><it>Rhizobium leguminosarum </it>NodT is related to a family of outer-membrane transport proteins that includes TolC, PrtF, CyaE and AprF</p>
            </title>
            <aug>
               <au>
                  <snm>Rivilla</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Sutton</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Downie</snm>
                  <fnm>JA</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>1995</pubdate>
            <volume>161</volume>
            <fpage>27</fpage>
            <lpage>31</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0378-1119(95)00235-X</pubid>
                  <pubid idtype="pmpid" link="fulltext">7642132</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B58">
            <title>
               <p>Rhizobial factors required for stem nodule maturation and maintenance in <it>Sesbania rostrata </it>&#8211; <it>Azorhizobium caulinodans </it>ORS571 symbiosis</p>
            </title>
            <aug>
               <au>
                  <snm>Suzuki</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Aono</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>K-B</fnm>
               </au>
               <au>
                  <snm>Suzuki</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>C-T</fnm>
               </au>
               <au>
                  <snm>Miwa</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Wakao</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Iki</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Oyaizu</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Appl Environ Microbiol</source>
            <pubdate>2007</pubdate>
            <volume>73</volume>
            <fpage>6650</fpage>
            <lpage>6659</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">2075074</pubid>
                  <pubid idtype="pmpid" link="fulltext">17720818</pubid>
                  <pubid idtype="doi">10.1128/AEM.01514-07</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B59">
            <title>
               <p>Evidence for functional differentiation of duplicated <it>nifH </it>genes in <it>Azorhizobium caulinodans</it></p>
            </title>
            <aug>
               <au>
                  <snm>Iki</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Aono</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Oyaizu</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>FEMS Microbiol Lett</source>
            <pubdate>2007</pubdate>
            <volume>274</volume>
            <fpage>173</fpage>
            <lpage>179</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1574-6968.2007.00823.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">17651409</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B60">
            <title>
               <p>The genome of <it>Rhizobium leguminosarum </it>has recognizable core and accessory components</p>
            </title>
            <aug>
               <au>
                  <snm>Young</snm>
                  <fnm>JPW</fnm>
               </au>
               <au>
                  <snm>Crossman</snm>
                  <fnm>LC</fnm>
               </au>
               <au>
                  <snm>Johnston</snm>
                  <fnm>AWB</fnm>
               </au>
               <au>
                  <snm>Thomson</snm>
                  <fnm>NR</fnm>
               </au>
               <au>
                  <snm>Ghazoui</snm>
                  <fnm>ZF</fnm>
               </au>
               <au>
                  <snm>Hull</snm>
                  <fnm>KH</fnm>
               </au>
               <au>
                  <snm>Wexler</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Curson</snm>
                  <fnm>ARJ</fnm>
               </au>
               <au>
                  <snm>Todd</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Poole</snm>
                  <fnm>PS</fnm>
               </au>
               <au>
                  <snm>Mauchline</snm>
                  <fnm>TH</fnm>
               </au>
               <au>
                  <snm>East</snm>
                  <fnm>AK</fnm>
               </au>
               <au>
                  <snm>Quail</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Churcher</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Arrowsmith</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Cherevach</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Chillingworth</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Clarke</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Cronin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Davis</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Fraser</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Hance</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Hauser</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Jagels</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Moule</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Mungall</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Norbertczak</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Rabbinowitsch</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Sanders</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Simmonds</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Whitehead</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Parkhill</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <fpage>R34.1</fpage>
            <lpage>R34.20</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1186/gb-2006-7-4-r34</pubid>
                  <pubid idtype="pmpid" link="fulltext">16640791</pubid>
                  <pubid idtype="pmcid">1557990</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B61">
            <title>
               <p>Three phylogenetic groups of <it>nodA </it>and <it>nifH </it>genes in <it>Sinorhizobium </it>and <it>Mesorhizobium </it>isolates from leguminous trees growing in Africa and Latin America</p>
            </title>
            <aug>
               <au>
                  <snm>Haukka</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Lindstr&#246;m</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>JPW</fnm>
               </au>
            </aug>
            <source>Appl Environ Microbiol</source>
            <pubdate>1998</pubdate>
            <volume>64</volume>
            <fpage>419</fpage>
            <lpage>426</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">106060</pubid>
                  <pubid idtype="pmpid" link="fulltext">9464375</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B62">
            <title>
               <p>DNA sequence of the common nodulation genes of <it>Bradyrhizobium elkanii </it>and their phylogenetic relationship to those of other nodulating bacteria</p>
            </title>
            <aug>
               <au>
                  <snm>Dobert</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Breil</snm>
                  <fnm>BT</fnm>
               </au>
               <au>
                  <snm>Triplett</snm>
                  <fnm>EW</fnm>
               </au>
            </aug>
            <source>Mol Plant-Microbe Interact</source>
            <pubdate>1994</pubdate>
            <volume>7</volume>
            <fpage>564</fpage>
            <lpage>572</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmpid">7949325</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B63">
            <title>
               <p>Phylogeny of Sym plasmids of rhizobia by PCR-based sequencing of a <it>nodC </it>segment</p>
            </title>
            <aug>
               <au>
                  <snm>Ueda</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Suga</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Yahiro</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Matsuguchi</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1995</pubdate>
            <volume>177</volume>
            <fpage>468</fpage>
            <lpage>472</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">176613</pubid>
                  <pubid idtype="pmpid" link="fulltext">7814339</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B64">
            <title>
               <p>A locus encoding host range is linked to the common nodulation genes of <it>Bradyrhizobium japonicum</it></p>
            </title>
            <aug>
               <au>
                  <snm>Nieuwkoop</snm>
                  <fnm>AJ</fnm>
               </au>
               <au>
                  <snm>Banfalvi</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Deshmane</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Gerhold</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Schell</snm>
                  <fnm>MG</fnm>
               </au>
               <au>
                  <snm>Sirotkin</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Stacey</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1987</pubdate>
            <volume>169</volume>
            <fpage>2631</fpage>
            <lpage>2638</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">212140</pubid>
                  <pubid idtype="pmpid" link="fulltext">3584066</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B65">
            <title>
               <p>Identification of <it>nodS </it>and <it>nodU</it>, two inducible genes inserted between the <it>Bradyrhizobium japonicum nodYABC </it>and <it>nodIJ </it>genes</p>
            </title>
            <aug>
               <au>
                  <snm>G&#246;ttfert</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hitz</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Hennecke</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Mol Plant-Microbe Interact</source>
            <pubdate>1990</pubdate>
            <volume>3</volume>
            <fpage>308</fpage>
            <lpage>316</lpage>
            <xrefbib>
               <pubid idtype="pmpid">2134855</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B66">
            <title>
               <p>Specific flavonoids stimulate intercellular colonization of non-legumes by <it>Azorhizobium caulinodans</it></p>
            </title>
            <aug>
               <au>
                  <snm>Gough</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Webster</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Vasse</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Galera</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Batchelor</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>O'Callaghan</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Davey</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kothari</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>D&#233;nari&#233;</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Cocking</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>The Biology of Plant-Microbe Interactions</source>
            <publisher>St. Paul: International Society of Plant-Microbe Interactions</publisher>
            <editor>Stacey G, Mullin B, Gresshoff P</editor>
            <pubdate>1996</pubdate>
            <fpage>409</fpage>
            <lpage>415</lpage>
         </bibl>
         <bibl id="B67">
            <title>
               <p>Survival of <it>Azorhizobium caulinodans </it>in the soil and rhizosphere of wetland rice under <it>Sesbania rostrata</it>-rice rotation</p>
            </title>
            <aug>
               <au>
                  <snm>Ladha</snm>
                  <fnm>JK</fnm>
               </au>
               <au>
                  <snm>Garcia</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Miyan</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Padre</snm>
                  <fnm>AT</fnm>
               </au>
               <au>
                  <snm>Watanabe</snm>
                  <fnm>I</fnm>
               </au>
            </aug>
            <source>Appl Environ Microbiol</source>
            <pubdate>1989</pubdate>
            <volume>55</volume>
            <fpage>454</fpage>
            <lpage>460</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">184130</pubid>
                  <pubid idtype="pmpid" link="fulltext">16347853</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B68">
            <title>
               <p>Establishment of <it>Azorhizobium caulinodans </it>in the rhizosphere of wetland rice (<it>Oryza sativa </it>L.)</p>
            </title>
            <aug>
               <au>
                  <snm>Van Nieuwenhove</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>van Holm</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Kulasooriya</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Vlassak</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>Biol Fertil Soils</source>
            <pubdate>2000</pubdate>
            <volume>31</volume>
            <fpage>143</fpage>
            <lpage>149</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1007/s003740050637</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B69">
            <title>
               <p>Assembling genomic DNA sequences with PHRAP</p>
            </title>
            <aug>
               <au>
                  <snm>de la Bastide</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>McCombie</snm>
                  <fnm>WR</fnm>
               </au>
            </aug>
            <source>Current Protocols in Bioinformatics</source>
            <publisher>New York: John Wiley &amp; Sons</publisher>
            <editor>Baxevanis AD</editor>
            <pubdate>2007</pubdate>
            <issue>Supplement 17</issue>
            <note>Unit 11.4.</note>
         </bibl>
         <bibl id="B70">
            <title>
               <p>Base-calling of automated sequencer traces using <it>Phred</it>. I. Accuracy assessment</p>
            </title>
            <aug>
               <au>
                  <snm>Ewing</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Hillier</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Wendl</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>175</fpage>
            <lpage>185</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521921</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B71">
            <title>
               <p>Base-calling of automated sequencer traces using <it>phred</it>. II. Error probabilities</p>
            </title>
            <aug>
               <au>
                  <snm>Ewing</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>186</fpage>
            <lpage>194</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521922</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B72">
            <title>
               <p>Improved microbial gene identification with GLIMMER</p>
            </title>
            <aug>
               <au>
                  <snm>Delcher</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Harmon</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Kasif</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1999</pubdate>
            <volume>27</volume>
            <fpage>4636</fpage>
            <lpage>4641</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">148753</pubid>
                  <pubid idtype="pmpid" link="fulltext">10556321</pubid>
                  <pubid idtype="doi">10.1093/nar/27.23.4636</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B73">
            <title>
               <p>Basic local alignment search tool</p>
            </title>
            <aug>
               <au>
                  <snm>Altschul</snm>
                  <fnm>SF</fnm>
               </au>
               <au>
                  <snm>Gish</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Myers</snm>
                  <fnm>EW</fnm>
               </au>
               <au>
                  <snm>Lipman</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>1990</pubdate>
            <volume>215</volume>
            <fpage>403</fpage>
            <lpage>410</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">2231712</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B74">
            <title>
               <p>The MetaCyc database</p>
            </title>
            <aug>
               <au>
                  <snm>Karp</snm>
                  <fnm>PD</fnm>
               </au>
               <au>
                  <snm>Riley</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Paley</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Pellegrini-Toole</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2002</pubdate>
            <volume>30</volume>
            <fpage>59</fpage>
            <lpage>61</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">99148</pubid>
                  <pubid idtype="pmpid" link="fulltext">11752254</pubid>
                  <pubid idtype="doi">10.1093/nar/30.1.59</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B75">
            <title>
               <p>The NCBI Microbial Genome Resource Database</p>
            </title>
            <url>http://www.ncbi.nlm.nih.gov/genomes/MICROBES/microbial_taxtree.html</url>
         </bibl>
         <bibl id="B76">
            <title>
               <p>A simple, fast, and accurate algorithm to estimate large phylogenies by maximum likelihood</p>
            </title>
            <aug>
               <au>
                  <snm>Guindon</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Gascuel</snm>
                  <fnm>O</fnm>
               </au>
            </aug>
            <source>Syst Biol</source>
            <pubdate>2003</pubdate>
            <volume>52</volume>
            <fpage>696</fpage>
            <lpage>704</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1080/10635150390235520</pubid>
                  <pubid idtype="pmpid">14530136</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B77">
            <title>
               <p>A general empirical model of protein evolution derived from multiple protein families using a maximum-likelihood approach</p>
            </title>
            <aug>
               <au>
                  <snm>Whelan</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Goldman</snm>
                  <fnm>N</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2001</pubdate>
            <volume>18</volume>
            <fpage>691</fpage>
            <lpage>699</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11319253</pubid>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>
