<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1471-2164-7-173</ui>
   <ji>1471-2164</ji>
   <fm>
      <dochead>Research article</dochead>
      <bibl>
         <title>
            <p>Complete genome sequence of <it>Shigella flexneri </it>5b and comparison with <it>Shigella flexneri </it>2a</p>
         </title>
         <aug>
            <au id="A1" ce="yes">
               <snm>Nie</snm>
               <fnm>Huan</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>nh121212@hotmail.com</email>
            </au>
            <au id="A2" ce="yes">
               <snm>Yang</snm>
               <fnm>Fan</fnm>
               <insr iid="I2"/>
               <email>ymf129@vip.sina.com</email>
            </au>
            <au id="A3" ce="yes">
               <snm>Zhang</snm>
               <fnm>Xiaobing</fnm>
               <insr iid="I2"/>
               <email>bbbzhang@sina.com</email>
            </au>
            <au id="A4" ce="yes">
               <snm>Yang</snm>
               <fnm>Jian</fnm>
               <insr iid="I2"/>
               <email>yang@chgb.org.cn</email>
            </au>
            <au id="A5">
               <snm>Chen</snm>
               <fnm>Lihong</fnm>
               <insr iid="I2"/>
               <email>chen@chgb.org.cn</email>
            </au>
            <au id="A6">
               <snm>Wang</snm>
               <fnm>Jing</fnm>
               <insr iid="I2"/>
               <email>wwangjing@gmail.com</email>
            </au>
            <au id="A7">
               <snm>Xiong</snm>
               <fnm>Zhaohui</fnm>
               <insr iid="I2"/>
               <email>xiongsimon@163.com</email>
            </au>
            <au id="A8">
               <snm>Peng</snm>
               <fnm>Junping</fnm>
               <insr iid="I2"/>
               <email>pengjp@hotmail.com</email>
            </au>
            <au id="A9">
               <snm>Sun</snm>
               <fnm>Lilian</fnm>
               <insr iid="I2"/>
               <email>ll_sun@btamail.net.cn</email>
            </au>
            <au id="A10">
               <snm>Dong</snm>
               <fnm>Jie</fnm>
               <insr iid="I2"/>
               <email>zhh@crland.com.cn</email>
            </au>
            <au id="A11">
               <snm>Xue</snm>
               <fnm>Ying</fnm>
               <insr iid="I2"/>
               <email>yylhu@sina.com</email>
            </au>
            <au id="A12">
               <snm>Xu</snm>
               <fnm>Xingye</fnm>
               <insr iid="I2"/>
               <email>xyz810214@sina.com</email>
            </au>
            <au id="A13">
               <snm>Chen</snm>
               <fnm>Shuxia</fnm>
               <insr iid="I2"/>
               <email>chenshuxia_2005@163.com</email>
            </au>
            <au id="A14">
               <snm>Yao</snm>
               <fnm>Zhijian</fnm>
               <insr iid="I3"/>
               <email>yaozj@mx.cei.gov.cn</email>
            </au>
            <au id="A15">
               <snm>Shen</snm>
               <fnm>Yan</fnm>
               <insr iid="I3"/>
               <email>sheny@cdm.imicams.ac.cn</email>
            </au>
            <au id="A16" ca="yes">
               <snm>Jin</snm>
               <fnm>Qi</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <insr iid="I4"/>
               <email>zdsys@sina.com</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>College of Biological Sciences China Agricultural University, Beijing 100094, China</p>
            </ins>
            <ins id="I2">
               <p>State Key Laboratory for Molecular Virology and Genetic Engineering, Beijing 100052, China</p>
            </ins>
            <ins id="I3">
               <p>National Center of Human Genome Research, Beijing 100176, China</p>
            </ins>
            <ins id="I4">
               <p>Institute of Pathogen Biology, Chinese Academy of Medical Sciences, Beijing 100730, China</p>
            </ins>
         </insg>
         <source>BMC Genomics</source>
         <issn>1471-2164</issn>
         <pubdate>2006</pubdate>
         <volume>7</volume>
         <issue>1</issue>
         <fpage>173</fpage>
         <url>http://www.biomedcentral.com/1471-2164/7/173</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">16822325</pubid>
               <pubid idtype="doi">10.1186/1471-2164-7-173</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>28</day>
               <month>2</month>
               <year>2006</year>
            </date>
         </rec>
         <acc>
            <date>
               <day>06</day>
               <month>7</month>
               <year>2006</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>06</day>
               <month>7</month>
               <year>2006</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2006</year>
         <collab>Nie et al; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p><it>Shigella </it>bacteria cause dysentery, which remains a significant threat to public health. <it>Shigella flexneri </it>is the most common species in both developing and developed countries. Five <it>Shigella </it>genomes have been sequenced, revealing dynamic and diverse features. To investigate the intra-species diversity of <it>S. flexneri </it>genomes further, we have sequenced the complete genome of <it>S. flexneri </it>5b strain 8401 (abbreviated Sf8401) and compared it with <it>S. flexneri </it>2a (Sf301).</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>The Sf8401 chromosome is 4.5-Mb in size, a little smaller than that of Sf301, mainly because the former lacks the SHI-1 pathogenicity island (PAI). Compared with Sf301, there are 6 inversions and one translocation in Sf8401, which are probably mediated by insertion sequences (IS). There are clear differences in the known PAIs between these two genomes. The bacteriophage SfV segment remaining in SHI-O of Sf8401 is clearly larger than the remnants of bacteriophage SfII in Sf301. SHI-1 is absent from Sf8401 but a specific related protein is found next to the <it>pheV </it>locus. SHI-2 is involved in one intra-replichore inversion near the origin of replication, which may change the expression of <it>iut/iuc </it>genes. Moreover, genes related to the glycine-betaine biosynthesis pathway are present only in Sf8401 among the known <it>Shigella </it>genomes.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>Our data show that the two <it>S. flexneri </it>genomes are very similar, which suggests a high level of structural and functional conservation between the two serotypes. The differences reflect different selection pressures during evolution. The ancestor of <it>S. flexneri </it>probably acquired SHI-1 and SHI-2 before SHI-O was integrated and the serotypes diverged. SHI-1 was subsequently deleted from the <it>S. flexneri </it>5b genome by recombination, but stabilized in the <it>S. flexneri </it>2a genome. These events may have contributed to the differences in pathogenicity and epidemicity between the two serotypes of <it>S. flexneri</it>.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="bmc" subtype="user_supplied_xml" id="endnote"/>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p><it>Shigella </it>species that cause bacillary dysentery or shigellosis are Gram-negative, non-sporulating, facultative anaerobes, and the disease remains a major worldwide health problem. An estimated annual infection of 160 million individuals, with 1.1 million deaths, most of them children under 5 years old in developing countries, occurs with shigellosis <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. The poor sanitary conditions prevalent in these areas contribute to the spread of the bacteria, and the expense of antibiotics and increasing antibiotic resistance complicate treatment <abbrgrp><abbr bid="B2">2</abbr></abbrgrp>.</p>
         <p><it>Shigella </it>was recognized as the etiological agent of bacillary dysentery in the 1890s. It was adopted as a genus in the 1950s and sub-divided into 4 species: <it>S. dysenteriae, S. flexneri, S. boydii and S. sonnei </it><abbrgrp><abbr bid="B3">3</abbr></abbrgrp>. According to this taxonomy,<it>S. flexneri </it>is classified into 6 serotypes (including 13 subtypes). Most previous work on the molecular pathogenesis of <it>Shigella </it>has been carried out in <it>S. flexneri </it>serotypes 2a and 5.</p>
         <p>In China, <it>S. flexneri </it>2a is a hyperendemic species and is responsible for approximately 50&#8211;70% of >10 million cases per year, most of them associated with epidemic and pandemic shigellosis <abbrgrp><abbr bid="B4">4</abbr></abbrgrp>. <it>Shigella </it>pathologically invades the intestinal epithelial cells, resulting in an intense inflammatory reaction characterized by abscess formation and ulceration. All <it>Shigella </it>strains contain a large virulence plasmid that is known to encode genes necessary and sufficient for invasion <abbrgrp><abbr bid="B5">5</abbr></abbrgrp>. The virulence plasmid from <it>S. flexneri </it>serotype 2a diverges slightly from serotype 5a <abbrgrp><abbr bid="B5">5</abbr></abbrgrp>, but the epidemicities of the two serotypes differ markedly. Chromosomal genes present in "pathogenicity islands" usually participate in the pathogenic process directly, or contribute to survival in the host environments during infection <abbrgrp><abbr bid="B6">6</abbr><abbr bid="B7">7</abbr><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr></abbrgrp>, and the expression of virulence depends on a complex regulation mechanism that involves dialog between the chromosome and the virulence plasmid <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>.</p>
         <p>We and others have previously sequenced two genomes of the most prevalent species <it>S. flexneri </it>2a (strains Sf301 and 2457T) and also completed the genomes from the other three species of <it>Shigella </it><abbrgrp><abbr bid="B12">12</abbr><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr></abbrgrp>. All these genomes show that the extensive diversity of <it>Shigella </it>is perhaps attributable to the fact that the bacteria evolved from different strains of <it>E. coli </it>and became highly specific human pathogens through convergent evolution. A better understanding of the intra-species diversity of <it>Shigella </it>requires the availability of more whole genome sequences.</p>
         <p>We present here the complete genome sequence of <it>S. flexneri </it>5b Sf8401 and a comparison with the <it>S. flexneri </it>2a Sf301 genome, which reveals differences in the pathogenicity islands and chromosomal rearrangements between different serotypes of this species. The comparison will facilitate understanding of the common biological processes required for infection and identify unique properties that may differentiate between them in respect of epidemicity and pathogenicity, even if the virulence plasmid is closely similar. Moreover, the comparison will provide some insight into how these pathogens have evolved.</p>
      </sec>
      <sec>
         <st>
            <p>Results and discussion</p>
         </st>
         <sec>
            <st>
               <p>General features</p>
            </st>
            <p>In common with other reported <it>Shigella </it>strains, the genome of Sf8401 contains a circular chromosome. Since the complete sequences of pWR501 and pWR100 are known <abbrgrp><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr></abbrgrp>, we present here only the chromosome sequence, which is 4,574,284 bp in length with an average GC content of 50.92% and encodes 97 tRNA genes (Table <tblr tid="T1">1</tblr>, <supplr sid="S1">Additional file 1</supplr>). Its size is a little smaller than that of Sf301, mainly because SHI-1 is absent (see below). Sf8401 has 7 rRNA operons, with 4 copies in one replichore and 3 in the other, while Sf301 has 5 copies in one replichore and 2 in the other. These result from one intra-replichore inversion near the replication origin (Fig. <figr fid="F1">1</figr>). Comparison of Sf8401 with Sf301 reveals that more than 97% of the genome sequence is shared between the two strains. The architecture of the Sf8401 genome is similar to Sf301 but the overall colinearity is broken by 7 translocations and inversions involving DNA segments >5 kb (Fig. <figr fid="F1">1</figr>). Among the 4194 proteomes of MG1655, 3098 proteins (74%) are shared by Sf8401 and Sf301 and may be regarded as the "backbone" of <it>S. flexneri </it>(<supplr sid="S2">Additional file 2</supplr>), while 114 are pseudogenes in both genomes. Two hundred and sixty-six of the 1096 non-backbone proteins were predicted to be metabolism-related by the Clusters of Orthologous Groups (COGs) database. This reflects the evolution of <it>S. flexneri </it>from a non-pathogenic <it>E. coli </it>ancestor to a facultative intracellular pathogen. Among the 393 Sf8401 specific proteins (compared with MG1655) only 28 are specific to all known <it>Shigella </it>genomes; most of them are bacteriophage-related proteins or hypothetical proteins (<supplr sid="S3">Additional file 3</supplr>).</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>General features of the <it>Shigella </it>genomes compared with the genome of <it>E. coli </it>K12 MG1655</p>
               </caption>
               <tblbdy cols="7">
                  <r>
                     <c ca="center">
                        <p>
                           <b>Chromosome</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>MG1655*</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Sd197&#8224; </b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Sf301&#8224; </b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Sf8401</b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Sb227&#8224; </b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Ss046&#8224; </b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="7">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>Total length (bp)</p>
                     </c>
                     <c ca="center">
                        <p>4,639,675</p>
                     </c>
                     <c ca="center">
                        <p>4,369,232</p>
                     </c>
                     <c ca="center">
                        <p>4,607,203</p>
                     </c>
                     <c ca="center">
                        <p>4,574,284</p>
                     </c>
                     <c ca="center">
                        <p>4,519,823</p>
                     </c>
                     <c ca="center">
                        <p>4,825,265</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>No. of total ORFs</p>
                     </c>
                     <c ca="center">
                        <p>4,254</p>
                     </c>
                     <c ca="center">
                        <p>4,557</p>
                     </c>
                     <c ca="center">
                        <p>4,434</p>
                     </c>
                     <c ca="center">
                        <p>4,316</p>
                     </c>
                     <c ca="center">
                        <p>4,353</p>
                     </c>
                     <c ca="center">
                        <p>4,434</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>No. of pseudogenes</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                     <c ca="center">
                        <p>285</p>
                     </c>
                     <c ca="center">
                        <p>254</p>
                     </c>
                     <c ca="center">
                        <p>198</p>
                     </c>
                     <c ca="center">
                        <p>217</p>
                     </c>
                     <c ca="center">
                        <p>210</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>Percentage of CDS (%)</p>
                     </c>
                     <c ca="center">
                        <p>87.3</p>
                     </c>
                     <c ca="center">
                        <p>77.2</p>
                     </c>
                     <c ca="center">
                        <p>80.4</p>
                     </c>
                     <c ca="center">
                        <p>80.8</p>
                     </c>
                     <c ca="center">
                        <p>80.5</p>
                     </c>
                     <c ca="center">
                        <p>80.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>G+C content (%)</p>
                     </c>
                     <c ca="center">
                        <p>50.79</p>
                     </c>
                     <c ca="center">
                        <p>51.25</p>
                     </c>
                     <c ca="center">
                        <p>50.89</p>
                     </c>
                     <c ca="center">
                        <p>50.92</p>
                     </c>
                     <c ca="center">
                        <p>51.21</p>
                     </c>
                     <c ca="center">
                        <p>51.01</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>No. of 16S/23S/5S</p>
                     </c>
                     <c ca="center">
                        <p>7/7/8</p>
                     </c>
                     <c ca="center">
                        <p>7/7/8</p>
                     </c>
                     <c ca="center">
                        <p>7/7/8</p>
                     </c>
                     <c ca="center">
                        <p>7/7/8</p>
                     </c>
                     <c ca="center">
                        <p>7/7/8</p>
                     </c>
                     <c ca="center">
                        <p>7/7/8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>No. transfer RNA</p>
                     </c>
                     <c ca="center">
                        <p>86</p>
                     </c>
                     <c ca="center">
                        <p>85</p>
                     </c>
                     <c ca="center">
                        <p>97</p>
                     </c>
                     <c ca="center">
                        <p>97</p>
                     </c>
                     <c ca="center">
                        <p>91</p>
                     </c>
                     <c ca="center">
                        <p>97</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>IS elements (percentage)</p>
                     </c>
                     <c ca="center">
                        <p>44 (1%)</p>
                     </c>
                     <c ca="center">
                        <p>623 (12%)</p>
                     </c>
                     <c ca="center">
                        <p>314 (7%)</p>
                     </c>
                     <c ca="center">
                        <p>278 (6.3%)</p>
                     </c>
                     <c ca="center">
                        <p>403 (9%)</p>
                     </c>
                     <c ca="center">
                        <p>394 (8%)</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>* Data are obtained from a recently updated version of U00096.</p>
                  <p>&#8224; Data are obtained from ref.[14].</p>
               </tblfn>
            </tbl>
            <suppl id="S1">
               <title>
                  <p>Additional file 1</p>
               </title>
               <text>
                  <p><b>Circular genome map of the Sf8401 genome</b>. The outer scale is marked every 200 kb. Circles range from 1 (outer circle) to 9 (inner circle). Circles 1 and 2, ORFs encoded by leading and lagging strands respectively, with color code for functions: salmon, translation, ribosomal structure and biogenesis; light blue, transcription; cyan, DNA replication, recombination and repair; turquoise, cell division; deep pink, post-translational modification, protein turnover and chaperones; olive drab, cell envelope biogenesis; purple, cell motility and secretion; forest green, inorganic ion transport and metabolism; magenta, signal transduction; red, energy production; sienna, carbohydrate transport and metabolism; yellow, amino acid transport; orange, nucleotide transport and metabolism; gold, co-enzyme transport and metabolism; dark blue, lipid metabolism; blue, secondary metabolites, transport and catabolism; gray, general function prediction only; black, function unclassified or unknown. Circle 3, distribution of pseudogenes. Circles 4 and 5, distributions of IS1/IS1N and other IS-species respectively. Circles 6 and 7, G+C content and GC skew (G-C/G+C) respectively with a window size of 10 kb. Circles 8 and 9, distributions of tRNA genes and <it>rrn </it>operons respectively. The replication origin and terminus are indicated.</p>
               </text>
               <file name="1471-2164-7-173-S1.jpeg">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Global comparison of Sf8401 chromosome with Sf301</p>
               </caption>
               <text>
                  <p><b>Global comparison of Sf8401 chromosome with Sf301</b>. Each marker length denotes 300 kb for chromosome comparisons. Color code denotes maximal length of the paired segments: red, >10 kb; blue, 5~10 kb; cyan, 1~5 kb. The inversion is abbreviated to IV.</p>
               </text>
               <graphic file="1471-2164-7-173-1"/>
            </fig>
            <suppl id="S2">
               <title>
                  <p>Additional file 2</p>
               </title>
               <text>
                  <p><b>Orthologs of the MG1655 proteomes in Sf8401 and Sf301</b>. 4194 proteins of MG1655 are selected to study their orthologs in Sf8401 and Sf301.</p>
               </text>
               <file name="1471-2164-7-173-S2.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S3">
               <title>
                  <p>Additional file 3</p>
               </title>
               <text>
                  <p><b>Orthologs of Sf8401 specific proteins (relative to MG1655) in other <it>Shigella </it>genomes</b>. This gives the full list of 393 Sf8401-specific proteins relative to MG1655 and their orthologs in other <it>Shigella </it>genomes.</p>
               </text>
               <file name="1471-2164-7-173-S3.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>IS elements are ubiquitous in bacterial genomes and important factors in evolution <abbrgrp><abbr bid="B17">17</abbr></abbrgrp>. The IS insertion can cause gene inactivation, activate cryptic genes or alter the expression of adjacent genes <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>. The numbers and species of IS elements in the Sf8401 genome are similar to previously-determined <it>Shigella </it>genomes. In total, the IS elements encode 485 ORFs and make up 6.37% (291.3 kb) of the chromosome, and the predominant species is IS1. A distinct difference is that Sf301 has 13 copies of iso-IS10R, while Sf8401 and other sequenced <it>Shigella </it>chromosomes have not. This might be used as a marker for epidemiological studies. Furthermore, IS elements are capable of causing various genetic rearrangements such as deletions, inversions and translocations <abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr></abbrgrp>. Unlike the inversion reported in <it>Yersinia pestis </it><abbrgrp><abbr bid="B21">21</abbr></abbrgrp>, <it>S. enterica serovar </it>Typhi <abbrgrp><abbr bid="B22">22</abbr></abbrgrp> and <it>E. coli </it>K-12 strain W3110 <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B23">23</abbr></abbrgrp>, which are associated with rRNA homologies, inversions in Sf8401 are probably mediated by IS elements. Inversions 1 and 5 (Fig. <figr fid="F1">1</figr>) occur around SHI-O and SHI-2, which are mediated by IS629 and IS1. Besides these major inversions, there are other four inverted regions, inversions 2, 3, 4 and 6 (Fig. <figr fid="F1">1</figr>), which are probably mediated by IS4, IS<it>Sfl2</it>, IS600 and IS1 respectively.</p>
         </sec>
         <sec>
            <st>
               <p>Diversity of SHI-O</p>
            </st>
            <p>LPS is an important virulence factor in <it>Shigella </it><abbrgrp><abbr bid="B24">24</abbr></abbrgrp>. Since the immune response to <it>Shigella </it>spp. is O-antigen specific, an immune response to a specific O antigen does not protect against infection with other serotypes. Therefore, the capacity to alter serotypes may be advantageous for <it>Shigella </it>spp. in the infectious process <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. In Sf8401, the serotype conversion region, i.e. SHI-O <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>, is located around 300 kb (Fig. <figr fid="F1">1</figr>). In SHI-O the 3 genes termed <it>gtrA</it>, <it>gtrB </it>and <it>gtrV </it>(a serotype-specific glycosyltransferase) are putatively involved in glucosylation reactions <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>. The mean GC content of <it>gtrA </it>and <it>gtrB </it>is 42.71%, and the GC content of <it>gtrV </it>is 32.99%. All three are lower than the whole genome GC content (50.92%). Compared with Sf301, <it>gtrA </it>and <it>gtrB </it>are highly conserved and interchangeable among serotypes, whereas <it>gtr </it>(serotype) appears to be unique to each bacteriophage <abbrgrp><abbr bid="B28">28</abbr><abbr bid="B29">29</abbr></abbrgrp>, which indicates that these genes have been acquired from lysogeny caused by bacteriophages.</p>
            <p>The SHI-O component differs between Sf301 and Sf8401 (Fig. <figr fid="F2">2a</figr>). Although type II antigen is encoded by an inducible bacteriophage, SfII <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>, little genomic sequence of bacteriophage SfII remains in the SHI-O of 2457T and Sf301 except the key genes related to antigenic variation <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>. However, the Sf8401 SHI-O includes not only the type V antigen gene, which comes from bacteriophage SfV, but also another 15 kb segment of bacteriophage SfV <abbrgrp><abbr bid="B27">27</abbr><abbr bid="B31">31</abbr></abbrgrp>.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Localized comparison of (a) SHI-O, (b) SHI-1, (c) SHI-2</p>
               </caption>
               <text>
                  <p><b>Localized comparison of (a) SHI-O, (b) SHI-1, (c) SHI-2</b>. Arrows indicate predicted ORFs in both strands. The direction of each arrow predicts the direction of transcription. Color code denotes maximal length of the paired segments: red, >10 kb; blue, 5~10 kb cyan; 1~5 kb. (a) The dark green block refers to a large region of bacteriophage SfV in the Sf8401 genome. (b) The yellow block refers to the 22 bp partial repeat sequence of <it>pheV</it>. Black indicates the 12 kb sequence downstream of SHI-1 in Sf301, which does not exist in Sf8401. The asterisk denotes a pseudogene. (c) The replication origin, <it>ori</it>, is indicated by a vertical arrow in each genome. The green block refers to the region that is colinear with the Sf301 genome.</p>
               </text>
               <graphic file="1471-2164-7-173-2"/>
            </fig>
            <p>Temperate bacteriophages of <it>S. flexneri </it>play an important role in serotype conversion. Bacteriophages SfV and SfII encode the factors involved in glucosylation of the O-antigen, and lysogenization results in conversion of serotype Y strains to serotypes 5 and 2 <abbrgrp><abbr bid="B27">27</abbr><abbr bid="B30">30</abbr></abbrgrp>. The defining point for evolution of <it>S. flexneri </it>2 and 5 from the <it>S. flexneri </it>ancestor is probably the acquisition of the precursor of the current-day O-antigen modification genes. It can be supposed that the <it>S. flexneri </it>ancestor acquired diverse O-antigen modification genes along with related bacteriophage sequences when the bacteriophages were integrated into the bacterial genomes. The genome rearrangements caused by IS elements in far-flung evolutional processes have interrupted these bacteriophage sequences in many <it>Shigella </it>genomes. However, there are ~15 kb of bacteriophage SfV sequence remnants in Sf8401, though far less bacteriophage SfII sequence has remained in Sf301. This might be because the Sf8401 genome is less dynamic than that of Sf301, or alternatively, it may suggest that Sf8401 arose later than Sf301. This hypothesis requires further investigation.</p>
         </sec>
         <sec>
            <st>
               <p>Absence of SHI-1</p>
            </st>
            <p><it>Shigella </it>pathogenicity island SHI-1 encodes three characterized proteins: SigA, Pic and the enterotoxin ShET1. Functional analysis shows that SigA is cytopathic for HEp-2 cells and at least partly responsible for the ability of <it>S. flexneri </it>to stimulate fluid accumulation in ligated rabbit ileal loops <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>. The Pic protein, a serine protease, is involved in mucinase activity, serum resistance and hemagglutination <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>. Furthermore, ShET1 encoded by <it>set1A </it>and <it>set1B </it>could increase fluid accumulation in the rabbit loop model.</p>
            <p>SHI-1 is located directly downstream of the <it>pheV </it>tRNA gene and includes an imperfect repeat of the 3'-end 22 bp of the <it>pheV </it>gene at the right boundary in Sf301 (Fig. <figr fid="F2">2b</figr>). Studies of SHI-1 distribution (<it>she </it>PAI) show that intact SHI-1 is present in all tested serotype 2a strains of <it>S. flexneri </it>but absent from some <it>S. flexneri </it>serotype strains such as 1a, 1b, 3b, 4 and 5 <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>. It is therefore not surprising that SHI-1 is wholly absent from Sf8401. However, the homolog of SF3004, a hypothetical protein located downstream of SHI-1 in Sf301, is situated next to the <it>pheV </it>gene in Sf8401 (SFV3027). Further investigation shows that the homolog of SF3004 is only present adjacent to SHI-1 in the Sf301 and 2457T genomes and the <it>S. flexneri </it>2a <it>she </it>pathogenicity island <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>. So the presence of SFV3027 suggests that Sf8401 might have contained SHI-1 during its evolutionary history but lost it for unknown reasons. Sakellaris et al. <abbrgrp><abbr bid="B33">33</abbr></abbrgrp> demonstrated that the spontaneous and precise excision of SHI-1 can occur via recombination between a 22 bp sequence at the 3' terminus of <it>pheV </it>and an imperfect direct repeat at the <it>pheV</it>-distal boundary of the SHI-1. Thus, we have probably witnessed the case in Sf8401. Undoubtedly, the mechanism by which SHI-1 is stabilized in <it>S. flexneri </it>2a strains will be an interesting focus for further studies.</p>
         </sec>
         <sec>
            <st>
               <p>Inversion of SHI-2</p>
            </st>
            <p>SHI-2 encodes the synthesis and transport of aerobactin, a hydroxamate siderophore associated with increased virulence in enteric bacteria <abbrgrp><abbr bid="B10">10</abbr><abbr bid="B34">34</abbr></abbrgrp>, and is located downstream of the <it>selC </it>tRNA gene in Sf8401. The conservation of the component, organization and integration site of SHI-2 in Sf301 and Sf8401 implies that it was acquired by the <it>S. flexneri </it>ancestor before the serotypes diverged. However, the <it>iut</it>/<it>iuc </it>operon is located on the leading strand and on the counter-clockwise site of the replication origin in Sf301, but on the lagging strand and on the clockwise site in Sf8401 (Fig. <figr fid="F2">2c</figr>). Our previous genome studies revealed that SHI-2 in <it>S. sonnei </it>Ss046 was unlinked with the <it>selC </it>gene by an inversion, and SHI-3 of <it>S. boydii </it>Sb227 that carries a similar <it>iut</it>/<it>iuc </it>operon is linked with the <it>pheU </it>tRNA locus <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>. So in view of this information, the observation that the <it>iut</it>/<it>iuc </it>operon can inserted into a variety of different loci suggests that it is highly mobile and may be acquired by additional human or animal pathogens <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>.</p>
            <p>In Sf8401, SHI-2 is involved in inversion 5 that spans <it>oriC </it>(Fig. <figr fid="F1">1</figr>). All sequenced <it>Shigella </it>chromosomes have inversions at <it>oriC </it>and <it>terC</it>, which is suggested to be a common evolutionary feature of bacterial genomes <abbrgrp><abbr bid="B35">35</abbr></abbrgrp>. In contrast to Sf301, inversion 5 is found from 3597 to 4100 kb in Sf8401, which appears to be mediated by the boundary IS1 copies in Sf8401 (Fig. <figr fid="F2">2c</figr>). However, the ~22 kb center region of inversion 5 that covers <it>oriC </it>retains colinearity with that of Sf301 (Fig. <figr fid="F2">2c</figr>; the block colored green). Since this region is sandwiched between two copies of IS4, it implies that two or more inversions have occurred: an inversion was followed by a re-inversion to restore colinearity.</p>
            <p>Inversions can produce an "X" shape, which changes the positions of these sequences from their natural locations <abbrgrp><abbr bid="B35">35</abbr></abbrgrp>, and the distance from the <it>iut/iuc </it>operon to <it>oriC </it>in Sf8401 is different from that in Sf301 due to inversion 5 and the internal re-inversion mentioned above. Owing to bidirectional replication, there are extra copies of genes close to <it>oriC</it>, resulting in increased gene expression <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>, and since dosage differences may cause the strengths of promoters to be evolutionarily optimized for their specific positions, cells in which genes are a different distance from <it>oriC </it>are at a selective disadvantage <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>. Hence, whether the change in position of the <it>iut/iuc </it>operon in Sf8401 has any influence on expression needs to be determined.</p>
         </sec>
         <sec>
            <st>
               <p>Differences among genes correlated with metabolism</p>
            </st>
            <p>The <it>E. coli bet </it>gene cluster (<it>betABIT</it>) contributes to the pathway for glycine-betaine biosynthesis from choline <abbrgrp><abbr bid="B38">38</abbr></abbrgrp> and is located close to SHI-O in Sf8401 but absent from Sf301 and 2457T. Among eubacteria-compatible solutes, the most widespread is glycine-betaine, and this is the only osmoprotectant synthesized by <it>E. coli </it><abbrgrp><abbr bid="B39">39</abbr><abbr bid="B40">40</abbr></abbrgrp>. The choline-glycine-betaine pathway confers a high level of osmotic tolerance on <it>E. coli </it><abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. Whether this system offers an advantage to <it>S. flexneri </it>5b for environmental survival over <it>S. flexneri </it>2a or plays a role during infection requires further investigation. However, the inversion around the SHI-O may contribute to the deletion of the <it>bet </it>operon from <it>S. flexneri </it>2a (Fig. <figr fid="F2">2a</figr>).</p>
            <p>There are some differences in metabolic and physiological pathways between Sf8401 and Sf301. In both strains, some key metabolic pathways were inactivated by the creation of independent pseudogenes. For instance, the loss of ability to utilize D-sorbitol is due to the inactive states of <it>srlE </it>and <it>srlA </it>in Sf8401 and Sf301, respectively. It seems that <it>Shigella </it>strains have a general tendency to lose some pathways and functions, and this tendency has given rise to convergent evolution <abbrgrp><abbr bid="B41">41</abbr></abbrgrp>. The microorganisms need to adapt to new niches by adopting a strictly pathogenic life-style. There must be some genes that provide little overall selective benefit in a new situation. These genes will be eliminated through mutational bias favoring deletions for the lack of selective force to maintain them <abbrgrp><abbr bid="B42">42</abbr></abbrgrp>. Such functions, no longer active in one serotype but expressed in another, may lead to a better understanding of the diversity of the two serotypes and the evolution of <it>S. flexneri</it>.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>As more bacterial genomes have been sequenced during recent years, the study of comparative genomics has progressed rapidly. Although five <it>Shigella </it>genomes have been reported, this is the first time that intra-species diversity has been characterized by comparing the genomes of two different serotypes of the same <it>Shigella </it>species. The comparison between Sf8401 and Sf301 has provided abundant biological and medical information.</p>
         <p>The overall genomic organization, gene order and predicted proteomes of the two genomes are very similar, which suggests a high level of structural and functional conservation between the serotypes. Nevertheless, the colinearity of genome structure between these two serotypes was disrupted by several inversions, and along with the differences found in the known PAIs, these may contribute to differences in epidemicity and virulence between <it>S. flexneri </it>5b and <it>S. flexneri </it>2a.</p>
         <p><it>S. flexneri </it>5b and <it>S. flexneri </it>2a have experienced different selection pressures and evolutionary processes. These events (such as inversion, translocation, deletion and acquisition) have led to the diversity of SHI-O, the absence of SHI-1, the shift of SHI-2, and other differences between these two genomes. They have extensively reshaped the genome, presumably virulence to be more fully expressed. It can be supposed that the <it>S. flexneri </it>ancestor had acquired SHI-1 and SHI-2 before divergence, and diverged into different serotypes after the different SHI-Os were integrated. Subsequently, <it>S. flexneri </it>5b deleted SHI-1 via recombination and changed the structure of SHI-2 by inversions, but <it>S. flexneri </it>2a stabilized SHI-1 in its genome. Mechanisms not yet identified have helped to shape the differences between serotypes and led to the derivation of different serotypes from the same parental <it>S. flexneri </it>form. Characterizing the divergence between serotypes at the genetic level helps us to understand the evolution of <it>S. flexneri</it>. The interplay between organizing features of the chromosome, such as the pathogenicity and the elements inducing sequence variation and chromosomal rearrangements, may provide an explanation of why different genomes show such different levels of organization and how this relates to their evolutionary history and ecology.</p>
         <p>In conclusion, by comparing the genomes of Sf8401 and Sf301, a large amount of data has been obtained. It is important in biological and medical research to compare genomes causing similar types of diseases in the same subspecies but different serotypes. The identification of shared traits is important for pathogenicity and for the study of its conservation, transfer, epidemiology, virulence and evolution. Although it is not clear at present whether these similarities and differences are common among <it>S. flexneri</it>, there is a possibility that such events lead to differences in virulence and pathogenicity. Future studies should identify which of the differences in these genomes accounts for the phenotypic differences.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <sec>
            <st>
               <p><it>Shigella flexneri </it>5b strain</p>
            </st>
            <p><it>Shigella flexneri </it>5b, strain 8401, was isolated and sequenced from epidemic in China, kindly provided by the National Institute for Communicable Disease Control and Prevention, Chinese Centre for Disease Control and Prevention.</p>
         </sec>
         <sec>
            <st>
               <p>Shotgun sequencing and analysis</p>
            </st>
            <p>The whole genome sequence shotgun libraries for Sf8401 were established as described previously <abbrgrp><abbr bid="B12">12</abbr><abbr bid="B14">14</abbr></abbrgrp>, and ABI3730 automated sequencers were used for sequence collection. 48,000 clones were sequenced from both ends, giving rise to 8 times coverage of the genome. Sequences were assembled initially using the phred/phrap program with the Q20 criteria <abbrgrp><abbr bid="B43">43</abbr></abbrgrp> when the sequence coverage was ~4-fold over the estimated size of the genome. The Consed program was used for sequence finishing <abbrgrp><abbr bid="B43">43</abbr></abbrgrp>. Gaps among contigs were closed either by primer walking on selected clones, which were identified by analysis on the forward and the reversed links between contigs using a perl/Tk script, or by sequencing the DNA amplicons generated by polymerase chain reaction (PCR). Glimmer 2.0, a program that searches for protein coding regions, was used to identify those ORFs possessing more than 30 consecutive codons <abbrgrp><abbr bid="B44">44</abbr></abbrgrp>. Overlapping and closely clustered ORFs were manually inspected. Predicted polypeptide sequences were used to search the non-redundant protein database with BLASTP, and the clusters of orthologous groups of proteins (COGs) database was used to identify families to which predicted proteins are related <abbrgrp><abbr bid="B45">45</abbr></abbrgrp>. Those cases in which a stop condon or deletion has resulted in an encoded protein that is less than 80% of the length of its counterpart in K-12 genome and those cases in which a frameshift of insertion has altered more than 20% of the amino acid sequence were classed as pseudogenes. Mobile elements and repetitive sequences were identified using the IS FINDER database <abbrgrp><abbr bid="B46">46</abbr></abbrgrp>. GenomeComp was used for genomic comparison with default parameters <abbrgrp><abbr bid="B47">47</abbr></abbrgrp>. The comparison figures used in Figure <figr fid="F1">1</figr> and <figr fid="F2">2</figr> were exported from GenomeComp with a 1500 bp filter setting along with the scale setting of 2000 for chromosomes. The KEGG database was used for the metabolic pathways analysis <abbrgrp><abbr bid="B48">48</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Data accessibility</p>
            </st>
            <p>Complete genome sequence of Sf8401 has been deposited in the Genbank. The accession number for chromosome is: <ext-link ext-link-type="gen" ext-link-id="CP000266">CP000266</ext-link>.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>HN, carried out the molecular genetic studies, participated in the sequence alignment and drafted the manuscript. JY, FY, LC performed the statistical analysis and comparative genomic analysis. JY, XZ, JP participated in manuscript preparation. FY, JW, ZX participated in the sequence alignment. LLS, JD, YX, XX, and SC contributed to sample preparation for shotgun sequencing. ZY, YS contributed for design of the manuscript. QJ participated in the design and helped to draft the manuscript. All authors have read and approved the manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>We would like to thank Jianguo Xu (CCDC) for providing strains. The work is supported by the State Key Basic Research Program (Grant No. 2005CB522904) and High Technology Project (Grant No. 2004AA223090) from the Ministry of Science and Technology of China.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Global burden of Shigella infections: implications for vaccine development and implementation of control strategies</p>
            </title>
            <aug>
               <au>
                  <snm>Kotloff</snm>
                  <fnm>KL</fnm>
               </au>
               <au>
                  <snm>Winickoff</snm>
                  <fnm>JP</fnm>
               </au>
               <au>
                  <snm>Ivanoff</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Clemens</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Swerdlow</snm>
                  <fnm>DL</fnm>
               </au>
               <au>
                  <snm>Sansonetti</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Adak</snm>
                  <fnm>GK</fnm>
               </au>
               <au>
                  <snm>Levine</snm>
                  <fnm>MM</fnm>
               </au>
            </aug>
            <source>Bull World Health Organ</source>
            <pubdate>1999</pubdate>
            <volume>77</volume>
            <fpage>651</fpage>
            <lpage>666</lpage>
            <xrefbib>
               <pubid idtype="pmpid">10516787</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>Slaying the Hydra all at once or head by head?</p>
            </title>
            <aug>
               <au>
                  <snm>Sansonetti</snm>
                  <fnm>PJ</fnm>
               </au>
            </aug>
            <source>Nature Med</source>
            <pubdate>1998</pubdate>
            <volume>4</volume>
            <fpage>499</fpage>
            <lpage>500</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nm0598supp-499</pubid>
                  <pubid idtype="pmpid">9585195</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Genetic basis of virulence in Shigella species</p>
            </title>
            <aug>
               <au>
                  <snm>Hale</snm>
                  <fnm>TL</fnm>
               </au>
            </aug>
            <source>Microbiol Rev</source>
            <pubdate>1991</pubdate>
            <volume>55</volume>
            <fpage>206</fpage>
            <lpage>224</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">372811</pubid>
                  <pubid idtype="pmpid">1886518</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Cloning and application of genus specific DNA probes for Shigella</p>
            </title>
            <aug>
               <au>
                  <snm>Mei</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Chinese J Epidemiol</source>
            <pubdate>1989</pubdate>
            <volume>10</volume>
            <fpage>167</fpage>
            <lpage>170</lpage>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Involvement of a plasmid in the invasive ability of Shigella flexneri</p>
            </title>
            <aug>
               <au>
                  <snm>Sansonetti</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Kopecko</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Formal</snm>
                  <fnm>SB</fnm>
               </au>
            </aug>
            <source>Infect Immun</source>
            <pubdate>1982</pubdate>
            <volume>35</volume>
            <fpage>852</fpage>
            <lpage>860</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">351125</pubid>
                  <pubid idtype="pmpid">6279518</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>The sigA gene which is borne on the she pathogenicity island of Shigella flexneri 2a encodes an exported cytopathic protease involved in intestinal fluid accumulation</p>
            </title>
            <aug>
               <au>
                  <snm>Al-Hasani</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Henderson</snm>
                  <fnm>IR</fnm>
               </au>
               <au>
                  <snm>Sakellaris</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Rajakumar</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Grant</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Nataro</snm>
                  <fnm>JP</fnm>
               </au>
               <au>
                  <snm>Robins-Browne</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Adler</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Infect Immun</source>
            <pubdate>2000</pubdate>
            <volume>68</volume>
            <issue>5</issue>
            <fpage>2457</fpage>
            <lpage>2463</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">97446</pubid>
                  <pubid idtype="pmpid" link="fulltext">10768931</pubid>
                  <pubid idtype="doi">10.1128/IAI.68.5.2457-2463.2000</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Identification of two Shigella flexneri chromosomal loci involved in intercellular spreading</p>
            </title>
            <aug>
               <au>
                  <snm>Hong</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Gleason</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Wyckoff</snm>
                  <fnm>EE</fnm>
               </au>
               <au>
                  <snm>Payne</snm>
                  <fnm>SM</fnm>
               </au>
            </aug>
            <source>Infect Immun</source>
            <pubdate>1998</pubdate>
            <volume>66</volume>
            <fpage>4700</fpage>
            <lpage>4710</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">108578</pubid>
                  <pubid idtype="pmpid" link="fulltext">9746567</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>dksA is required for intercellular spread of Shigella flexneri via an RpoS-independent mechanism</p>
            </title>
            <aug>
               <au>
                  <snm>Mogull</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Runyen-Janecky</snm>
                  <fnm>LJ</fnm>
               </au>
               <au>
                  <snm>Hong</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Payne</snm>
                  <fnm>SM</fnm>
               </au>
            </aug>
            <source>Infect Immun</source>
            <pubdate>2001</pubdate>
            <volume>69</volume>
            <fpage>5742</fpage>
            <lpage>5751</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">98691</pubid>
                  <pubid idtype="pmpid" link="fulltext">11500451</pubid>
                  <pubid idtype="doi">10.1128/IAI.69.9.5742-5751.2001</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Characterization of Pic, a secreted protease of Shigella flexneri and enteroaggregative Escherichia coli</p>
            </title>
            <aug>
               <au>
                  <snm>Henderson</snm>
                  <fnm>IR</fnm>
               </au>
               <au>
                  <snm>Czeczulin</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Eslava</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Noriega</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Nataro</snm>
                  <fnm>JP</fnm>
               </au>
            </aug>
            <source>Infect Immun</source>
            <pubdate>1999</pubdate>
            <volume>67</volume>
            <fpage>5587</fpage>
            <lpage>5596</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">96930</pubid>
                  <pubid idtype="pmpid" link="fulltext">10531204</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>The aerobactin iron transport system genes in Shigella flexneri are present within a pathogenicity island</p>
            </title>
            <aug>
               <au>
                  <snm>Vokes</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Reeves</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Torres</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Payne</snm>
                  <fnm>SM</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>1999</pubdate>
            <volume>33</volume>
            <fpage>63</fpage>
            <lpage>73</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1046/j.1365-2958.1999.01448.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">10411724</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>Regulation of virulence gene expression in Shigella flexneri, a facultative intracellular pathogen</p>
            </title>
            <aug>
               <au>
                  <snm>Dorma</snm>
                  <fnm>CJ</fnm>
               </au>
               <au>
                  <snm>McKenna</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Beloin</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Int J Med Microbio</source>
            <pubdate>2001</pubdate>
            <volume>290</volume>
            <fpage>89</fpage>
            <lpage>96</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1078/1438-4221-00105</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Genome sequence of Shigella flexneri 2a: insights into pathogenicity through comparison with genomes of Escherichia coli K12 and O157</p>
            </title>
            <aug>
               <au>
                  <snm>Jin</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Yuan</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Shen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Lu</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Qu</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Dong</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Sun</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Xue</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Zhao</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Gao</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Zhu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kan</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Ding</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Cheng</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Yao</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>He</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Ma</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Qiang</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Wen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Hou</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Yu</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2002</pubdate>
            <volume>30</volume>
            <fpage>4432</fpage>
            <lpage>4441</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">137130</pubid>
                  <pubid idtype="pmpid" link="fulltext">12384590</pubid>
                  <pubid idtype="doi">10.1093/nar/gkf566</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Complete Genome Sequence and Comparative Genomics of Shigella flexneri Serotype 2a Strain 2457T</p>
            </title>
            <aug>
               <au>
                  <snm>Wei</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Goldberg</snm>
                  <fnm>MB</fnm>
               </au>
               <au>
                  <snm>Burland</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Venkatesan</snm>
                  <fnm>MM</fnm>
               </au>
               <au>
                  <snm>Deng</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Fournier</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Mayhew</snm>
                  <fnm>GF</fnm>
               </au>
               <au>
                  <snm>Plunkett</snm>
                  <fnm>G</fnm>
                  <suf>3rd</suf>
               </au>
               <au>
                  <snm>Rose</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Darling</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mau</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Perna</snm>
                  <fnm>NT</fnm>
               </au>
               <au>
                  <snm>Payne</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Runyen-Janecky</snm>
                  <fnm>LJ</fnm>
               </au>
               <au>
                  <snm>Zhou</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Schwartz</snm>
                  <fnm>DC</fnm>
               </au>
               <au>
                  <snm>Blattner</snm>
                  <fnm>FR</fnm>
               </au>
            </aug>
            <source>InfectImmun</source>
            <pubdate>2003</pubdate>
            <volume>71</volume>
            <fpage>2775</fpage>
            <lpage>2786</lpage>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Genome dynamics and diversity of Shigella species, the etiologic agents of bacillary dysentery</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Jiang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Yan</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Tang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Xiong</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Dong</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Xue</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Zhu</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Sun</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Nie</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Peng</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Yuan</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Wen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Yao</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Shen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Qiang</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Hou</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Yu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Jin</snm>
                  <fnm>Q</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <volume>33</volume>
            <issue>19</issue>
            <fpage>6445</fpage>
            <lpage>6458</lpage>
            <note>2005, Nov 7</note>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1278947</pubid>
                  <pubid idtype="pmpid" link="fulltext">16275786</pubid>
                  <pubid idtype="doi">10.1093/nar/gki954</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>The virulence plasmid pWR100 and the repertoire of proteins secreted by the type III secretion apparatus of <it>Shigella flexneri</it></p>
            </title>
            <aug>
               <au>
                  <snm>Buchrieser</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Glaser</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Rusniok</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Nedjari</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>D'Hauteville</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Kunst</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Sansonetti</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Parsot</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>2000</pubdate>
            <volume>38</volume>
            <fpage>760</fpage>
            <lpage>771</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1046/j.1365-2958.2000.02179.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">11115111</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Complete DNA sequence and analysis of the large virulence plasmid of <it>Shigella flexneri</it></p>
            </title>
            <aug>
               <au>
                  <snm>Venkatesan</snm>
                  <fnm>MM</fnm>
               </au>
               <au>
                  <snm>Goldberg</snm>
                  <fnm>MB</fnm>
               </au>
               <au>
                  <snm>Rose</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Grotbeck</snm>
                  <fnm>EJ</fnm>
               </au>
               <au>
                  <snm>Burland</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Blattner</snm>
                  <fnm>FR</fnm>
               </au>
            </aug>
            <source>Infect Immun</source>
            <pubdate>2001</pubdate>
            <volume>69</volume>
            <fpage>3271</fpage>
            <lpage>3285</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">98286</pubid>
                  <pubid idtype="pmpid" link="fulltext">11292750</pubid>
                  <pubid idtype="doi">10.1128/IAI.69.5.3271-3285.2001</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Transposable elements and adaptation of host bacteria</p>
            </title>
            <aug>
               <au>
                  <snm>BLOT</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Genetica</source>
            <pubdate>1994</pubdate>
            <volume>93</volume>
            <fpage>5</fpage>
            <lpage>12</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/BF01435235</pubid>
                  <pubid idtype="pmpid">7813917</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>A Rare 920-Kilobase Chromosomal Inversion Mediated by IS1 Transposition Causes Constitutive Expression of the yiaK-S Operon for Carbohydrate Utilization in Escherichia coli</p>
            </title>
            <aug>
               <au>
                  <snm>Badia</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ibanez</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Sabate</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Baldoma</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Aguilar</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>J Biol Chem</source>
            <pubdate>1998</pubdate>
            <volume>273</volume>
            <issue>14</issue>
            <fpage>8376</fpage>
            <lpage>8381</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1074/jbc.273.14.8376</pubid>
                  <pubid idtype="pmpid" link="fulltext">9525947</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Long-term experimental evolution in Escherichia coli. IX. Characterization of insertion sequence-mediated mutations and rearrangements</p>
            </title>
            <aug>
               <au>
                  <snm>Schneider</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Duperchy</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Coursange</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Lenski</snm>
                  <fnm>RE</fnm>
               </au>
               <au>
                  <snm>Blot</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2000</pubdate>
            <volume>156</volume>
            <fpage>477</fpage>
            <lpage>488</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11014799</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>IS1-mediated intramolecular rearrangements: formation of excised transposon circles and replicative deletions</p>
            </title>
            <aug>
               <au>
                  <snm>Turlan</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Chandler</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>EMBO J</source>
            <pubdate>1995</pubdate>
            <volume>14</volume>
            <fpage>5410</fpage>
            <lpage>5421</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">394650</pubid>
                  <pubid idtype="pmpid">7489730</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>Genome sequence of Yersinia pestis KIM</p>
            </title>
            <aug>
               <au>
                  <snm>Deng</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Burland</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Plunkett</snm>
                  <fnm>G</fnm>
                  <suf>3rd</suf>
               </au>
               <au>
                  <snm>Boutin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mayhew</snm>
                  <fnm>GF</fnm>
               </au>
               <au>
                  <snm>Liss</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Perna</snm>
                  <fnm>NT</fnm>
               </au>
               <au>
                  <snm>Rose</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Mau</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Zhou</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Schwartz</snm>
                  <fnm>DC</fnm>
               </au>
               <au>
                  <snm>Fetherston</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Lindler</snm>
                  <fnm>LE</fnm>
               </au>
               <au>
                  <snm>Brubaker</snm>
                  <fnm>RR</fnm>
               </au>
               <au>
                  <snm>Plano</snm>
                  <fnm>GV</fnm>
               </au>
               <au>
                  <snm>Straley</snm>
                  <fnm>SC</fnm>
               </au>
               <au>
                  <snm>McDonough</snm>
                  <fnm>KA</fnm>
               </au>
               <au>
                  <snm>Nilles</snm>
                  <fnm>ML</fnm>
               </au>
               <au>
                  <snm>Matson</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Blattner</snm>
                  <fnm>FR</fnm>
               </au>
               <au>
                  <snm>Perry</snm>
                  <fnm>RD</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2002</pubdate>
            <volume>184</volume>
            <fpage>4601</fpage>
            <lpage>4611</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">135232</pubid>
                  <pubid idtype="pmpid" link="fulltext">12142430</pubid>
                  <pubid idtype="doi">10.1128/JB.184.16.4601-4611.2002</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Comparative genomics of Salmonella enterica serovar Typhi strains Ty2 and CT18</p>
            </title>
            <aug>
               <au>
                  <snm>Deng</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Liou</snm>
                  <fnm>SR</fnm>
               </au>
               <au>
                  <snm>Plunkett</snm>
                  <fnm>G</fnm>
                  <suf>3rd</suf>
               </au>
               <au>
                  <snm>Mayhew</snm>
                  <fnm>GF</fnm>
               </au>
               <au>
                  <snm>Rose</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Burland</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Kodoyianni</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Schwartz</snm>
                  <fnm>DC</fnm>
               </au>
               <au>
                  <snm>Blattner</snm>
                  <fnm>FR</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2003</pubdate>
            <volume>185</volume>
            <fpage>2330</fpage>
            <lpage>2337</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">151493</pubid>
                  <pubid idtype="pmpid" link="fulltext">12644504</pubid>
                  <pubid idtype="doi">10.1128/JB.185.7.2330-2337.2003</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>The physical map of the whole E. coli chromosome: application of a new strategy for rapid analysis and sorting of a large genomic library</p>
            </title>
            <aug>
               <au>
                  <snm>Kohara</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Akiyama</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Isono</snm>
                  <fnm>K</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>1987</pubdate>
            <volume>50</volume>
            <fpage>495</fpage>
            <lpage>508</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0092-8674(87)90503-4</pubid>
                  <pubid idtype="pmpid" link="fulltext">3038334</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Pathogenic effects of Opolysaccharide from Shigella flexneri strain</p>
            </title>
            <aug>
               <au>
                  <snm>Zhong</snm>
                  <fnm>QP</fnm>
               </au>
            </aug>
            <source>World J Gastroenterol</source>
            <pubdate>1999</pubdate>
            <volume>5</volume>
            <issue>3</issue>
            <fpage>245</fpage>
            <lpage>248</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11819440</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>Pathogenicity Islands in Bacterial Pathogenesis</p>
            </title>
            <aug>
               <au>
                  <snm>Herbert</snm>
                  <fnm>Schmidt</fnm>
               </au>
               <au>
                  <snm>Michael</snm>
                  <fnm>Hensel</fnm>
               </au>
            </aug>
            <source>Clin Microbiol Rev</source>
            <pubdate>2004</pubdate>
            <volume>17</volume>
            <issue>11</issue>
            <fpage>14</fpage>
            <lpage>56</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">321463</pubid>
                  <pubid idtype="pmpid" link="fulltext">14726454</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Pathogenicity islands of Shigella</p>
            </title>
            <aug>
               <au>
                  <snm>Ingersoll</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Groisman</snm>
                  <fnm>EA</fnm>
               </au>
               <au>
                  <snm>Zychlinsky</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Curr Top Microbiol Immunol</source>
            <pubdate>2002</pubdate>
            <volume>264</volume>
            <fpage>49</fpage>
            <lpage>65</lpage>
            <xrefbib>
               <pubid idtype="pmpid">12014181</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>Molecular characterization of the genes involved in O-antigen modification, attachment, integration and excision in Shigella flexneri bacteriophage SfV</p>
            </title>
            <aug>
               <au>
                  <snm>Huan</snm>
                  <fnm>PT</fnm>
               </au>
               <au>
                  <snm>Bastin</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Whittle</snm>
                  <fnm>BL</fnm>
               </au>
               <au>
                  <snm>Lindberg</snm>
                  <fnm>AA</fnm>
               </au>
               <au>
                  <snm>Verma</snm>
                  <fnm>NK</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>1997</pubdate>
            <volume>195</volume>
            <fpage>217</fpage>
            <lpage>227</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0378-1119(97)00143-1</pubid>
                  <pubid idtype="pmpid" link="fulltext">9305767</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Glycosyltransferases encoded by viruses</p>
            </title>
            <aug>
               <au>
                  <snm>Markine-Goriaynoff</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Gillet</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Van Etten</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Korres</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Verma</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Vanderplasschen</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>J Gen Virol</source>
            <pubdate>2004</pubdate>
            <volume>85</volume>
            <fpage>2741</fpage>
            <lpage>2754</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1099/vir.0.80320-0</pubid>
                  <pubid idtype="pmpid" link="fulltext">15448335</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>A provisional chromosome map of Shigella and the regions related to pathogenicity</p>
            </title>
            <aug>
               <au>
                  <snm>Petrovskaya</snm>
                  <fnm>VG</fnm>
               </au>
               <au>
                  <snm>Licheva</snm>
                  <fnm>TA</fnm>
               </au>
            </aug>
            <source>Acta Microbiol Acad Sci Hung</source>
            <pubdate>1982</pubdate>
            <volume>29</volume>
            <fpage>41</fpage>
            <lpage>53</lpage>
            <xrefbib>
               <pubid idtype="pmpid">7046354</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Mechanism of bacteriophage SfII-mediated serotype conversion in Shigella flexneri</p>
            </title>
            <aug>
               <au>
                  <snm>Mavris</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Manning</snm>
                  <fnm>PA</fnm>
               </au>
               <au>
                  <snm>Morona</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>1997</pubdate>
            <volume>26</volume>
            <fpage>939</fpage>
            <lpage>950</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1046/j.1365-2958.1997.6301997.x</pubid>
                  <pubid idtype="pmpid">9426131</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Shigella flexneri type-specific antigen V: cloning, sequencing and characterization of the glucosyl transferase gene of temperate bacteriophage SfV</p>
            </title>
            <aug>
               <au>
                  <snm>Huan</snm>
                  <fnm>PT</fnm>
               </au>
               <au>
                  <snm>Whittle</snm>
                  <fnm>BL</fnm>
               </au>
               <au>
                  <snm>Bastin</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Lindberg</snm>
                  <fnm>AA</fnm>
               </au>
               <au>
                  <snm>Verma</snm>
                  <fnm>NK</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>1997</pubdate>
            <volume>195</volume>
            <fpage>207</fpage>
            <lpage>216</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0378-1119(97)00144-3</pubid>
                  <pubid idtype="pmpid" link="fulltext">9305766</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Distribution and structural variation of the she pathogenicity island in enteric bacterial pathogens</p>
            </title>
            <aug>
               <au>
                  <snm>Al-Hasani</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Adler</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Rajakumar</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Sakellaris</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>J Med Microbiol</source>
            <pubdate>2001</pubdate>
            <volume>50</volume>
            <fpage>780</fpage>
            <lpage>786</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11549179</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>Regulated site-specific recombination of the she pathogenicity island of Shigella flexneri</p>
            </title>
            <aug>
               <au>
                  <snm>Sakellaris Harry</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Luck</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Shelley</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Al-Hasani</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Keith</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Rajakumar</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Kumar</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Turner</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Sally</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Adler</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Ben</snm>
                  <fnm/>
               </au>
            </aug>
            <source>Molecular Microbiology</source>
            <pubdate>2004</pubdate>
            <volume>52</volume>
            <issue>55</issue>
            <fpage>1329</fpage>
            <lpage>1336</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1365-2958.2004.04048.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">15165236</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p>The selC-associated SHI-2 pathogenicity island of Shigella flexneri</p>
            </title>
            <aug>
               <au>
                  <snm>Moss</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Cardozo</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Zychlinsky</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Groisman</snm>
                  <fnm>EA</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>1999</pubdate>
            <volume>33</volume>
            <fpage>74</fpage>
            <lpage>83</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1046/j.1365-2958.1999.01449.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">10411725</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>Evidence for symmetric chromosomal inversions around the replication origin in bacteria</p>
            </title>
            <aug>
               <au>
                  <snm>Eisen</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Heidelberg</snm>
                  <fnm>JF</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2000</pubdate>
            <volume>1</volume>
            <issue>6</issue>
            <fpage>research0011.0011</fpage>
            <lpage>0011.0019</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1186/gb-2000-1-6-research0011</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>Gene location affects expression level in Salmonella typhimurium</p>
            </title>
            <aug>
               <au>
                  <snm>Schmid</snm>
                  <fnm>MB</fnm>
               </au>
               <au>
                  <snm>Roth</snm>
                  <fnm>JR</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1987</pubdate>
            <volume>169</volume>
            <fpage>2872</fpage>
            <lpage>2875</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">212203</pubid>
                  <pubid idtype="pmpid">3294809</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Diversity of Genome Structure in Salmonella enterica Serovar Typhi Populations</p>
            </title>
            <aug>
               <au>
                  <snm>Sushma Kothapalli</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Satheesh Nair</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Suneetha Alokam</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Tikki Pang</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Rasik Khakhria</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>David Woodward</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Wendy Johnson</snm>
                  <fnm/>
               </au>
               <au>
                  <snm>Stocker</snm>
                  <mi>AD</mi>
                  <fnm>Bruce</fnm>
               </au>
               <au>
                  <snm>Sanderson</snm>
                  <mi>E</mi>
                  <fnm>Kenneth</fnm>
               </au>
               <au>
                  <snm>Shu-Lin Liu</snm>
                  <fnm/>
               </au>
            </aug>
            <source>J Bacteriology</source>
            <pubdate>2005</pubdate>
            <volume>187</volume>
            <issue>188</issue>
            <fpage>2638</fpage>
            <lpage>2650</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1128/JB.187.8.2638-2650.2005</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>Choline-glycine betaine pathway confers a high level of osmotic tolerance in Escherichia coli</p>
            </title>
            <aug>
               <au>
                  <snm>Landfald</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Strom</snm>
                  <fnm>AR</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1986</pubdate>
            <volume>165</volume>
            <issue>3</issue>
            <fpage>849</fpage>
            <lpage>855</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">214506</pubid>
                  <pubid idtype="pmpid">3512525</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>Glycine Betaine Uptake after Hyperosmotic Shift in Corynebacterium glutamicum</p>
            </title>
            <aug>
               <au>
                  <snm>Farwick</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Siewe</snm>
                  <fnm>RM</fnm>
               </au>
               <au>
                  <snm>Kramer</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>1995</pubdate>
            <volume>177</volume>
            <issue>16</issue>
            <fpage>4690</fpage>
            <lpage>4695</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">177234</pubid>
                  <pubid idtype="pmpid" link="fulltext">7642496</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B40">
            <title>
               <p>Living with water stress: evolution of osmolyte systems</p>
            </title>
            <aug>
               <au>
                  <snm>Yancey</snm>
                  <fnm>PH</fnm>
               </au>
               <au>
                  <snm>Clark</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Hand</snm>
                  <fnm>SC</fnm>
               </au>
               <au>
                  <snm>Bowlus</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Somero</snm>
                  <fnm>GN</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>1982</pubdate>
            <volume>217</volume>
            <fpage>1214</fpage>
            <lpage>1222</lpage>
            <xrefbib>
               <pubid idtype="pmpid">7112124</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>Multiple independent origins of Shigella clones of Escherichia coli and convergent evolution of many of their characteristics</p>
            </title>
            <aug>
               <au>
                  <snm>Pupo</snm>
                  <fnm>GM</fnm>
               </au>
               <au>
                  <snm>Lan</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Reeves</snm>
                  <fnm>PR</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <volume>97</volume>
            <fpage>10567</fpage>
            <lpage>10572</lpage>
            <note>2000, Sep 12</note>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">27065</pubid>
                  <pubid idtype="pmpid" link="fulltext">10954745</pubid>
                  <pubid idtype="doi">10.1073/pnas.180094797</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B42">
            <title>
               <p>Genome degradation is an ongoing process in Rickettsia</p>
            </title>
            <aug>
               <au>
                  <snm>Andersson</snm>
                  <fnm>JO</fnm>
               </au>
               <au>
                  <snm>Andersson</snm>
                  <fnm>SG</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>1999</pubdate>
            <volume>16</volume>
            <issue>9</issue>
            <fpage>1178</fpage>
            <lpage>1191</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10486973</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B43">
            <title>
               <p>Base-calling of automated sequencer traces using Phred. I. Accuracy assessment</p>
            </title>
            <aug>
               <au>
                  <snm>Ewing</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Hillier</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Wendl</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>175</fpage>
            <lpage>185</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521921</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B44">
            <title>
               <p>Microbial gene identification using interpolated Markov models</p>
            </title>
            <aug>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Delcher</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Kasif</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm/>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1998</pubdate>
            <volume>26</volume>
            <fpage>544</fpage>
            <lpage>548</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">147303</pubid>
                  <pubid idtype="pmpid" link="fulltext">9421513</pubid>
                  <pubid idtype="doi">10.1093/nar/26.2.544</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>The COG database: a tool for genome-scale analysis of protein functions and evolution</p>
            </title>
            <aug>
               <au>
                  <snm>Tatusov</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Galperin</snm>
                  <fnm>MY</fnm>
               </au>
               <au>
                  <snm>Natale</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Koonin</snm>
                  <fnm>EV</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2000</pubdate>
            <volume>28</volume>
            <fpage>33</fpage>
            <lpage>36</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">102395</pubid>
                  <pubid idtype="pmpid" link="fulltext">10592175</pubid>
                  <pubid idtype="doi">10.1093/nar/28.1.33</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B46">
            <title>
               <p>The IS FINDER Database</p>
            </title>
            <url>http://www-is.biotoul.fr</url>
         </bibl>
         <bibl id="B47">
            <title>
               <p>GenomeComp: a visualization tool for microbial genome comparison</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Yao</snm>
                  <fnm>ZJ</fnm>
               </au>
               <au>
                  <snm>Jin</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Shen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>J Microbiol Methods</source>
            <pubdate>2003</pubdate>
            <volume>54</volume>
            <fpage>423</fpage>
            <lpage>426</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0167-7012(03)00094-0</pubid>
                  <pubid idtype="pmpid" link="fulltext">12842490</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B48">
            <title>
               <p>The KEGG resource for deciphering the genome</p>
            </title>
            <aug>
               <au>
                  <snm>Kanehisa</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Goto</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Kawashima</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Okuno</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Hattori</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2004</pubdate>
            <volume>32</volume>
            <fpage>D277</fpage>
            <lpage>D280</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">308797</pubid>
                  <pubid idtype="pmpid" link="fulltext">14681412</pubid>
                  <pubid idtype="doi">10.1093/nar/gkh063</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>
