<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>gb-2006-7-10-r90</ui>
   <ji>GBJ</ji>
   <fm>
      <dochead>Research</dochead>
      <bibl>
         <title>
            <p>Genomic analysis reveals that <it>Pseudomonas aeruginosa </it>virulence is combinatorial</p>
         </title>
         <aug>
            <au id="A1">
               <snm>Lee</snm>
               <mi>G</mi>
               <fnm>Daniel</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <insr iid="I3"/>
               <email>dgrenfell-lee@microbia.com</email>
            </au>
            <au id="A2">
               <snm>Urbach</snm>
               <mi>M</mi>
               <fnm>Jonathan</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>urbach@molbio.mgh.harvard.edu</email>
            </au>
            <au id="A3">
               <snm>Wu</snm>
               <fnm>Gang</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>gwu@molbio.mgh.harvard.edu</email>
            </au>
            <au id="A4">
               <snm>Liberati</snm>
               <mi>T</mi>
               <fnm>Nicole</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>liberati@molbio.mgh.harvard.edu</email>
            </au>
            <au id="A5">
               <snm>Feinbaum</snm>
               <mi>L</mi>
               <fnm>Rhonda</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>feinbaum@molbio.mgh.harvard.edu</email>
            </au>
            <au id="A6">
               <snm>Miyata</snm>
               <fnm>Sachiko</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>miyata@molbio.mgh.harvard.edu</email>
            </au>
            <au id="A7">
               <snm>Diggins</snm>
               <mi>T</mi>
               <fnm>Lenard</fnm>
               <insr iid="I4"/>
               <email>diggins@envivopharma.com</email>
            </au>
            <au id="A8">
               <snm>He</snm>
               <fnm>Jianxin</fnm>
               <insr iid="I5"/>
               <insr iid="I6"/>
               <email>he@molbio.mgh.harvard.edu</email>
            </au>
            <au id="A9">
               <snm>Saucier</snm>
               <fnm>Maude</fnm>
               <insr iid="I5"/>
               <insr iid="I6"/>
               <insr iid="I7"/>
               <email>maude.saucier@umontreal.ca</email>
            </au>
            <au id="A10">
               <snm>D&#233;ziel</snm>
               <fnm>Eric</fnm>
               <insr iid="I5"/>
               <insr iid="I6"/>
               <insr iid="I8"/>
               <email>eric.deziel@iaf.inrs.ca</email>
            </au>
            <au id="A11">
               <snm>Friedman</snm>
               <fnm>Lisa</fnm>
               <insr iid="I5"/>
               <insr iid="I9"/>
               <email>Lisa.Friedman@cubist.com</email>
            </au>
            <au id="A12">
               <snm>Li</snm>
               <fnm>Li</fnm>
               <insr iid="I10"/>
               <email>lili@rics.bwh.harvard.edu</email>
            </au>
            <au id="A13">
               <snm>Grills</snm>
               <fnm>George</fnm>
               <insr iid="I10"/>
               <insr iid="I11"/>
               <email>gsg34@cornell.edu</email>
            </au>
            <au id="A14">
               <snm>Montgomery</snm>
               <fnm>Kate</fnm>
               <insr iid="I10"/>
               <email>kmontgomery@rics.bwh.harvard.edu</email>
            </au>
            <au id="A15">
               <snm>Kucherlapati</snm>
               <fnm>Raju</fnm>
               <insr iid="I10"/>
               <email>rkucherlapati@partners.org</email>
            </au>
            <au id="A16">
               <snm>Rahme</snm>
               <mi>G</mi>
               <fnm>Laurence</fnm>
               <insr iid="I5"/>
               <insr iid="I6"/>
               <email>rahme@molbio.mgh.harvard.edu</email>
            </au>
            <au id="A17" ca="yes">
               <snm>Ausubel</snm>
               <mi>M</mi>
               <fnm>Frederick</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>ausubel@molbio.mgh.harvard.edu</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Department of Molecular Biology, Massachusetts General Hospital, Cambridge Street, Boston, Massachusetts, 02114, USA</p>
            </ins>
            <ins id="I2">
               <p>Department of Genetics, Harvard Medical School, Avenue Louis Pasteur, Boston, Massachusetts, 02115, USA</p>
            </ins>
            <ins id="I3">
               <p>Current address: Microbia, Inc., Bent Street, Cambridge, Massachusetts, 02141, USA</p>
            </ins>
            <ins id="I4">
               <p>Envivo Pharmaceuticals, Inc., Arsenal Street, Watertown, Massachusetts, 02472, USA</p>
            </ins>
            <ins id="I5">
               <p>Department of Microbiology and Molecular Genetics, Harvard Medical School, Longwood Avenue, Boston, Massachusetts, 02115, USA</p>
            </ins>
            <ins id="I6">
               <p>Department of Surgery, Massachusetts General Hospital, Fruit Street, Boston, Massachusetts, 02114, USA</p>
            </ins>
            <ins id="I7">
               <p>Current address: Universit&#233; de Montr&#233;al, Station Centre-ville, Montr&#233;al, H3C 3J7, Canada</p>
            </ins>
            <ins id="I8">
               <p>Current address: INRS-Institut Armand-Frappier, boul. des Prairies, Laval, Quebec, H7V 1B7, Canada</p>
            </ins>
            <ins id="I9">
               <p>Current address: Cubist Pharmaceuticals, Inc., Hayden Avenue, Lexington, Massachusetts, 02421, USA</p>
            </ins>
            <ins id="I10">
               <p>Harvard Medical School - Partners Healthcare Center for Genetics and Genomics, Landsdowne Street, Cambridge, Massachusetts, 02139, USA</p>
            </ins>
            <ins id="I11">
               <p>Current address: Core Facilities, Cornell University, Thurston Avenue, Ithaca, New York, 14850, USA</p>
            </ins>
         </insg>
         <source>Genome Biology</source>
         <issn>1465-6906</issn>
         <pubdate>2006</pubdate>
         <volume>7</volume>
         <issue>10</issue>
         <fpage>R90</fpage>
         <url>http://genomebiology.com/2006/7/10/R90</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">17038190</pubid>
               <pubid idtype="doi">10.1186/gb-2006-7-10-r90</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>28</day>
               <month>7</month>
               <year>2006</year>
            </date>
         </rec>
         <revrec>
            <date>
               <day>25</day>
               <month>9</month>
               <year>2006</year>
            </date>
         </revrec>
         <acc>
            <date>
               <day>12</day>
               <month>10</month>
               <year>2006</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>12</day>
               <month>10</month>
               <year>2006</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2006</year>
         <collab>Lee et al.; licensee BioMed Central Ltd</collab>
         <note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <shorttitle>
         <p><it>Pseudomonas aeruginosa </it>virulence</p>
      </shorttitle>
      <shortabs>
         <p>Sequencing of a highly virulent strain of <it>Pseudomonas aeruginosa </it>and comparison to a previously sequenced, less pathogenic, strain, together with experimental testing in a <it>C. elegans </it>model, suggests that <it>Pseudomonas </it>virulence is multifactorial and combinatorial.</p>
      </shortabs>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p><it>Pseudomonas aeruginosa </it>is a ubiquitous environmental bacterium and an important opportunistic human pathogen. Generally, the acquisition of genes in the form of pathogenicity islands distinguishes pathogenic isolates from nonpathogens. We therefore sequenced a highly virulent strain of <it>P. aeruginosa</it>, PA14, and compared it with a previously sequenced (and less pathogenic) strain, PAO1, to identify novel virulence genes.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>The PA14 and PAO1 genomes are remarkably similar, although PA14 has a slightly larger genome (6.5 megabases [Mb]) than does PAO1 (6.3 Mb). We identified 58 PA14 gene clusters that are absent in PAO1 to determine which of these genes, if any, contribute to its enhanced virulence in a <it>Caenorhabditis elegans </it>pathogenicity model. First, we tested 18 additional diverse strains in the <it>C. elegans </it>model and observed a wide range of pathogenic potential; however, genotyping these strains using a custom microarray showed that the presence of PA14 genes that are absent in PAO1 did not correlate with the virulence of these strains. Second, we utilized a full-genome nonredundant mutant library of PA14 to identify five genes (absent in PAO1) required for <it>C. elegans </it>killing. Surprisingly, although these five genes are present in many other <it>P. aeruginosa </it>strains, they do not correlate with virulence in <it>C. elegans</it>.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>Genes required for pathogenicity in one strain of <it>P. aeruginosa </it>are neither required for nor predictive of virulence in other strains. We therefore propose that virulence in this organism is both multifactorial and combinatorial, the result of a pool of pathogenicity-related genes that interact in various combinations in different genetic backgrounds.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="BMC" subtype="man_spc_id" id="30010014">Microbiology and parasitology</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010010">Genome studies</classification>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>The potential virulence of bacterial pathogens is significantly modulated by the presence of pathogenicity islands <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B2">2</abbr></abbrgrp>, which are clusters of one or more virulence-related genes that are often acquired by horizontal gene transfer. The introduction of these virulence islands can allow a previously nonvirulent isolate to infect a particular host. Commonly, this switch to a simpler and more stable environment within a host (as opposed to the more complex outside environment) is followed by gene loss and genome reduction that improve the ability of the pathogen to survive in the host but also restrict the range of hosts available to the bacterium <abbrgrp><abbr bid="B3">3</abbr><abbr bid="B4">4</abbr></abbrgrp>. In contrast, free-living bacteria that dominate in complex environments (such as soil) tend to have genomes that continue to acquire DNA and undergo expansion rather than reduction.</p>
         <p><it>Pseudomonas aeruginosa</it>, a ubiquitous Gram-negative soil organism, is an important opportunistic human pathogen that infects injured, burned, immunodeficient, and immunocompromised patients, and causes persistent respiratory infections in individuals suffering from cystic fibrosis (CF) <abbrgrp><abbr bid="B5">5</abbr><abbr bid="B6">6</abbr></abbrgrp>. The genome sequence of the widely studied <it>P. aeruginosa </it>strain PAO1 (originally a wound isolate) revealed that it possesses a large number of genes that are involved in regulation, catabolism, transport, and efflux of organic compounds, as well as several putative chemotaxis systems <abbrgrp><abbr bid="B7">7</abbr></abbrgrp>, all of which potentially contribute to the remarkable ability of this bacterium to adapt to a wide range of environmental niches.</p>
         <p>Different <it>P. aeruginosa </it>isolates share a remarkable amount of similarity in their genomes. When DNA derived from several <it>P. aeruginosa </it>strains was hybridized to a PAO1 microarray, between 89% and 98% of the PAO1 sequences were detected <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr></abbrgrp>. Whole-genome shotgun sequencing of two CF isolates and one environmental strain revealed that, aside from this apparent highly conserved core set of <it>P. aeruginosa </it>genes, differences were largely due to strain-specific islands of genes, consisting either of genes with similar or related function but divergent DNA sequences (such as genes for biosynthesis of the O-antigen component of lipopolysaccharide, genes for flagellar biosynthesis, or alternate forms of genes for the bacteriocidal pyocins) or genes that are entirely absent in some strains <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>.</p>
         <p>Despite the overall genome similarity among diverse <it>P. aeruginosa </it>strains, differences in complex phenotypes such as pathogenicity can be striking. For example, the clinical isolate PA14 is significantly more virulent than PAO1 in a wide range of hosts, including mice, the nematode <it>Caenorhabditis elegans</it>, the insect <it>Galleria mellonella</it>, and the plant <it>Arabidopsis thaliana </it><abbrgrp><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr><abbr bid="B13">13</abbr></abbrgrp>. PA14 genes required for full virulence include genes common to many if not all <it>P. aeruginosa </it>strains, including global transcriptional regulators such as <it>gacA</it>; genes that are involved in pathogenesis-related processes such as motility, quorum sensing, and phenazine biosynthesis; and genes that encode secreted cellulytic factors and toxins such as <it>ExoU</it>, exotoxin A, phospholipase C, and elastase <abbrgrp><abbr bid="B12">12</abbr><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr></abbrgrp>. On the other hand, novel PA14 genes that are absent in PAO1 (and potentially absent in other isolates) have also been identified as being required for pathogenicity in model hosts and mice <abbrgrp><abbr bid="B11">11</abbr><abbr bid="B15">15</abbr><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr></abbrgrp>, and at least some of these genes appear to reside on large pathogenicity islands <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>. Taken together, these studies suggest that PA14 pathogenicity is multifactorial, requiring the cumulative (and potentially coordinated) action of multiple virulence factors, some of which are components of the basic core genome, whereas others are located on classically defined virulence islands.</p>
         <p>The experiments described in this paper were designed to test the hypothesis that the enhanced virulence of PA14 compared with PAO1 is mostly a consequence of recognizable pathogenicity (virulence) islands that are present in PA14 but absent in PAO1. To expand our tools for dissecting <it>P. aeruginosa </it>virulence and to test the hypothesis that strain differences in virulence are due to the acquisition of strain-specific genes, we sequenced the PA14 genome and performed a functional analysis of genes that are present in PA14 but absent in PAO1 to assess their contribution to pathogenicity.</p>
      </sec>
      <sec>
         <st>
            <p>Results and discussion</p>
         </st>
         <sec>
            <st>
               <p>PA14 genome sequence</p>
            </st>
            <p>To identify all of the putative pathogenicity islands that distinguish PA14 from PAO1, we sequenced the PA14 genome and found that it contains a slightly larger chromosome (6.5 megabases [Mb] versus 6.3 Mb for PAO1; genome sequence and annotations are available at the Ausubel lab PA14 sequencing website <abbrgrp><abbr bid="B20">20</abbr></abbrgrp> and have also been deposited in GenBank [GenBank: <ext-link ext-link-type="gen" ext-link-id="CP000438">CP000438</ext-link>]). Consistent with previous observations that overall strain similarity is high, we found that approximately 91.7% of the PA14 genome is present in PAO1, and that 95.8% of the PAO1 genome is present in PA14 (Table <tblr tid="T1">1</tblr>).</p>
            <tbl id="T1" hint_layout="double">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>PA14 and PAO1 genome comparisons</p>
               </caption>
               <tblbdy cols="3">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>PA14</p>
                     </c>
                     <c ca="left">
                        <p>PAO1</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Genome size</p>
                     </c>
                     <c ca="left">
                        <p>6,537,648</p>
                     </c>
                     <c ca="left">
                        <p>6,264,403</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>GC content</p>
                     </c>
                     <c ca="left">
                        <p>66.3 &#177; 4.3%<sup>a</sup></p>
                     </c>
                     <c ca="left">
                        <p>66.6 &#177; 3.9%<sup>a</sup></p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total number of genes</p>
                     </c>
                     <c ca="left">
                        <p>5973</p>
                     </c>
                     <c ca="left">
                        <p>5651</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Class 1 genes<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>8.6%</p>
                     </c>
                     <c ca="left">
                        <p>9.0%</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Class 2 genes<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>18.0%</p>
                     </c>
                     <c ca="left">
                        <p>20.0%</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Class 3 genes<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>44.5%</p>
                     </c>
                     <c ca="left">
                        <p>26.8%</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Class 4 genes<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>28.9%</p>
                     </c>
                     <c ca="left">
                        <p>44.2%</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Number of strain-specific regions<sup>c</sup></p>
                     </c>
                     <c ca="left">
                        <p>58</p>
                     </c>
                     <c ca="left">
                        <p>54</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total DNA in strain-specific regions</p>
                     </c>
                     <c ca="left">
                        <p>541,215 (8.3%)</p>
                     </c>
                     <c ca="left">
                        <p>261,426 (4.2%)</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>GC content (strain-specific regions)</p>
                     </c>
                     <c ca="left">
                        <p>59.60%</p>
                     </c>
                     <c ca="left">
                        <p>59.80%</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total number of genes (strain-specific regions)</p>
                     </c>
                     <c ca="left">
                        <p>478</p>
                     </c>
                     <c ca="left">
                        <p>234</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Class 1 genes<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>3.3%</p>
                     </c>
                     <c ca="left">
                        <p>9.8%</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Class 2 genes<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>4.0%</p>
                     </c>
                     <c ca="left">
                        <p>3.0%</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Class 3 genes<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>29.7%</p>
                     </c>
                     <c ca="left">
                        <p>30.8%</p>
                     </c>
                  </r>
                  <r>
                     <c indent="1" ca="left">
                        <p>Class 4 genes<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>63.0%</p>
                     </c>
                     <c ca="left">
                        <p>56.4%</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p><sup>a</sup>Standard deviation was calculated using a sliding 1 kb window (see Additional data file 1). <sup>b</sup>Classes 1-4 refer to the confidence rating assigned to the predicted gene function, as previously described [7,22]. Class 1 genes are those whose function has been experimentally validated in <it>P. aeruginosa</it>. Class 2 genes are highly similar to genes whose functions have been validated in another organism. Class 3 genes have hypothesized functions based on limited similarity to other genes or structural/functional domains. Class 4 genes are open reading frames (ORFs) of unknown function. <sup>c</sup>Strain-specific regions with at least one ORF.</p>
               </tblfn>
            </tbl>
            <p>The PA14 and PAO1 genomes are largely colinear with the exception of one major rearrangement that has previously been described: an inversion between two of four dispersed copies of a large ribosomal RNA cluster (Figure <figr fid="F1">1</figr><abbrgrp><abbr bid="B7">7</abbr></abbrgrp>). We used long-range polymerase chain reaction (PCR) spanning the rRNA clusters to verify the inversion in the sequenced PA14 and PAO1 genomes; PCR products predicted to be indicative of one orientation or the other were only generated when either PAO1 or PA14 DNA was used as the template (Figure <figr fid="F2">2a,b</figr>). When 18 diverse <it>P. aeruginosa </it>strains were subjected to this same PCR analysis, all 18 of these isolates had or resembled the PA14 genome structure with respect to the large inversion, whereas none of the 18 strains had or resembled the PAO1 genome structure (data not shown). Of note, additional PAO1 clones (distinct from the isolate that was sequenced) also appear to contain the same inversion found in PA14 <abbrgrp><abbr bid="B7">7</abbr></abbrgrp>.</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Circular map of the PA14 genome</p>
               </caption>
               <text>
                  <p>Circular map of the PA14 genome. The outermost circle represents the chromosomal location: major and minor ticks represent 500 and 100 kb increments, respectively. The origin and presumptive terminus of replication are indicated by green and red arrows, respectively. The locations and orientations of predicted genes are shown by rectangles in the next pair of circles; genes on the outer circle are transcribed on the plus strand and genes on the inner circle are transcribed on the minus strand. The genes are color-coded according to functional categories (see below). Blue arrowheads indicate the locations and relative orientations of four ribosomal RNA gene clusters; the published PAO1 sequence contains an inversion (gray arrow) with respect to PA14 resulting from a presumptive recombination event between two of the rRNA clusters. The innermost circle represents the GC content as calculated for non-overlapping 1 kb windows of the plus strand. A linear map and full annotations of each gene (including color codes for functional categories) are available at the Ausubel lab PA14 sequencing website [20] and the full sequence and annotations have been deposited in GenBank (GenBank: <ext-link ext-link-type="gen" ext-link-id="CP000438">CP000438</ext-link>).</p>
               </text>
               <graphic file="gb-2006-7-10-r90-1"/>
            </fig>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Chromosomal rearrangement in PAO1 repositions the replication terminus relative to the origin</p>
               </caption>
               <text>
                  <p>Chromosomal rearrangement in PAO1 repositions the replication terminus relative to the origin. <b>(a) </b>Schematic of PAO1 and PA14 chromosomes. The region with the same orientation in both strains is shown with a thick red line; a thin blue line represents the inverted region. Arrows represent the positions and orientations of the four ribosomal RNA clusters. PCR products designed with unique sequences flanking each rRNA cluster are indicated by numbers next to each arrow. PCR products 1 and 2 (purple numbers) are diagnostic for the PAO1 chromosome structure; PCR products 3 and 4 (black numbers) are diagnostic for the PA14 chromosome structure. The position of the presumptive terminus of replication in each strain is indicated by an orange triangle marked with the corresponding position along the chromosome (expressed as the percentage of the whole chromosome, starting from the origin of replication and moving in a clockwise direction). <b>(b) </b>Diagnostic long-range PCR spanning each ribosomal RNA repeat demonstrates the inversion in PAO1. PCR products corresponding to the numbers indicated in panel a were generated using genomic DNA from PAO1 (left panel) or PA14 (right panel). PCR products 1 and 2 were obtained only when using PAO1 genomic DNA (the weak background band for product 1 seen using PA14 as a template was also observed for 18 additional <it>P. aeruginosa </it>strains tested). PCR products 3 and 4 were obtained only when using PA14 genomic DNA. PCR products 5 and 6 were obtained from both strains. <b>(c) </b>GC skew analysis was performed using 1 kb windows, and the cumulative GC skew is shown on the y-axis as a function of chromosomal location (x-axis) for PA14 (black line) and PAO1 (purple line). The position of the peak indicates the likely position of the terminus of replication. For PA14 the peak is centered in the middle of the chromosome (at 49.2% of the genome, between coordinates 3,219,001 and 3,220,000), whereas the peak for PAO1 is offset with respect to the origin of replication as a result of the inversion (occurring at 38.8% of the genome, between coordinates 2,428,001 and 2,429,000). PCR, polymerase chain reaction.</p>
               </text>
               <graphic file="gb-2006-7-10-r90-2"/>
            </fig>
            <p>We also compared the GC skews of the PA14 and PAO1 genomes. GC skew is defined as the value of [G-C]/[G+C] where G and C represent the local base frequencies of G and C, respectively. In prokaryotic genomes there is a bias toward G over C on the leading strand of DNA synthesis <abbrgrp><abbr bid="B3">3</abbr></abbrgrp>. Therefore, when measured at regular intervals along the chromosome (1 kilobase [kb] segments) GC skew tends to have a positive value on the leading strand of DNA synthesis and a negative value on the lagging strand, resulting in polarity changes at the origin and terminus of replication. The putative position of the replicative terminus is therefore operationally defined as the peak of the cumulative GC skew and it typically resides opposite the origin of replication in bacterial genomes <abbrgrp><abbr bid="B3">3</abbr></abbrgrp>. For PA14, the peak GC skew was indeed mapped opposite the replication origin (at 49.2% of the genome; Figure <figr fid="F2">2a,c</figr>). In contrast, the position of the terminus in the sequenced PAO1 chromosome is shifted relative to the origin (at 38.8% of the genome). These observations argue that the PA14 chromosome with respect to this large inversion is more representative of the canonical or ancestral <it>P. aeruginosa </it>genome than that of the sequenced PAO1 isolate. This interpretation is further supported by the finding that the inversion in the sequenced strain occurred sometime after 1990 (a PAO1 cosmid library originally described in that year was shown not to contain the inversion <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>). However, the physiologic consequences of such an inversion and asymmetric replication cycle are not clear.</p>
         </sec>
         <sec>
            <st>
               <p>PA14 gene annotation</p>
            </st>
            <p>We annotated the PA14 genome and identified 5973 predicted open reading frames (ORFs; 322 more than in PAO1; Table <tblr tid="T1">1</tblr>). Summaries of all predicted PA14 genes and their distribution among different functional categories are presented in Additional data files 2 and 3, respectively. We performed a reciprocal NCBI-BLAST (basic local alignment search tool) search of each gene in either PA14 or PAO1 against the total collection of genes in the other strain (specifically, each PA14 gene was BLASTed against the complete set of PAO1 genes, and <it>vice versa</it>). The position of each best BLAST hit was plotted (with the PA14 genomic location on the x-axis, and the PAO1 coordinate on the y-axis; Figure <figr fid="F3">3</figr>), confirming that the two genomes are largely colinear, with the exception of the large inversion described above. Individual PA14 genes that had no counterpart in PAO1 are shown as individual (green) data points on the x-axis, and PAO1 genes absent in PA14 are represented as (pink) data points on the y-axis. Large clusters of these strain-specific genes often correlated with regions of the respective genomes in which the local GC content was lower than that of the total genome (Figure <figr fid="F3">3</figr>).</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>ORF-by-ORF alignments of PA14 and PAO1</p>
               </caption>
               <text>
                  <p>ORF-by-ORF alignments of PA14 and PAO1. Each predicted ORF in PA14 was compared using BLAST with all annotated PAO1 ORFs, and the best match was indicated as a single data point with the chromosomal locations of the match in each genome. Reciprocal BLAST searches were also performed (using individual PAO1 ORFs against the complete set of PA14 ORFs). Matches in the forward direction are indicated by red diamonds, and matches in the reverse orientation are indicated by blue diamonds. Genes that fall outside of the diagonals (non-colinear genes) are a combination of translocations and gene pairs in which a true ortholog is missing in one strain but a similar gene exists elsewhere in its genome and the two genes have been selected as reciprocal best BLAST matches. Genes in one genome that fail to have a BLAST match counterpart in the other genome are represented on the x-axis for PA14-specific genes (green diamonds) and on the y-axis for PAO1-specific genes (pink diamonds). The GC contents for each genome are represented next to the two axes using a light-blue graph; the positions that correspond to GC contents of 30%, 50%, and 70% are indicated. BLAST, basic local alignment search tool; ORF, open reading frame.</p>
               </text>
               <graphic file="gb-2006-7-10-r90-3"/>
            </fig>
            <p>Using a combination of raw sequence and ORF-based global alignments of the two genomes, we compiled a list of gene clusters present in one strain but absent in the other (58 PA14 regions absent in PAO1 containing 478 genes, and 54 PAO1 regions absent in PA14 containing 234 genes; Table <tblr tid="T1">1</tblr> and Additional data file 4). We refer to these as PA14-specific or PAO1-specific regions for the purposes of this discussion (recognizing that these genes may be present in other isolates of <it>P. aeruginosa </it>and are not strictly strain specific). Many of these gene clusters have hallmarks of horizontally acquired DNA, including direct repeats, insertion sequences, tRNA genes at their boundaries (data not shown), and/or anomalous GC contents (PA14-specific clusters have an average GC content of 59.6%, which is more than one standard deviation below the whole genome average of 66.3%; Table <tblr tid="T1">1</tblr>).</p>
            <p>These strain-specific regions contain a high proportion of genes of unknown function as compared with the whole genome. Each PA14 (and PAO1) annotation has a confidence score associated with the described gene function <abbrgrp><abbr bid="B7">7</abbr><abbr bid="B22">22</abbr></abbrgrp>. A class 1 designation refers to genes whose functions have been experimentally validated in <it>P. aeruginosa</it>, class 2 genes are highly similar to genes whose functions have been validated in other organisms, class 3 genes have hypothesized functions based on limited similarity to other genes or structural/functional domains, and class 4 genes are ORFs of unknown function. For the PA14-specific regions, 63% of the predicted ORFs have no known function, whereas only 28.9% of genes in the whole genome have class 4 annotations (Table <tblr tid="T1">1</tblr>). Therefore, gene identity alone could not indicate whether virulence-related genes were enriched in PA14-specific regions.</p>
         </sec>
         <sec>
            <st>
               <p>Conservation of PA14-specific genes and their putative role in virulence</p>
            </st>
            <p>If a PA14 strain-specific region were functioning as a canonical pathogenicity island, then it should be more prevalent among other pathogenic isolates (and less prevalent among avirulent isolates). To test this hypothesis we needed to establish an objective measure of pathogenicity to compare different <it>P. aeruginosa </it>strains as well as to develop a high throughput method for determining the genomic content of the different strains. We used a model host infection system (the nematode <it>Caenorhabditis elegans</it>) to rank order the virulence of 18 diverse <it>P. aeruginosa </it>strains, using PA14 and PAO1 as reference strains. The 18 <it>P. aeruginosa </it>strains included 13 clinical isolates from a variety of infection types (CF lung infections, urinary tract infections, ocular infections, and blood isolates), one laboratory strain, and four environmental isolates. This same set of strains had been used in a previous study of <it>P. aeruginosa </it>strain diversity <abbrgrp><abbr bid="B9">9</abbr></abbrgrp>. We used a custom microarray-based system (described below) to determine relatedness of the 20 (18 plus PAO1 and PA14) <it>P. aeruginosa </it>strains.</p>
            <p>In the <it>C. elegans </it>model pathogenicity system <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>, an age-synchronized population of nematodes is fed the pathogen to be tested (instead of <it>Escherichia coli</it>, its traditional laboratory food source) and the longevity of the nematodes is determined. As shown previously, the longevity of <it>C. elegans </it>feeding on a particular <it>P. aeruginosa </it>strain correlates with virulence of the strain in mice <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B15">15</abbr><abbr bid="B18">18</abbr></abbrgrp>. The set of <it>P. aeruginosa </it>strains tested exhibited a full range of virulence phenotypes, including both the upper and lower limits that the assay system is capable of measuring (Figure <figr fid="F4">4a</figr>). PA14 (dark blue diamonds, second curve from the left) is extremely efficient at killing nematodes, whereas the less pathogenic PAO1 is intermediate (pink squares), killing more slowly than PA14 but more quickly than <it>E. coli </it>(negative control; yellow squares, second curve from the right).</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Poor correlation between PA14-pathogenicity genes and virulence in other strains</p>
               </caption>
               <text>
                  <p>Poor correlation between PA14-pathogenicity genes and virulence in other strains. <b>(a) </b><it>C. elegans </it>survival curves in the presence of 19 <it>P. aeruginosa </it>strains and OP50 (an <it>E. coli </it>control). The names of the strains tested are sorted according to the rank order of virulence, from most virulent at the top to the least virulent at the bottom, as determined by examining the time required to kill 50% of the nematodes. Black brackets indicate strains with indistinguishable virulence. Strain names are followed by the strain source and color-coded by strain source, as shown in panel b. Strain CF27 is not shown in this dataset; however, a similar experiment places its rank order virulence between strains E2 and S35004 (indicated by a black arrow). The same relative rank orders were obtained in two additional experiments. <b>(b) </b>Dendrogram representing the relatedness of 20 <it>P. aeruginosa </it>strains based on the presence or absence of genes as assayed by genomic DNA hybridizations to a custom microarray. Hierarchical clustering analysis was performed using the city-block distance metric. The name of each strain is shown, along with the source of the strain (UTI, urinary tract infection; CF, cystic fibrosis respiratory infection; env, environmental isolate), and the rank order virulence of each strain as determined in panel a (1, most virulent; 20, least virulent). Strains with indistinguishable virulence were given a tied rank order (also see Table 2). <b>(c) </b>Presence or absence of PA14 virulence genes in additional isolates. Data for each strain tested are presented in columns. Strains are arranged from left to right in order of decreasing virulence, in the same order as shown in panel a; column headers refer to the 20 strain numbers used in Table 2. 
Columns with no gaps between them represent groups of strains with indistinguishable virulence (strains 4 and 5; strains 8, 9 and 10; and strains 14, 15 and 16). Genes assayed are represented as rows, with adjacent rows representing ORFs present within a given gene cluster (PA14 region names shown on the left are abbreviated to remove the 'PA14' prefix). Each gene is described as present (blue), absent (yellow), or indeterminate (red). The positions of mutations resulting in reduced virulence in PA14 are indicated by lines to the right; numbers in black refer to entries in Table 3, and red numbers in parentheses indicate the Spearman's rank correlation coefficients between presence or absence of the gene in other strains and their rank order virulence ratings.</p>
               </text>
               <graphic file="gb-2006-7-10-r90-4"/>
            </fig>
            <p>The observation that PAO1 is more virulent than many other tested strains suggests that it has not become attenuated because of extensive passaging in the laboratory; rather, its virulence is probably that of a moderately pathogenic strain, with other strains more representative of truly 'avirulent' isolates. When comparing strains derived from the same type of infection, there was no consistent clustering with respect to their phenotype in <it>C. elegans</it>. For example, both the most and the least virulent strains tested were isolates from CF infections. Similarly, the five urinary tract infection strains exhibited a wide range of virulent to avirulent phenotypes. Importantly, two closely related environmental isolates (MSH3 and MSH10) were the fourth and fifth most virulent strains tested, indicating that nonclinically isolated strains can also have the potential to be infectious.</p>
            <p>To test the hypothesis that the virulence of the 20 <it>P. aeruginosa </it>strains correlates with the presence of particular virulence islands, we performed a microarray-based analysis of the genomic content (a process described as genomotyping <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>) of the <it>P. aeruginosa </it>strains. We arrayed 285 synthetic oligonucleotides (70 mers) corresponding to PA14 genes that are absent in PAO1 and 130 oligonucleotides corresponding to PAO1 genes that are absent in PA14, along with additional sequences serving as positive and negative controls (see Materials and methods, below, and Additional data files 5 and 6). We first used the array data to generate a hierarchic clustering dendrogram showing the relatedness of the 20 <it>P. aeruginosa </it>strains (Figure <figr fid="F4">4b</figr>). Next, we used the <it>C. elegans </it>virulence data in Figure <figr fid="F4">4a</figr> to rank order the 20 strains and then examine the microarray data to determine whether the presence or absence of PA14-specific (or PAO1-specific) genes correlated with virulence (also see Table <tblr tid="T2">2</tblr> and Additional data file 6). Strains were ordered from the most virulent (rank order 1) to the least virulent (rank order 20), with strains that had equivalent virulence assigned a tied rank. When the virulence rank order of each strain was superimposed on the dendrogram describing the relatedness of each strain based on genomic content (Figure <figr fid="F4">4b</figr>), no strong correlation was observed with the relative virulence of each strain in <it>C. elegans</it>. There are small clusters of similarly avirulent or virulent strains; for example, strains 6077, U2504, JJ692, S54485, and X13273 grouped together and possess similar virulence rankings (10, 6, 12, 10, and 10, respectively). 
However, these small clusters were occasionally punctuated by exceptions: a cluster of weakly virulent or avirulent strains (CF5, E2, PAK and CF27, with rank orders of 20, 17, 13, and 18, respectively) also includes strain UDL, which is the third most pathogenic strain tested.</p>
            <tbl id="T2" hint_layout="double">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Relative virulence of <it>P. aeruginosa </it>strains in <it>C. elegans</it></p>
               </caption>
               <tblbdy cols="4">
                  <r>
                     <c ca="left">
                        <p>Strain number<sup>a</sup></p>
                     </c>
                     <c ca="left">
                        <p>Strain name</p>
                     </c>
                     <c ca="left">
                        <p>Strain source<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>Rank order of virulence in <it>C. elegans</it><sup>c</sup></p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>1</p>
                     </c>
                     <c ca="left">
                        <p>CF18</p>
                     </c>
                     <c ca="left">
                        <p>CF</p>
                     </c>
                     <c ca="left">
                        <p>1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>2</p>
                     </c>
                     <c ca="left">
                        <p>PA14</p>
                     </c>
                     <c ca="left">
                        <p>burn</p>
                     </c>
                     <c ca="left">
                        <p>2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>3</p>
                     </c>
                     <c ca="left">
                        <p>UDL</p>
                     </c>
                     <c ca="left">
                        <p>UTI</p>
                     </c>
                     <c ca="left">
                        <p>3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>4</p>
                     </c>
                     <c ca="left">
                        <p>MSH3</p>
                     </c>
                     <c ca="left">
                        <p>Environmental</p>
                     </c>
                     <c ca="left">
                        <p>5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>5</p>
                     </c>
                     <c ca="left">
                        <p>MSH10</p>
                     </c>
                     <c ca="left">
                        <p>Environmental</p>
                     </c>
                     <c ca="left">
                        <p>5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>6</p>
                     </c>
                     <c ca="left">
                        <p>U2504</p>
                     </c>
                     <c ca="left">
                        <p>UTI</p>
                     </c>
                     <c ca="left">
                        <p>6</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>7</p>
                     </c>
                     <c ca="left">
                        <p>62</p>
                     </c>
                     <c ca="left">
                        <p>Environmental</p>
                     </c>
                     <c ca="left">
                        <p>7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>8</p>
                     </c>
                     <c ca="left">
                        <p>6077</p>
                     </c>
                     <c ca="left">
                        <p>Ocular</p>
                     </c>
                     <c ca="left">
                        <p>10</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>9</p>
                     </c>
                     <c ca="left">
                        <p>S54485</p>
                     </c>
                     <c ca="left">
                        <p>UTI</p>
                     </c>
                     <c ca="left">
                        <p>10</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>10</p>
                     </c>
                     <c ca="left">
                        <p>X13273</p>
                     </c>
                     <c ca="left">
                        <p>Blood</p>
                     </c>
                     <c ca="left">
                        <p>10</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>11</p>
                     </c>
                     <c ca="left">
                        <p>PAO1</p>
                     </c>
                     <c ca="left">
                        <p>Wound</p>
                     </c>
                     <c ca="left">
                        <p>11</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>12</p>
                     </c>
                     <c ca="left">
                        <p>JJ692</p>
                     </c>
                     <c ca="left">
                        <p>UTI</p>
                     </c>
                     <c ca="left">
                        <p>12</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>13</p>
                     </c>
                     <c ca="left">
                        <p>PAK</p>
                     </c>
                     <c ca="left">
                        <p>Laboratory</p>
                     </c>
                     <c ca="left">
                        <p>13</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>14</p>
                     </c>
                     <c ca="left">
                        <p>19660</p>
                     </c>
                     <c ca="left">
                        <p>Ocular</p>
                     </c>
                     <c ca="left">
                        <p>16</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>15</p>
                     </c>
                     <c ca="left">
                        <p>X24509</p>
                     </c>
                     <c ca="left">
                        <p>UTI</p>
                     </c>
                     <c ca="left">
                        <p>16</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>16</p>
                     </c>
                     <c ca="left">
                        <p>CF127</p>
                     </c>
                     <c ca="left">
                        <p>CF</p>
                     </c>
                     <c ca="left">
                        <p>16</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>17</p>
                     </c>
                     <c ca="left">
                        <p>E2</p>
                     </c>
                     <c ca="left">
                        <p>Environmental</p>
                     </c>
                     <c ca="left">
                        <p>17</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>18</p>
                     </c>
                     <c ca="left">
                        <p>CF27</p>
                     </c>
                     <c ca="left">
                        <p>CF</p>
                     </c>
                     <c ca="left">
                        <p>18<sup>d</sup></p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>19</p>
                     </c>
                     <c ca="left">
                        <p>S35004</p>
                     </c>
                     <c ca="left">
                        <p>Blood</p>
                     </c>
                     <c ca="left">
                        <p>19</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>20</p>
                     </c>
                     <c ca="left">
                        <p>CF5</p>
                     </c>
                     <c ca="left">
                        <p>CF</p>
                     </c>
                     <c ca="left">
                        <p>20</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p><sup>a</sup>This strain number corresponds to the order in which strains are listed in Figure 4c (microarray) from left to right. <sup>b</sup>References for each strain are listed in the report by Wolfgang and coworkers [9]. <sup>c</sup>Identical rank orders are shown for two or more strains with indistinguishable virulence. <sup>d</sup>Strain CF27 is not included in Figure 4a; its relative order is inferred based on other experiments. CF, cystic fibrosis; UTI, urinary tract infection.</p>
               </tblfn>
            </tbl>
            <p>In a previous study, Wolfgang and coworkers <abbrgrp><abbr bid="B9">9</abbr></abbrgrp> used Affymetrix GeneChips to survey these same 18 strains (with the exception of PA14) for the presence or absence of PAO1 genes and found no obvious pattern that would correlate genomic content with disease (or the type of infection from which the isolate was derived). Similarly, examination of the distribution of PA14-specific genes among the tested isolates did not reveal any obvious clustering of genomic content with respect to the source of the strain (see dendrogram in Figure <figr fid="F4">4b</figr>).</p>
         </sec>
         <sec>
            <st>
               <p>Identification of PA14-specific virulence genes and their conservation in other strains</p>
            </st>
            <p>The experiments described above showed that there was no correlation between the PA14-specific sequences in general and virulence in the <it>C. elegans </it>killing assay. We therefore performed a functional analysis of PA14-specific ORFs, identifying genes that were specifically required for pathogenicity and subsequently assessing their distribution among the other strains. Our laboratory has constructed a genome-wide, nonredundant transposon insertion mutant library in PA14 <abbrgrp><abbr bid="B24">24</abbr><abbr bid="B25">25</abbr></abbrgrp>. Using this library, we conducted a screen for mutants in PA14-specific genes that had reduced virulence in <it>C. elegans</it>. Nine genes were identified, which fell into six distinct clusters (Table <tblr tid="T3">3</tblr>). Three of these clusters are present in all of the other 19 <it>P. aeruginosa </it>strains but contain highly divergent sequences, including the O-antigen biosynthetic cluster (region PA14R38) and two groups of type 4 fimbrial biogenesis genes (regions PA14R77 and PA14R79). Oligonucleotides corresponding to the PA14-version of the O-antigen biosynthesis genes were included on the array and demonstrated that none of the other strains contain the PA14-versions of these genes; the genes for the two fimbrial synthesis clusters were not included on the array (because the sequences were not sufficiently divergent to meet our criteria for oligonucleotide design as outlined in Additional data file 1).</p>
            <tbl id="T3" hint_layout="double">
               <title>
                  <p>Table 3</p>
               </title>
               <caption>
                  <p>PA14-specific regions containing genes required for <it>C. elegans </it>killing</p>
               </caption>
               <tblbdy cols="8">
                  <r>
                     <c ca="left">
                        <p>PA14 region ID</p>
                     </c>
                     <c ca="left">
                        <p>Number of genes in region</p>
                     </c>
                     <c ca="left">
                        <p>GC content<sup>a</sup></p>
                     </c>
                     <c ca="left">
                        <p>PA14 gene ID</p>
                     </c>
                     <c ca="left">
                        <p>Previously assigned gene name</p>
                     </c>
                     <c ca="left">
                        <p>Gene function</p>
                     </c>
                     <c ca="left">
                        <p>Correlation coefficient of gene with rank order of virulence</p>
                     </c>
                     <c ca="left">
                        <p>Position of gene in Figure 4c</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="8">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>PA14R09</p>
                     </c>
                     <c ca="left">
                        <p>14</p>
                     </c>
                     <c ca="left">
                        <p>58.5</p>
                     </c>
                     <c ca="left">
                        <p>PA14_03370<sup>b</sup></p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>Unknown</p>
                     </c>
                     <c ca="left">
                        <p>0.02</p>
                     </c>
                     <c ca="left">
                        <p>1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>PA14R38</p>
                     </c>
                     <c ca="left">
                        <p>12</p>
                     </c>
                     <c ca="left">
                        <p>46.4</p>
                     </c>
                     <c ca="left">
                        <p>PA14_23420<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>ORF_10</p>
                     </c>
                     <c ca="left">
                        <p>O-antigen biosynthesis</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>2<sup>c</sup></p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>PA14_23430</p>
                     </c>
                     <c ca="left">
                        <p>ORF_11</p>
                     </c>
                     <c ca="left">
                        <p>O-antigen biosynthesis</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>3<sup>c</sup></p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>PA14R41</p>
                     </c>
                     <c ca="left">
                        <p>8</p>
                     </c>
                     <c ca="left">
                        <p>66</p>
                     </c>
                     <c ca="left">
                        <p>PA14_27680<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>C118</p>
                     </c>
                     <c ca="left">
                        <p>Unknown</p>
                     </c>
                     <c ca="left">
                        <p>0.63</p>
                     </c>
                     <c ca="left">
                        <p>4</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>PA14_27700<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>C120</p>
                     </c>
                     <c ca="left">
                        <p>Putative transcriptional regulator</p>
                     </c>
                     <c ca="left">
                        <p>0.63</p>
                     </c>
                     <c ca="left">
                        <p>5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>PA14R77</p>
                     </c>
                     <c ca="left">
                        <p>3</p>
                     </c>
                     <c ca="left">
                        <p>53.9</p>
                     </c>
                     <c ca="left">
                        <p>PA14_58760</p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>pilC</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>Type 4 fimbrial biogenesis</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>Not on oligo array<sup>c</sup></p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>PA14R78</p>
                     </c>
                     <c ca="left">
                        <p>112</p>
                     </c>
                     <c ca="left">
                        <p>59.7</p>
                     </c>
                     <c ca="left">
                        <p>PA14_59010<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>RL107</p>
                     </c>
                     <c ca="left">
                        <p>Unknown</p>
                     </c>
                     <c ca="left">
                        <p>0.44</p>
                     </c>
                     <c ca="left">
                        <p>6</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>PA14_59070</p>
                     </c>
                     <c ca="left">
                        <p>RL102</p>
                     </c>
                     <c ca="left">
                        <p>Unknown</p>
                     </c>
                     <c ca="left">
                        <p>0.44</p>
                     </c>
                     <c ca="left">
                        <p>7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>PA14R79</p>
                     </c>
                     <c ca="left">
                        <p>2</p>
                     </c>
                     <c ca="left">
                        <p>54.9</p>
                     </c>
                     <c ca="left">
                        <p>PA14_60290<sup>b</sup></p>
                     </c>
                     <c ca="left">
                        <p>
                           <it>pilW</it>
                        </p>
                     </c>
                     <c ca="left">
                        <p>Type 4 fimbrial biogenesis</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>Not on oligo array<sup>c</sup></p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p><sup>a</sup>GC content of the PA14 genome is 66.3 &#177; 4.3%. <sup>b</sup>These mutants were grown on minimal media and all had wild-type growth curves. <sup>c</sup>These gene clusters are present in all <it>P. aeruginosa </it>isolates, but the sequences are highly divergent. Oligos for the PA14-specific O-antigen cluster were included on the array, but none of the other strains contained the PA14-version of these genes. The two clusters involved in type 4 fimbrial biogenesis were not included on the array because the sequences were not sufficiently different to pass our criteria for oligo design (see Materials and methods).</p>
               </tblfn>
            </tbl>
            <p>The remaining three clusters contain genes that are absent in PAO1. As indicated in Table <tblr tid="T3">3</tblr>, these three clusters contain five virulence genes, including one gene with putative transcriptional regulator activity and four ORFs of unknown function. Figure <figr fid="F4">4c</figr> summarizes the array data for these three regions. The 20 strains tested are represented in columns arranged from left to right in order of decreasing pathogenicity (see Table <tblr tid="T2">2</tblr> for rank order of virulence). The PA14 genes tested (shown in rows) are described as present (blue), absent (yellow), or indeterminate (red, indicating that the hybridization intensity was intermediate and a present or absent call could not be made with confidence; see <supplr sid="S1">Additional data file 1</supplr> for further details). The positions of the genes that result in an avirulent phenotype when mutated in PA14 are indicated on the right (also see Table <tblr tid="T3">3</tblr>). If a cluster of genes was required for or predictive of virulence in nematodes then we would expect to see a bias for present (blue) calls toward the left and absent (yellow) calls toward the right.</p>
            <p>For these five virulence genes (and their associated three clusters), Spearman's rank correlation coefficients (relating their presence, absence, or indeterminate status with the virulence of the strain) were found to vary dramatically. The best correlation was found for two genes in region PA14R41 (correlation coefficients of 0.63). This is a cluster of eight genes known as the clone C-specific region common to clone C isolates (members of a clone family associated with CF infections <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>). Intermediate to no correlations were observed for the remaining two regions, namely PA14R78 and PA14R09, which had correlation coefficients of 0.44 and 0.02, respectively. Of note, PA14R78 is a previously described pathogenicity island (PAPI-1) shown to contain genes required for pathogenicity in plants and mammals <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>, although the two mutations in genes of unknown function that we identified in this cluster (PA14_59010 and PA14_59070; positions 6 and 7 in Figure <figr fid="F4">4c</figr>) were not among those previously examined. Regardless of the magnitude of the correlation, each virulence gene had exceptions to the expected trend, being present in attenuated strains and/or absent in virulent strains. Taken together, the functionally defined PA14 genes required for <it>C. elegans </it>killing are neither required for nor necessarily predictive of another strain's ability to be pathogenic.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>In this study we combined a traditional comparative genomic analysis with functional analyses, including genomotyping of other isolates, use of a genome-wide mutant library, and a model host infection system amenable to high-throughput screens, to ascertain the relationship between genomic content and virulence. We have found that PA14 and PAO1 are remarkably similar in total content and are largely colinear (with the exception of a previously described inversion). Because PA14 is significantly more virulent than PAO1 in most hosts, and previous studies have identified PA14 pathogenicity genes in regions that are absent in PAO1, we extended these observations to examine all of the PA14-specific genes for potential contributions to virulence. We began by examining 18 additional diverse isolates to assess the conservation of PA14-specific genes in other strains and whether they correlated with pathogenicity. In general, there was no obvious relationship between the presence of PA14-specific or PAO1-specific genes in other isolates and their virulence in <it>C. elegans </it>or the source of the strain. A specific examination of genes in these PA14-specific regions that were experimentally shown to contribute to virulence also failed to show a strong correlation between the presence of these genes and the pathogenicity of other isolates.</p>
         <p>Our results amend the general view of pathogenicity islands, in which the acquisition of an island leads to the addition of gene products whose contribution to virulence is apparent based on the known function of the virulence gene and does not depend (necessarily) on genes outside of the island. For example, an island may contain a complete complement of genes required for the synthesis of secreted toxins, adhesins, invasion systems, iron uptake systems, or secretion systems (such as the type III and type IV systems) <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B2">2</abbr></abbrgrp>. In these 'classic' cases, the presence or absence of individual pathogenicity islands correlates directly with a given gene product or process known to be required for virulence (and, therefore, with overall virulence). <it>P. aeruginosa </it>strains contain genes that fall into this category; for example, the presence of a pathogenicity island containing the type III secretion effector ExoU (present on PA14 region PA14R72) makes strains more cytotoxic to mammalian cells <abbrgrp><abbr bid="B27">27</abbr></abbrgrp> and is required for pathogenicity in <it>Galleria </it>and the amoeba <it>Dictyostelium discoideum </it><abbrgrp><abbr bid="B16">16</abbr><abbr bid="B28">28</abbr></abbrgrp>. However, we have also identified PA14 pathogenicity-related genes whose presence or absence does not correlate directly with degree of virulence, suggesting that these genes do not function autonomously to affect virulence. Our genomic analysis of PA14 virulence has demonstrated that pathogenicity in this organism is both multifactorial and combinatorial. Within a given isolate, virulence is multifactorial in that several factors combine to result in an overall virulence phenotype. 
Additionally, when comparing different strains, virulence is combinatorial in that pathogenicity factors may behave differently and that distinct combinations or groupings of these determinants may result in comparable virulence phenotypes.</p>
         <p>What might account for the apparent complexity of PA14-specific virulence factors with respect to their conservation and role in other strains? First, it is clear that our analysis of genomic content in other strains is only an initial step in addressing similarities or differences in gene function among isolates; the apparent absence of a gene cannot exclude the existence of a functionally similar gene with significant sequence divergence, and the apparent presence of a gene cannot determine whether a gene is expressed. Transcriptional profiling of strain-specific genes (particularly in the presence of a putative host) will be a critical next step in clarifying the genes that contribute to virulence. Additional sequence information from other strains will be required to determine whether other functionally similar genes exist or whether orthologous genes are likely to be fully functional (intact ORFs with no polymorphisms that might alter protein function). Second, given the multifactorial and combinatorial nature of <it>P. aeruginosa </it>virulence, a full understanding of pathogenicity will require elucidation of how strain-specific genes (potentially responsible for differences in severity of disease among isolates) interact with core genome genes required for a base level of virulence. Our laboratory is currently extending the screen for PA14 mutants attenuated in <it>C. elegans </it>killing beyond the PA14-specific genes to include the entire genome (Liberati NT, Feinbaum RL, Ausubel FM, unpublished observations). Third, an important future direction will be to determine how generalizable our observations are in other model hosts. We are currently conducting pilot experiments to assess the viability of screening both the set of 20 <it>P. 
aeruginosa </it>strains and the PA14 mutant library in insects and plants to determine whether the presence or absence of identified PA14 virulence genes in other isolates correlates with their overall pathogenicity. A thorough understanding of networks of genes that are necessary for virulence in many or the majority of <it>P. aeruginosa </it>isolates (as opposed to genes that contribute to pathogenicity only in a subset of strains in which they are present) will be crucial for the design of effective therapeutics to combat the wide variety of human infections observed in clinical settings.</p>
         <p>The evolution of virulence for a dedicated human pathogen generally involves the acquisition of discrete virulence functions required for specific interactions with the host, followed by gene loss related to specialization and potential restriction to the new environmental niche. In contrast, ubiquitous environmental micro-organisms continuously encounter dramatic changes in their ecosystem and the maintenance of genome complexity is preferable to optimization for a single niche. For environmental pathogenic fungi such as <it>Cryptococcus neoformans </it>that do not require animal hosts for replication or survival, the phenomenon of 'ready made' virulence has been described in which the selection and maintenance of virulence factors occurs during infection of environmental predators such as nematodes and ameba <abbrgrp><abbr bid="B29">29</abbr><abbr bid="B30">30</abbr><abbr bid="B31">31</abbr></abbrgrp>. We propose that this multi-host view of pathogenic evolution also applies to environmental bacteria such as <it>P. aeruginosa </it>that infect nematodes, insects, plants, and ameba in the laboratory and probably encounter a similar range of potential hosts in the wild. The recent discovery that <it>C. elegans </it>pre-exposed to PA14 can modify its olfactory preferences to avoid the pathogen, and that this 'learned' avoidance behavior does not occur with nonpathogenic mutants of PA14, suggests that an interaction between these two organisms is biologically relevant <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>. Therefore, selection for pathogenicity may occur constantly in the environment; indeed, among the 20 isolates surveyed in this study, two environmental strains (MSH3 and MSH10) were among the most virulent, demonstrating that pathogenic potential exists even in nonclinical isolates. Furthermore, as an environmental organism, <it>P. 
aeruginosa </it>is not likely to undergo genome reduction associated with host restriction as in dedicated human pathogens. A notable exception is the case of CF infections, in which a clonal population remains isolated in a defined environment over a long period of time and tends not to spread to other patients. Indeed, a recent comparison of an early and late CF isolate from the same patient (at 6 months and 8 years of age) revealed an accumulation of multiple mutations leading to gene inactivation or loss, including a large 188 kb deletion <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>. When these mutated genes were examined in early and late infections of 29 additional CF patients, most of the observed mutations arose relatively late in the infections.</p>
         <p>Our laboratory and others have previously shown that aspects of PA14 pathogenicity are conserved in model hosts and in mammalian hosts; PA14 virulence factors have been shown to be required for disease in both model hosts and mammals <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr><abbr bid="B16">16</abbr><abbr bid="B17">17</abbr><abbr bid="B19">19</abbr><abbr bid="B28">28</abbr><abbr bid="B34">34</abbr></abbrgrp>, and components of the host defense response are conserved in model hosts and humans <abbrgrp><abbr bid="B34">34</abbr><abbr bid="B35">35</abbr><abbr bid="B36">36</abbr></abbrgrp>. Although these observations are critical in validating the use of simple, genetically tractable organisms as surrogate hosts to study human disease, perhaps the more appropriate perspective is to view nematodes, insects, plants, and ameba as the relevant natural hosts in which the selection for and evolution of pathogenic traits occurs, and the ability to subsequently infect humans is a secondary effect of these interactions.</p>
      </sec>
      <sec>
         <st>
            <p>Materials and methods</p>
         </st>
         <sec>
            <st>
               <p>Shotgun genome sequencing</p>
            </st>
            <p>Shotgun sequencing of PA14 was performed using 65,800 plasmids containing 2-4 kb fragments of genomic PA14 DNA, resulting in over 10-fold coverage. Sequence reads were assembled using the Phred, Phrap, and Consed tools <abbrgrp><abbr bid="B37">37</abbr><abbr bid="B38">38</abbr><abbr bid="B39">39</abbr></abbrgrp>. Details of finishing methods are described in Additional data file 1.</p>
            <p>A long-range PCR-based method was used to assess whether particular <it>P. aeruginosa </it>genomes contain a PA14-like or a PAO1-like arrangement of genome sequence between the two most distant copies of a large ribosomal RNA cluster (Figures <figr fid="F1">1</figr> and <figr fid="F2">2a,b</figr>; also see Stover and coworkers <abbrgrp><abbr bid="B7">7</abbr></abbrgrp>). Primer pairs used to amplify two products specific for the PA14 chromosomal arrangement are as follows: 807.LL_rev (CGAACTGGAGGAAGTCTTCG) + 2-5'_2 (CGAGGCTTTCGTCTATCCAG), and 837.LL (AACTGGTGGAGGGAGAAGGAT) + 803.RR.rev (TAGCCTTCAATTCCACCTGG). Primer combinations used to amplify two PAO1-specific products are as follows: 807.LL_rev + 803.RR.rev, and 837.LL + 2-5'_2. These diagnostic primer pairs were also used to survey 18 additional strains (Table <tblr tid="T2">2</tblr>) to determine whether the PA14 or the PAO1 orientation was more representative of the ancestral <it>P. aeruginosa </it>chromosome. Of the 18 strains tested, none generated a PAO1-specific amplification product. Using the primers for the PA14 arrangement, seven of the 18 strains yielded products with both primer pairs, nine of 18 had a strong PCR product with one of the two primer pairs and a weak product with the second primer pair, and two of 18 exhibited a weak product with one primer pair and no product with the second.</p>
         </sec>
         <sec>
            <st>
               <p>Sequence analysis and gene annotation</p>
            </st>
            <p>In determining GC content for PA14 and PAO1, standard deviations were determined using a continuous sliding window of 1 kb, and comparing the GC content for these regions with that of the whole genome. GC skew analysis was performed (using the formula GC skew = [n(G) - n(C)]/[n(G) + n(C)], where n(i) is the number of nucleotides of type i, applied to 1 kb segments of each genome) to identify the peak cumulative GC skew as the likely position of the replication terminus <abbrgrp><abbr bid="B3">3</abbr></abbrgrp>. Global alignments of the PA14 and PAO1 genomes were performed using the MUMmer 3.0 software package <abbrgrp><abbr bid="B40">40</abbr></abbrgrp> to identify strain-specific regions. Automated ORF predictions were made using a combination of the BLAST and Glimmer2 algorithms <abbrgrp><abbr bid="B41">41</abbr><abbr bid="B42">42</abbr></abbrgrp>. Each predicted ORF was assigned a PA14 LocusName, beginning with 'PA14_' followed by five numerals. ORFs were numbered starting with PA14_00010 (<it>dnaA</it>), increasing in increments of 10 to allow for future insertions of additional genes or functional RNAs. Further details of ORF prediction and annotation are provided in Additional data file 1.</p>
         </sec>
         <sec>
            <st>
               <p>Microarray genomotyping of <it>P. aeruginosa </it>strains</p>
            </st>
            <p>70-mer oligonucleotides for microarrays were designed as described previously <abbrgrp><abbr bid="B43">43</abbr></abbrgrp> for 285 PA14-specific sequences, 130 PAO1-specific sequences, 11 genes common to both strains (to serve as positive controls), and additional genes and negative controls (see Additional data file 1). Chromosomal DNA from PA14, PAO1 (the sequenced isolate), and 18 additional <it>P. aeruginosa </it>strains described previously <abbrgrp><abbr bid="B9">9</abbr></abbrgrp> was digested with HaeIII and labeled with Cyanine-3 or Cyanine-5 using the MICROMAX ASAP labeling kit (part #MPS544001KT; PerkinElmer, Wellesley, MA, USA). Labeled samples were combined in random pairs and hybridized to the arrays. Observed intensities for replicate hybridizations for each strain were averaged and log2 ratios were computed to determine the presence/absence of each gene based on a cut-off determined independently for each sample (see Additional data file 1). For each gene, a Spearman's rank correlation coefficient was calculated to describe the relationship between the spectrum of present/absent calls and the determined rank order virulence in <it>C. elegans </it>(see below). Hierarchical clustering analysis of strain relationships was performed using Cluster 3.0 <abbrgrp><abbr bid="B44">44</abbr></abbrgrp> and Java Treeview <abbrgrp><abbr bid="B45">45</abbr></abbrgrp>. All microarray data are included in Additional data files 5 and 6 and have also been deposited in ArrayExpress (ArrayExpress E-MEXP-824).</p>
         </sec>
         <sec>
            <st>
               <p><it>C. elegans </it>pathogenicity assays</p>
            </st>
            <p>The 20 <it>P. aeruginosa </it>strains analyzed by genomotyping were cultured overnight in Luria broth (LB) and assayed in the <it>C. elegans </it>killing system as described previously <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>, with the exception that assays were performed using <it>fer-15(b26)ts;fem-1(hc17) </it>temperature-sensitive sterile mutant nematodes. The assays were carried out at the restrictive temperature (25&#176;C) to prevent progeny formation and to allow the experiments to continue long enough to examine less pathogenic strains (for which progeny would typically overwhelm the assay plate by the end of the experiment). Bacterial strains are rank ordered from most to least virulent based on the position of the LT<sub>50 </sub>(the time at which 50% lethality was observed) in Figure <figr fid="F4">4a</figr>. In cases in which the LT<sub>50 </sub>was overlapping, rank orders were represented as a tied value for the strains in question. Strain CF27 is not included in the data shown in Figure <figr fid="F4">4a</figr>; however, its rank order in a similar experiment places it between strains E2 and S35004. The relative rank orders shown in Figure <figr fid="F4">4a</figr> are consistent with those observed in two additional experiments; although the absolute LT<sub>50 </sub>values increased or decreased for given strains between experiments, the relative rank orders remained consistent.</p>
            <p>To screen for avirulent PA14 mutants, we utilized a nonredundant transposon insertion library <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. All available mutants in PA14-specific genes (349 in total) were grown in 150 &#956;l of LB media in 0.5 ml 96-well Masterblocks (part #786261; Greiner, Monroe, NC, USA). Cultures were agitated at 225 rpm and incubated for 16 hours at 37&#176;C. A volume of 10 &#956;l of each culture was spotted onto slow killing agar in 2 wells of a six-well plate <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B18">18</abbr></abbrgrp>, allowed to grow at 37&#176;C for 24 hours, and left at room temperature for an additional 24 hours. Five L4 stage N2 nematodes were transferred manually to each well, and the number and age of progeny were recorded after 4 days at 25&#176;C. The 349 mutants in PA14-specific genes were screened on two separate occasions, and any that were highly attenuated in either screen or were attenuated in both screens were re-examined in a secondary screen as described using wild-type N2 nematodes <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>. Six mutants were tested for growth in minimal (M63) media and all were found to have wild-type growth curves (Table <tblr tid="T3">3</tblr>). These included four of the five mutants in PA14 genes completely absent in PAO1 (examined in Figure <figr fid="F4">4c</figr>).</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Additional data files</p>
         </st>
         <p>The following additional data are available with the online version of this paper. Additional data file <supplr sid="S1">1</supplr> is a document summarizing supplementary methods. Additional data file <supplr sid="S2">2</supplr> is a table of PA14 gene annotations: the first worksheet contains the data, and the second worksheet contains a detailed description of the contents of the table and serves as a legend for the first worksheet. Additional data file <supplr sid="S3">3</supplr> is a table showing the percentage of PA14 and PAO1 genes corresponding to each of 28 functional categories (shown for both the whole genome and strain-specific genes as described in Additional data file 4): the first worksheet contains the data, and the second worksheet contains a detailed description of the contents of the table and serves as a legend for the first worksheet. Additional data file <supplr sid="S4">4</supplr> is a table summarizing properties of PA14-specific and PAO1-specific regions: the first worksheet contains the data, and the second worksheet contains a detailed description of the contents of the table and serves as a legend for the first worksheet. Additional data file <supplr sid="S5">5</supplr> is a table describing the properties of oligos found on the genotyping microarray: the first worksheet contains the data, and the second worksheet contains a detailed description of the contents of the table and serves as a legend for the first worksheet. Additional data file <supplr sid="S6">6</supplr> is a table of the microarray genotyping data for the 20 strains examined in this study (normalized average data and log2 ratio of normalized averages): the first worksheet contains the data, and the second worksheet contains a detailed description of the contents of the table and serves as a legend for the first worksheet. 
Additional data file <supplr sid="S7">7</supplr> contains the coordinates of regions in PA14 or PAO1 that are common to four sequenced <it>P. aeruginosa </it>strains (PA14, PAO1, and two CF isolates: 2192 and C3719) and therefore comprise a putative <it>P. aeruginosa </it>core genome: the first worksheet contains the data, and the second worksheet contains a detailed description of the contents of the table and serves as a legend for the first worksheet.</p>
         <suppl id="S1">
            <title>
               <p>Additional data file 1</p>
            </title>
            <caption>
               <p>Summary of supplementary methods</p>
            </caption>
            <text>
               <p>Summary of supplementary methods.</p>
            </text>
            <file name="gb-2006-7-10-r90-S1.doc">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S2">
            <title>
               <p>Additional data file 2</p>
            </title>
            <caption>
               <p>PA14 gene annotations</p>
            </caption>
            <text>
               <p>A table of PA14 gene annotations.</p>
            </text>
            <file name="gb-2006-7-10-r90-S2.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S3">
            <title>
               <p>Additional data file 3</p>
            </title>
            <caption>
               <p>The percentage of PA14 and PAO1 genes corresponding to each of 28 functional categories (shown for both the whole genome and strain-specific genes as described in Additional data file 4)</p>
            </caption>
            <text>
               <p>The percentage of PA14 and PAO1 genes corresponding to each of 28 functional categories (shown for both the whole genome and strain-specific genes as described in Additional data file 4).</p>
            </text>
            <file name="gb-2006-7-10-r90-S3.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S4">
            <title>
               <p>Additional data file 4</p>
            </title>
            <caption>
               <p>Summary of properties of PA14-specific and PAO1-specific regions</p>
            </caption>
            <text>
               <p>Summary of properties of PA14-specific and PAO1-specific regions.</p>
            </text>
            <file name="gb-2006-7-10-r90-S4.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S5">
            <title>
               <p>Additional data file 5</p>
            </title>
            <caption>
               <p>Properties of oligos found on the genotyping microarray</p>
            </caption>
            <text>
               <p>Properties of oligos found on the genotyping microarray.</p>
            </text>
            <file name="gb-2006-7-10-r90-S5.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S6">
            <title>
               <p>Additional data file 6</p>
            </title>
            <caption>
               <p>Microarray genotyping data for the 20 strains examined in this study (normalized average data and log2 ratio of normalized averages)</p>
            </caption>
            <text>
               <p>Microarray genotyping data for the 20 strains examined in this study (normalized average data and log2 ratio of normalized averages).</p>
            </text>
            <file name="gb-2006-7-10-r90-S6.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
         <suppl id="S7">
            <title>
               <p>Additional data file 7</p>
            </title>
            <caption>
               <p>Coordinates of regions in PA14 or PAO1 that are common to four sequenced <it>P. aeruginosa </it>strains (PA14, PAO1, and two CF isolates: 2192 and C3719) and therefore comprise a putative <it>P. aeruginosa </it>core genome</p>
            </caption>
            <text>
               <p>Coordinates of regions in PA14 or PAO1 that are common to four sequenced <it>P. aeruginosa </it>strains (PA14, PAO1, and two CF isolates: 2192 and C3719) and therefore comprise a putative <it>P. aeruginosa </it>core genome.</p>
            </text>
            <file name="gb-2006-7-10-r90-S7.xls">
               <p>Click here for file</p>
            </file>
         </suppl>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>DGL and FMA were responsible for strategic planning and managing the overall project. LL, GG, KM, and RK were responsible for overseeing the raw sequencing, finishing, and initial assembly of PA14. DGL, NTL, SM, JH, and MS contributed to the raw sequencing effort. DGL performed manual edits to the assembly and additional finishing reactions. JMU and GW developed bioinformatic tools to analyze the sequence data. JMU, GW, and DGL performed the bulk of the bioinformatic analyses. DGL, JMU, LTD, NTL, JH, ED, and LF contributed to the manual annotation of PA14 genes. DGL designed the oligonucleotide array, performed the microarray experiments, and DGL and JMU analyzed the microarray data. NTL and RF performed the <it>C. elegans </it>assays. DGL and FMA wrote the paper. All authors discussed the results and commented on the manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>We thank J Decker, W Brown, K Osborn, A Perera, R Elliott, and L Gendal for technical assistance during the sequencing of PA14; R Jackson for suggestions on genomic DNA preparations for microarray analysis; N El Massadi and J Frietas for suggestions on sample labelling, hybridizations, and scanning for microarray experiments; D Park for assistance with microarray data analysis; and E Mylonakis for discussions regarding the evolution of fungal pathogens. We especially acknowledge S Lory for encouragement and for many helpful discussions and suggestions. This work was funded by grants to FMA from the National Institutes of Health (Grant Numbers U01 HL66678 and R01 AI064332) and the Department of Energy (Grant Number DE-FG02-ER63445), a postdoctoral fellowship from the Jane Coffin Childs Memorial Fund for Medical Research to DGL, and by support from the Harvard-Partners Center for Genetics and Genomics.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Pathogenicity islands of virulent bacteria: structure, function and impact on microbial evolution.</p>
            </title>
            <aug>
               <au>
                  <snm>Hacker</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Blum-Oehler</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Muhldorfer</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Tschape</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>1997</pubdate>
            <volume>23</volume>
            <fpage>1089</fpage>
            <lpage>1097</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1046/j.1365-2958.1997.3101672.x</pubid>
                  <pubid idtype="pmpid">9106201</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>Impact of pathogenicity islands in bacterial diagnostics.</p>
            </title>
            <aug>
               <au>
                  <snm>Oelschlaeger</snm>
                  <fnm>TA</fnm>
               </au>
               <au>
                  <snm>Hacker</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Apmis</source>
            <pubdate>2004</pubdate>
            <volume>112</volume>
            <fpage>930</fpage>
            <lpage>936</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1600-0463.2004.apm11211-1214.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">15638844</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Comparative genomic structure of prokaryotes.</p>
            </title>
            <aug>
               <au>
                  <snm>Bentley</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Parkhill</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Annu Rev Genet</source>
            <pubdate>2004</pubdate>
            <volume>38</volume>
            <fpage>771</fpage>
            <lpage>792</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1146/annurev.genet.38.072902.094318</pubid>
                  <pubid idtype="pmpid" link="fulltext">15568993</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>The nature and dynamics of bacterial genomes.</p>
            </title>
            <aug>
               <au>
                  <snm>Ochman</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Davalos</snm>
                  <fnm>LM</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2006</pubdate>
            <volume>311</volume>
            <fpage>1730</fpage>
            <lpage>1733</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1119966</pubid>
                  <pubid idtype="pmpid" link="fulltext">16556833</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Chronic Pseudomonas aeruginosa lung infection in cystic fibrosis patients.</p>
            </title>
            <aug>
               <au>
                  <snm>Doring</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Pseudomonas aeruginosa as an opportunistic pathogen</source>
            <publisher>New York: Plenum Press</publisher>
            <pubdate>1993</pubdate>
            <fpage>245</fpage>
            <lpage>273</lpage>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Pseudomonas: the compromised host.</p>
            </title>
            <aug>
               <au>
                  <snm>Wood</snm>
                  <fnm>RE</fnm>
               </au>
            </aug>
            <source>Hosp Pract</source>
            <pubdate>1976</pubdate>
            <volume>11</volume>
            <fpage>91</fpage>
            <lpage>100</lpage>
            <xrefbib>
               <pubid idtype="pmpid">829230</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Complete genome sequence of <it>Pseudomonas aeruginosa</it> PAO1, an opportunistic pathogen.</p>
            </title>
            <aug>
               <au>
                  <snm>Stover</snm>
                  <fnm>CK</fnm>
               </au>
               <au>
                  <snm>Pham</snm>
                  <fnm>XQ</fnm>
               </au>
               <au>
                  <snm>Erwin</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Mizoguchi</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Warrener</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Hickey</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Brinkman</snm>
                  <fnm>FS</fnm>
               </au>
               <au>
                  <snm>Hufnagle</snm>
                  <fnm>WO</fnm>
               </au>
               <au>
                  <snm>Kowalik</snm>
                  <fnm>DJ</fnm>
               </au>
               <au>
                  <snm>Lagrou</snm>
                  <fnm>M</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nature</source>
            <pubdate>2000</pubdate>
            <volume>406</volume>
            <fpage>959</fpage>
            <lpage>964</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/35023079</pubid>
                  <pubid idtype="pmpid" link="fulltext">10984043</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Genome mosaicism is conserved but not unique in <it>Pseudomonas aeruginosa</it> isolates from the airways of young children with cystic fibrosis.</p>
            </title>
            <aug>
               <au>
                  <snm>Ernst</snm>
                  <fnm>RK</fnm>
               </au>
               <au>
                  <snm>D'Argenio</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Ichikawa</snm>
                  <fnm>JK</fnm>
               </au>
               <au>
                  <snm>Bangera</snm>
                  <fnm>MG</fnm>
               </au>
               <au>
                  <snm>Selgrade</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Burns</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Hiatt</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>McCoy</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Brittnacher</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kas</snm>
                  <fnm>A</fnm>
               </au>
               <etal/>
            </aug>
            <source>Environ Microbiol</source>
            <pubdate>2003</pubdate>
            <volume>5</volume>
            <fpage>1341</fpage>
            <lpage>1349</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1462-2920.2003.00518.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">14641578</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Conservation of genome content and virulence determinants among clinical and environmental isolates of <it>Pseudomonas aeruginosa</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Wolfgang</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Kulasekara</snm>
                  <fnm>BR</fnm>
               </au>
               <au>
                  <snm>Liang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Boyd</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Miyada</snm>
                  <fnm>CG</fnm>
               </au>
               <au>
                  <snm>Lory</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2003</pubdate>
            <volume>100</volume>
            <fpage>8484</fpage>
            <lpage>8489</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">166255</pubid>
                  <pubid idtype="pmpid" link="fulltext">12815109</pubid>
                  <pubid idtype="doi">10.1073/pnas.0832438100</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>Whole-genome sequence variation among multiple isolates of <it>Pseudomonas aeruginosa</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Spencer</snm>
                  <fnm>DH</fnm>
               </au>
               <au>
                  <snm>Kas</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>EE</fnm>
               </au>
               <au>
                  <snm>Raymond</snm>
                  <fnm>CK</fnm>
               </au>
               <au>
                  <snm>Sims</snm>
                  <fnm>EH</fnm>
               </au>
               <au>
                  <snm>Hastings</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Burns</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Kaul</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Olson</snm>
                  <fnm>MV</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2003</pubdate>
            <volume>185</volume>
            <fpage>1316</fpage>
            <lpage>1325</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">142842</pubid>
                  <pubid idtype="pmpid" link="fulltext">12562802</pubid>
                  <pubid idtype="doi">10.1128/JB.185.4.1316-1325.2003</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>Identification of virulence genes in a pathogenic strain of <it>Pseudomonas aeruginosa </it>by representational difference analysis.</p>
            </title>
            <aug>
               <au>
                  <snm>Choi</snm>
                  <fnm>JY</fnm>
               </au>
               <au>
                  <snm>Sifri</snm>
                  <fnm>CD</fnm>
               </au>
               <au>
                  <snm>Goumnerov</snm>
                  <fnm>BC</fnm>
               </au>
               <au>
                  <snm>Rahme</snm>
                  <fnm>LG</fnm>
               </au>
               <au>
                  <snm>Ausubel</snm>
                  <fnm>FM</fnm>
               </au>
               <au>
                  <snm>Calderwood</snm>
                  <fnm>SB</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2002</pubdate>
            <volume>184</volume>
            <fpage>952</fpage>
            <lpage>961</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">134824</pubid>
                  <pubid idtype="pmpid" link="fulltext">11807055</pubid>
                  <pubid idtype="doi">10.1128/jb.184.4.952-961.2002</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Common virulence factors for bacterial pathogenicity in plants and animals.</p>
            </title>
            <aug>
               <au>
                  <snm>Rahme</snm>
                  <fnm>LG</fnm>
               </au>
               <au>
                  <snm>Stevens</snm>
                  <fnm>EJ</fnm>
               </au>
               <au>
                  <snm>Wolfort</snm>
                  <fnm>SF</fnm>
               </au>
               <au>
                  <snm>Shao</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Tompkins</snm>
                  <fnm>RG</fnm>
               </au>
               <au>
                  <snm>Ausubel</snm>
                  <fnm>FM</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>1995</pubdate>
            <volume>268</volume>
            <fpage>1899</fpage>
            <lpage>1902</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.7604262</pubid>
                  <pubid idtype="pmpid" link="fulltext">7604262</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Killing of <it>Caenorhabditis elegans </it>by <it>Pseudomonas aeruginosa </it>used to model mammalian bacterial pathogenesis.</p>
            </title>
            <aug>
               <au>
                  <snm>Tan</snm>
                  <fnm>MW</fnm>
               </au>
               <au>
                  <snm>Mahajan-Miklos</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Ausubel</snm>
                  <fnm>FM</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1999</pubdate>
            <volume>96</volume>
            <fpage>715</fpage>
            <lpage>720</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">15202</pubid>
                  <pubid idtype="pmpid" link="fulltext">9892699</pubid>
                  <pubid idtype="doi">10.1073/pnas.96.2.715</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Positive correlation between virulence of <it>Pseudomonas aeruginosa </it>mutants in mice and insects.</p>
            </title>
            <aug>
               <au>
                  <snm>Jander</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Rahme</snm>
                  <fnm>LG</fnm>
               </au>
               <au>
                  <snm>Ausubel</snm>
                  <fnm>FM</fnm>
               </au>
            </aug>
            <source>J Bacteriol</source>
            <pubdate>2000</pubdate>
            <volume>182</volume>
            <fpage>3843</fpage>
            <lpage>3845</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">94559</pubid>
                  <pubid idtype="pmpid" link="fulltext">10851003</pubid>
                  <pubid idtype="doi">10.1128/JB.182.13.3843-3845.2000</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Molecular mechanisms of bacterial virulence elucidated using a <it>Pseudomonas aeruginosa-Caenorhabditis elegans </it>pathogenesis model.</p>
            </title>
            <aug>
               <au>
                  <snm>Mahajan-Miklos</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Tan</snm>
                  <fnm>MW</fnm>
               </au>
               <au>
                  <snm>Rahme</snm>
                  <fnm>LG</fnm>
               </au>
               <au>
                  <snm>Ausubel</snm>
                  <fnm>FM</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>1999</pubdate>
            <volume>96</volume>
            <fpage>47</fpage>
            <lpage>56</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0092-8674(00)80958-7</pubid>
                  <pubid idtype="pmpid" link="fulltext">9989496</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Use of the <it>Galleria mellonella </it>caterpillar as a model host to study the role of the type III secretion system in <it>Pseudomonas aeruginosa </it>pathogenesis.</p>
            </title>
            <aug>
               <au>
                  <snm>Miyata</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Casey</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Frank</snm>
                  <fnm>DW</fnm>
               </au>
               <au>
                  <snm>Ausubel</snm>
                  <fnm>FM</fnm>
               </au>
               <au>
                  <snm>Drenkard</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>Infect Immun</source>
            <pubdate>2003</pubdate>
            <volume>71</volume>
            <fpage>2404</fpage>
            <lpage>2413</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">153283</pubid>
                  <pubid idtype="pmpid" link="fulltext">12704110</pubid>
                  <pubid idtype="doi">10.1128/IAI.71.5.2404-2413.2003</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Use of model plant hosts to identify <it>Pseudomonas aeruginosa </it>virulence factors.</p>
            </title>
            <aug>
               <au>
                  <snm>Rahme</snm>
                  <fnm>LG</fnm>
               </au>
               <au>
                  <snm>Tan</snm>
                  <fnm>MW</fnm>
               </au>
               <au>
                  <snm>Le</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Wong</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Tompkins</snm>
                  <fnm>RG</fnm>
               </au>
               <au>
                  <snm>Calderwood</snm>
                  <fnm>SB</fnm>
               </au>
               <au>
                  <snm>Ausubel</snm>
                  <fnm>FM</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1997</pubdate>
            <volume>94</volume>
            <fpage>13245</fpage>
            <lpage>13250</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">24294</pubid>
                  <pubid idtype="pmpid" link="fulltext">9371831</pubid>
                  <pubid idtype="doi">10.1073/pnas.94.24.13245</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p><it>Pseudomonas aeruginosa </it>killing of <it>Caenorhabditis elegans </it>used to identify <it>P. aeruginosa </it>virulence factors.</p>
            </title>
            <aug>
               <au>
                  <snm>Tan</snm>
                  <fnm>MW</fnm>
               </au>
               <au>
                  <snm>Rahme</snm>
                  <fnm>LG</fnm>
               </au>
               <au>
                  <snm>Sternberg</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Tompkins</snm>
                  <fnm>RG</fnm>
               </au>
               <au>
                  <snm>Ausubel</snm>
                  <fnm>FM</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1999</pubdate>
            <volume>96</volume>
            <fpage>2408</fpage>
            <lpage>2413</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">26797</pubid>
                  <pubid idtype="pmpid" link="fulltext">10051655</pubid>
                  <pubid idtype="doi">10.1073/pnas.96.5.2408</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>The broad host range pathogen <it>Pseudomonas aeruginosa </it>strain PA14 carries two pathogenicity islands harboring plant and animal virulence genes.</p>
            </title>
            <aug>
               <au>
                  <snm>He</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Baldini</snm>
                  <fnm>RL</fnm>
               </au>
               <au>
                  <snm>Deziel</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Saucier</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Liberati</snm>
                  <fnm>NT</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Urbach</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Goodman</snm>
                  <fnm>HM</fnm>
               </au>
               <au>
                  <snm>Rahme</snm>
                  <fnm>LG</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2004</pubdate>
            <volume>101</volume>
            <fpage>2530</fpage>
            <lpage>2535</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">356984</pubid>
                  <pubid idtype="pmpid" link="fulltext">14983043</pubid>
                  <pubid idtype="doi">10.1073/pnas.0304622101</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>PA14 Gene Annotations</p>
            </title>
            <url>http://ausubellab.mgh.harvard.edu/cgi-bin/pa14/annotation/start.cgi</url>
         </bibl>
         <bibl id="B21">
            <title>
               <p>A minimal tiling path cosmid library for functional analysis of the <it>Pseudomonas aeruginosa </it>PAO1 genome.</p>
            </title>
            <aug>
               <au>
                  <snm>Huang</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Whitchurch</snm>
                  <fnm>CB</fnm>
               </au>
               <au>
                  <snm>Croft</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Beatson</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Mattick</snm>
                  <fnm>JS</fnm>
               </au>
            </aug>
            <source>Microb Comp Genomics</source>
            <pubdate>2000</pubdate>
            <volume>5</volume>
            <fpage>189</fpage>
            <lpage>203</lpage>
            <xrefbib>
               <pubid idtype="pmpid">11471833</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Pseudomonas Genome Project and PseudoCAP</p>
            </title>
            <url>http://www.pseudomonas.com/</url>
         </bibl>
         <bibl id="B23">
            <title>
               <p>Improved analytical methods for microarray-based genome-composition analysis.</p>
            </title>
            <aug>
               <au>
                  <snm>Kim</snm>
                  <fnm>CC</fnm>
               </au>
               <au>
                  <snm>Joyce</snm>
                  <fnm>EA</fnm>
               </au>
               <au>
                  <snm>Chan</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Falkow</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Genome Biol</source>
            <pubdate>2002</pubdate>
            <volume>3</volume>
            <fpage>RESEARCH0065</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">133449</pubid>
                  <pubid idtype="pmpid" link="fulltext">12429064</pubid>
                  <pubid idtype="doi">10.1186/gb-2002-3-11-research0065</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>PA14 Transposon Insertion Mutant Library</p>
            </title>
            <url>http://ausubellab.mgh.harvard.edu/cgi-bin/pa14/home.cgi</url>
         </bibl>
         <bibl id="B25">
            <title>
               <p>An ordered, nonredundant library of <it>Pseudomonas aeruginosa </it>strain PA14 transposon insertion mutants.</p>
            </title>
            <aug>
               <au>
                  <snm>Liberati</snm>
                  <fnm>NT</fnm>
               </au>
               <au>
                  <snm>Urbach</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Miyata</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Drenkard</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Villanueva</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wei</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Ausubel</snm>
                  <fnm>FM</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2006</pubdate>
            <volume>103</volume>
            <fpage>2833</fpage>
            <lpage>2838</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1413827</pubid>
                  <pubid idtype="pmpid" link="fulltext">16477005</pubid>
                  <pubid idtype="doi">10.1073/pnas.0511100103</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Worldwide distribution of <it>Pseudomonas aeruginosa </it>clone C strains in the aquatic environment and cystic fibrosis patients.</p>
            </title>
            <aug>
               <au>
                  <snm>Romling</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Kader</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Sriramulu</snm>
                  <fnm>DD</fnm>
               </au>
               <au>
                  <snm>Simm</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Kronvall</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Environ Microbiol</source>
            <pubdate>2005</pubdate>
            <volume>7</volume>
            <fpage>1029</fpage>
            <lpage>1038</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1462-2920.2005.00780.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">15946300</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>ExoU is a potent intracellular phospholipase.</p>
            </title>
            <aug>
               <au>
                  <snm>Sato</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Frank</snm>
                  <fnm>DW</fnm>
               </au>
            </aug>
            <source>Mol Microbiol</source>
            <pubdate>2004</pubdate>
            <volume>53</volume>
            <fpage>1279</fpage>
            <lpage>1290</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1365-2958.2004.04194.x</pubid>
                  <pubid idtype="pmpid" link="fulltext">15387809</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>The human pathogen <it>Pseudomonas aeruginosa </it>utilizes conserved virulence pathways to infect the social amoeba <it>Dictyostelium discoideum</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Pukatzki</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Kessin</snm>
                  <fnm>RH</fnm>
               </au>
               <au>
                  <snm>Mekalanos</snm>
                  <fnm>JJ</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2002</pubdate>
            <volume>99</volume>
            <fpage>3159</fpage>
            <lpage>3164</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">122489</pubid>
                  <pubid idtype="pmpid" link="fulltext">11867744</pubid>
                  <pubid idtype="doi">10.1073/pnas.052704399</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>'Ready made' virulence and 'dual use' virulence factors in pathogenic environmental fungi: the <it>Cryptococcus neoformans </it>paradigm.</p>
            </title>
            <aug>
               <au>
                  <snm>Casadevall</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Steenbergen</snm>
                  <fnm>JN</fnm>
               </au>
               <au>
                  <snm>Nosanchuk</snm>
                  <fnm>JD</fnm>
               </au>
            </aug>
            <source>Curr Opin Microbiol</source>
            <pubdate>2003</pubdate>
            <volume>6</volume>
            <fpage>332</fpage>
            <lpage>337</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S1369-5274(03)00082-1</pubid>
                  <pubid idtype="pmpid" link="fulltext">12941400</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Does amoeboid reasoning explain the evolution and maintenance of virulence factors in <it>Cryptococc