<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>gb-2008-9-12-r183</ui>
   <ji>GBJ</ji>
   <fm>
      <dochead>Research</dochead>
      <bibl>
         <title>
            <p>Comparative genomics of mutualistic viruses of <it>Glyptapanteles </it>parasitic wasps</p>
         </title>
         <aug>
            <au id="A1" ca="yes">
               <snm>Desjardins</snm>
               <mi>A</mi>
               <fnm>Christopher</fnm>
               <insr iid="I1"/>
               <insr iid="I6"/>
               <email>cdesjar3@mail.rochester.edu</email>
            </au>
            <au id="A2">
               <snm>Gundersen-Rindal</snm>
               <mi>E</mi>
               <fnm>Dawn</fnm>
               <insr iid="I2"/>
               <email>dawn.gundersen-rindal@ars.usda.gov</email>
            </au>
            <au id="A3">
               <snm>Hostetler</snm>
               <mi>B</mi>
               <fnm>Jessica</fnm>
               <insr iid="I1"/>
               <email>jessicah@jcvi.org</email>
            </au>
            <au id="A4">
               <snm>Tallon</snm>
               <mi>J</mi>
               <fnm>Luke</fnm>
               <insr iid="I1"/>
               <insr iid="I7"/>
               <email>ljtallon@som.umaryland.edu</email>
            </au>
            <au id="A5">
               <snm>Fadrosh</snm>
               <mi>W</mi>
               <fnm>Douglas</fnm>
               <insr iid="I1"/>
               <insr iid="I8"/>
               <email>dfadrosh@jcvi.org</email>
            </au>
            <au id="A6">
               <snm>Fuester</snm>
               <mi>W</mi>
               <fnm>Roger</fnm>
               <insr iid="I3"/>
               <email>roger.fuester@ars.usda.gov</email>
            </au>
            <au id="A7">
               <snm>Pedroni</snm>
               <mi>J</mi>
               <fnm>Monica</fnm>
               <insr iid="I2"/>
               <insr iid="I9"/>
               <email>mpedroni@vetmed.wsu.edu</email>
            </au>
            <au id="A8">
               <snm>Haas</snm>
               <mi>J</mi>
               <fnm>Brian</fnm>
               <insr iid="I1"/>
               <insr iid="I10"/>
               <email>bhaas@broad.mit.edu</email>
            </au>
            <au id="A9">
               <snm>Schatz</snm>
               <mi>C</mi>
               <fnm>Michael</fnm>
               <insr iid="I4"/>
               <email>mschatz@umiacs.umd.edu</email>
            </au>
            <au id="A10">
               <snm>Jones</snm>
               <mi>M</mi>
               <fnm>Kristine</fnm>
               <insr iid="I1"/>
               <insr iid="I7"/>
               <email>kjones@som.umaryland.edu</email>
            </au>
            <au id="A11">
               <snm>Crabtree</snm>
               <fnm>Jonathan</fnm>
               <insr iid="I1"/>
               <insr iid="I7"/>
               <email>crabtree@jcvi.org</email>
            </au>
            <au id="A12">
               <snm>Forberger</snm>
               <fnm>Heather</fnm>
               <insr iid="I1"/>
               <email>hcarty@jcvi.org</email>
            </au>
            <au id="A13">
               <snm>Nene</snm>
               <fnm>Vishvanath</fnm>
               <insr iid="I1"/>
               <insr iid="I5"/>
               <email>vnene@som.umaryland.edu</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>J Craig Venter Institute, Rockville, MD 20850, USA</p>
            </ins>
            <ins id="I2">
               <p>USDA-ARS Invasive Insect Biocontrol and Behavior Laboratory, Beltsville, MD 20705, USA</p>
            </ins>
            <ins id="I3">
               <p>USDA-ARS Beneficial Insect Introduction Research Laboratory, Newark, DE 19713, USA</p>
            </ins>
            <ins id="I4">
               <p>Center for Bioinformatics and Computational Biology, University of Maryland, College Park, MD 20742, USA</p>
            </ins>
            <ins id="I5">
               <p>Institute for Genome Sciences and Department of Microbiology and Immunology, University of Maryland School of Medicine, Baltimore, MD 21201, USA</p>
            </ins>
            <ins id="I6">
               <p>Current address: Department of Biology, University of Rochester, Rochester, NY 14627, USA</p>
            </ins>
            <ins id="I7">
               <p>Current address: Institute for Genome Sciences, University of Maryland School of Medicine, Baltimore, MD 21201, USA</p>
            </ins>
            <ins id="I8">
               <p>Current address: J Craig Venter Institute, La Jolla, CA 92121, USA</p>
            </ins>
            <ins id="I9">
               <p>Current address: Department of Veterinary Microbiology and Pathology, Washington State University, WA 99164, USA</p>
            </ins>
            <ins id="I10">
               <p>Current address: The Broad Institute, Cambridge, MA 02142, USA</p>
            </ins>
         </insg>
         <source>Genome Biology</source>
         <issn>1465-6906</issn>
         <pubdate>2008</pubdate>
         <volume>9</volume>
         <issue>12</issue>
         <fpage>R183</fpage>
         <url>http://genomebiology.com/2008/9/12/R183</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">19116010</pubid>
               <pubid idtype="doi">10.1186/gb-2008-9-12-r183</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>14</day>
               <month>7</month>
               <year>2008</year>
            </date>
         </rec>
         <acc>
            <date>
               <day>30</day>
               <month>12</month>
               <year>2008</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>30</day>
               <month>12</month>
               <year>2008</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2008</year>
         <collab>Desjardins et al.; licensee BioMed Central Ltd.</collab>
         <note>This is an open access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <shorttitle>
         <p>Glyptapanteles polydnavirus genome sequences</p>
      </shorttitle>
      <shortabs>
         <p>Comparative genome analysis of two endosymbiotic polydnaviruses from Glyptapanteles parasitic wasps reveals new insights into the evolutionary arms race between host and parasite.</p>
      </shortabs>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>Polydnaviruses, double-stranded DNA viruses with segmented genomes, have evolved as obligate endosymbionts of parasitoid wasps. Virus particles are replication deficient and produced by female wasps from proviral sequences integrated into the wasp genome. These particles are co-injected with eggs into caterpillar hosts, where viral gene expression facilitates parasitoid survival and, thereby, survival of proviral DNA. Here we characterize and compare the encapsidated viral genome sequences of bracoviruses in the family Polydnaviridae associated with <it>Glyptapanteles </it>gypsy moth parasitoids, along with near complete proviral sequences from which both viral genomes are derived.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>The encapsidated <it>Glyptapanteles indiensis </it>and <it>Glyptapanteles flavicoxis </it>bracoviral genomes, each composed of 29 different size segments, total approximately 517 and 594 kbp, respectively. They are generated from a minimum of seven distinct loci in the wasp genome. Annotation of these sequences revealed numerous novel features for polydnaviruses, including insect-like sugar transporter genes and transposable elements. Evolutionary analyses suggest that positive selection is widespread among bracoviral genes.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusions</p>
               </st>
               <p>The structure and organization of <it>G. indiensis </it>and <it>G. flavicoxis </it>bracovirus proviral segments as multiple loci containing one to many viral segments, flanked and separated by wasp gene-encoding DNA, is confirmed. Rapid evolution of bracovirus genes supports the hypothesis of bracovirus genes in an 'arms race' between bracovirus and caterpillar. Phylogenetic analyses of the bracoviral genes encoding sugar transporters provides the first robust evidence of a wasp origin for some polydnavirus genes. We hypothesize transposable elements, such as those described here, could facilitate transfer of genes between proviral segments and host DNA.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <meta>
      <classifications>
         <classification type="BMC" subtype="man_spc_id" id="30010008">Evolution</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010010">Genome studies</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010014">Microbiology and parasitology</classification>
         <classification type="BMC" subtype="man_spc_id" id="30010020">Virology</classification>
      </classifications>
   </meta>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>The capacity to sequence and analyze complex genomes has enabled rapid progress toward understanding atypical biological systems, such as the obligate mutualistic association of polydnaviruses (PDVs) with certain parasitic wasps <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. PDVs have evolved a distinctive life strategy as they exist in two distinct forms, as a proviral form integrated into the genome of male and female parasitoids <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr></abbrgrp>, and in a virus form that is replication deficient. PDV encapsidated genomes are unlike any other viral genomes as they consist of multiple circular double-stranded DNA molecules, referred to as segments. Proviral DNA is amplified from the parasitoid genome, followed by excision, circularization, and encapsidation of segments into virus particles, and occurs only within female ovarian calyx epithelial cells <abbrgrp><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr><abbr bid="B6">6</abbr></abbrgrp>. PDVs are also distinctive in that they require two separate hosts to maintain their life cycle. PDV virions are released into the oviduct lumen with no obvious pathology to the primary host. During oviposition, virions, wasp eggs and other parasitism-associated factors are delivered into a secondary host, usually a lepidopteran, where PDV gene expression disrupts immune functions, physiology, and development <abbrgrp><abbr bid="B7">7</abbr><abbr bid="B8">8</abbr><abbr bid="B9">9</abbr></abbrgrp>. Virion-induced pathology within the secondary host ensures survival of the PDV proviral form within the parasitoid life cycle.</p>
         <p>Genome sequencing and analyses undertaken to elucidate the genetic complement of PDVs relating to their unusual biology have focused mainly on encapsidated viral genomes as isolated from female parasitoid reproductive tracts. Comprehensive genome studies have been conducted for representative members of the two genera of PDVs, bracoviruses (BVs) and ichnoviruses (IVs), described as obligate endosymbionts of braconid and ichneumonid parasitoids, respectively. Braconid parasitoids harboring BVs are monophyletic and comprise the microgastroid complex of seven subfamilies (Cheloninae, Dirrhoponae, Mendesellinae, Khoikhoiinae, Cardiochilinae, Miracinae and Microgastrinae) with greater than 17,500 species <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>. BV genomes sequenced to date are exclusive to subfamily Microgastrinae, <it>Cotesia congregata </it>BV (CcBV) <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>, and <it>Microplitis demolitor </it>BV (MdBV) <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>; IV genomes sequenced include members from the ichneumonid subfamily Campopleginae, <it>Campolitis sonorensis </it>IV (CsIV) <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>, <it>Hyposoter fugitivus </it>IV and <it>Tranosema rostrale </it>IV <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>, and from subfamily Banchinae, <it>Glypta fumiferanae </it>IV <abbrgrp><abbr bid="B14">14</abbr></abbrgrp>. General characteristics that differ in sequenced encapsidated BV and IV viral genomes include segment number, size and abundance, while similar characteristics include a low gene coding density, multiple intron-containing protein coding genes and the presence of multi-gene families <abbrgrp><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr></abbrgrp>.</p>
         <p>Conventional concepts in virology do not adequately describe the viral and proviral forms of PDV genomes. Encapsidated PDV genomes sequenced to date lack known viral structural proteins and DNA replication-associated enzymes, and there is evidence that in CsIV, a gene coding for one structural protein is not encoded by the encapsidated genome <abbrgrp><abbr bid="B17">17</abbr></abbrgrp>. It has been hypothesized that PDVs have a viral ancestry and have undergone reductive genome evolution, where replication and coat protein genes have been transferred to other regions of the wasp genome <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>. Although PDVs are classified as viruses <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>, a contrasting hypothesis is that PDVs have evolved from genetic elements that have captured parasitoid genes and a virion production system <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>. Here, we use the term viral genome to represent segment sequences encapsidated in virus particles and proviral segment to represent the linear integrated form of a circular viral genome segment. We conservatively describe the proviral genome to encompass all proviral segments and their excision motifs.</p>
         <p>PDV viral genome sequences have advanced our understanding of PDV-mediated pathology in parasitism and have begun to unravel evolutionary relationships of this unusual group of viruses. However, very little is known about the composition and sequence of PDV proviral genomes beyond the prediction of proviral segment sequences. Early studies based on CsIV showed that several proviral segments were flanked by genomic DNA that was not encapsidated, suggesting CsIV proviral segment sequences are dispersed in the wasp genome <abbrgrp><abbr bid="B20">20</abbr><abbr bid="B21">21</abbr><abbr bid="B22">22</abbr></abbrgrp>. In contrast, BV proviral segment sequences are thought to be located at a single locus in a tandem array <abbrgrp><abbr bid="B23">23</abbr><abbr bid="B24">24</abbr><abbr bid="B25">25</abbr></abbrgrp>. This hypothesis is based on both <it>in situ </it>hybridization evidence where probes from 3 of 30 different CcBV viral segments hybridized to the same region of a single wasp chromosome <abbrgrp><abbr bid="B25">25</abbr></abbrgrp> and studies of CcBV and <it>Chelonus inanitus </it>BV (CiBV) in which proviral segments were flanked on one or both sides by a different proviral segment <abbrgrp><abbr bid="B23">23</abbr><abbr bid="B24">24</abbr></abbrgrp>. A direct DNA sequence repeat was seen at the boundaries of the few proviral segments examined <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>, and it appears to mark the site of proviral segment excision, possibly via conservative site-specific recombination, as a single copy of the repeat was noted within the corresponding circularized viral segment <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>. A working model for BV viral segment production is that they are derived from a large precursor molecule encompassing multiple proviral segments, which is amplified after excision of the precursor from the wasp chromosome <abbrgrp><abbr bid="B26">26</abbr><abbr bid="B27">27</abbr></abbrgrp>. Studies of CcBV and CiBV show that there is no replication of mature viral segments <abbrgrp><abbr bid="B23">23</abbr><abbr bid="B26">26</abbr><abbr bid="B27">27</abbr><abbr bid="B28">28</abbr></abbrgrp>.</p>
         <p>Recently, we presented a global examination and description of proviral segment sequences of a BV associated with <it>Glyptapanteles indiensis </it>(GiBV) <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>, a parasitoid of gypsy moth. In contrast to earlier concepts, our data showed that some but not all of approximately 24 GiBV proviral segment sequences are tandemly arrayed. We provided the first detailed analysis of a major part of a PDV proviral genome, a 223 kbp locus labeled proviral locus 1, which encodes a tandem array of 8 GiBV proviral segments separated by inter-segmental regions that varies in length from 117 to 8,369 bp <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. We also proposed that it was reasonable to consider inter-segmental DNA separating tandemly arrayed proviral segments as components of the proviral genome. Structural and compositional analyses revealed that this array of proviral segments was flanked by 6-7 kbp sequence repeats and that proviral segment sequences had a distinct nucleotide composition from inter-segmental and flanking non-segment DNA. Comparative sequence analysis revealed conserved motifs at the sites of excision of segments from proviral DNA, which suggested that there is directionality to the mechanism of segment excision, a conclusion also supported in CiBV <abbrgrp><abbr bid="B29">29</abbr></abbrgrp>. The motifs we identified are also found in other BV genomes, suggesting a highly conserved mechanism of BV proviral segment excision. Analyses of DNA polymorphisms in the eight GiBV viral segment sequences gave evidence for selection acting on both protein-coding and non-coding DNA, indicating non-coding segmental DNA may serve functional purposes <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>.</p>
         <p>Building on our previous work, we have expanded the knowledge of the BV proviral form through detailed analysis of an additional five loci encoding GiBV proviral segments. Here we revise our estimate of the GiBV viral segment number to 29, encoded by a minimum of 7 proviral loci, providing a nearly complete description of the GiBV viral genome. In addition, we provide equally extensive data showing similar characteristics of proviral segment sequences of GfBV, a BV associated with another wasp in the same genus as GiBV, <it>G. flavicoxis</it>. Comparative analyses reveal a high degree of synteny between loci that code for GiBV and GfBV proviral segments as well as flanking DNA. Not all loci are flanked by sequence repeat elements, but segment excision motifs have been conserved. Proviral segment sequences exhibit clear differences in their nucleotide composition relative to flanking DNA. GiBV and GfBV genes appear to be evolving rapidly, and GiBV and GfBV contain a novel multi-gene family that codes for sugar transporter proteins. We also identify a recent insertion of a transposable element (TE) within a population of GiBV and more ancient TEs associated with BV genomes. This work represents the most comprehensive characterization of PDV proviral genomes and of the structural organization of proviral segments to date.</p>
      </sec>
      <sec>
         <st>
            <p>Results and discussion</p>
         </st>
         <sec>
            <st>
               <p>Sequence characterization of GiBV and GfBV viral genomes</p>
            </st>
            <p>In an early study, field inversion gel analysis of the GiBV viral genome estimated the presence of 13 segments and a cumulative viral genome size of approximately 250 kbp <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>. At the start of our project the viral genome characteristics of GfBV were unknown, but presumed to be similar to those of GiBV. We undertook a whole genome shotgun (WGS) sequencing approach to sequence the GiBV and GfBV viral genomes. Viral DNA was sequenced to approximately 8&#215; coverage using purified virions pooled from the calyx fluid of approximately 400 and 50 female wasps from <it>G. indiensis </it>and <it>G. flavicoxis</it>, respectively (see Materials and methods). Following a manual effort to close sequence and physical gaps, we were able to derive a complete consensus viral segment sequence for 21 GiBV viral segments (8 of which were described previously <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>); 4 segments (numbers 17, 19, 21 and 29) remained as partial sequences (Figure <figr fid="F1">1</figr>) due to technical difficulties primarily associated with sequence repeats. GiBV viral segment 25 corresponded to the GiBV genome 'segment F' previously sequenced and characterized in detail <abbrgrp><abbr bid="B31">31</abbr><abbr bid="B32">32</abbr></abbrgrp>. For GfBV, we were able to complete sequence analysis of 27 viral segments and 1 (number 13) remained a partial sequence (Figure <figr fid="F1">1</figr>). Nucleotide sequence polymorphisms occurred more frequently in GiBV than in GfBV, and we presume the higher sequence success rate for GfBV was due to sampling a more homogeneous viral population relative to GiBV. The discrepancy in GiBV viral genome statistics with earlier estimates <abbrgrp><abbr bid="B30">30</abbr></abbrgrp> is due to finding multiple GiBV viral segments of similar size, which would have co-migrated on the agarose gel. The 25 GiBV and 28 GfBV viral segment sequences totaled 489 kbp and 581 kbp, respectively. These aggregate genome sizes and viral segment numbers have been further revised based on proviral sequence data (described below). Individual WGS sequence reads were deposited in the NCBI Trace Archive [1643848625-1643870960, 1813616562-1813617310]. Consensus sequence for viral segments, which ranged in length from 9.7 to 39.0 kbp for GiBV and 3.8 to 50.7 kbp for GfBV have been deposited in GenBank [GenBank:<ext-link ext-link-type="gen" ext-link-id="EU001243">EU001243</ext-link>-<ext-link ext-link-type="gen" ext-link-id="EU001285">EU001285</ext-link>].</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Summary of GiBV and GfBV sequence data</p>
               </caption>
               <text>
                  <p><b>Summary of GiBV and GfBV sequence data</b>. Homologous viral segments between GiBV and GfBV are depicted in the same row and have been assigned the same number; blank spaces represent the absence of a homologous segment in one of the genomes. To the right, columns indicate the locus containing the segment and whether the segment is complete (C), partial (P), or absent (-) in the viral and proviral sequences from each genome. Incomplete sequence indicators (&lt;>) are shown only for segments for which both viral and proviral sequence are absent or incomplete.</p>
               </text>
               <graphic file="gb-2008-9-12-r183-1"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>Sequence characterization of loci encoding GiBV and GfBV proviral segments</p>
            </st>
            <p>We previously reported that a radioactive probe from total GiBV viral DNA hybridized at varying intensity to 127 clones from a bacterial artificial chromosome (BAC) library of 9,216 clones derived from <it>G. indiensis </it>larvae; 17 GiBV viral segment sequences for which probes were available mapped to BAC clones that segregated into 7 distinct non-overlapping groups <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. A similar size BAC library from <it>G. flavicoxis </it>yielded 154 clones that hybridized with total GfBV viral DNA. A combination of BAC end sequencing of 60 BACs and 10 GfBV segment-specific PCRs also segregated these BAC clones into 7 groups. GiBV and GfBV proviral segment sequences not present in the selected BAC clones were isolated by rescreening the arrayed BAC libraries with radioactive viral segment-specific PCR products. Probes for GiBV viral segment number 29 and 30 and GfBV viral segment number 29 and 31 did not hybridize to any BAC clones, while hybridizations of a probe for GiBV segment 28 proved to be false positives. The former may be due to representational bias in the BAC libraries that were screened.</p>
            <p>A total of 11 BAC clones from <it>G. indiensis </it>(2 BAC clones were from a prior study <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>) and 9 BAC clones from <it>G. flavicoxis </it>have been sequenced. Clone selection was based on a combination of proviral segment sequence composition, BAC fingerprinting, and BAC end sequencing to try to ensure that the BAC clones chosen for sequencing contained the greatest possible coverage of proviral segment sequences. The <it>G. indiensis </it>and <it>G</it>. <it>flavicoxis </it>BAC sequence data totaled 1.21 and 1.16 Mbp, respectively. The location of proviral segments within the BAC clones was determined by sequence alignment of viral segment sequences, as well as by searching for individual segment excision motifs (see below). Overlapping BAC sequences were fused, if possible within an inter-segmental region, to create pseudo-molecule sequences reducing unique sequence data for <it>G. indiensis </it>and <it>G. flavicoxis </it>to 1.08 Mbp and 1.00 Mbp, respectively. The length of contiguous sequences ranged in size from 48.8 to 233.6 kbp for <it>G. indiensis </it>and 91.7 to 279.3 kbp for <it>G. flavicoxis</it>. Sequences were annotated as described in Materials and methods. These data have been deposited in GenBank [GenBank:<ext-link ext-link-type="gen" ext-link-id="EF710644">EF710644</ext-link>-<ext-link ext-link-type="gen" ext-link-id="EF710659">EF710659</ext-link>; <ext-link ext-link-type="gen" ext-link-id="AC191960">AC191960</ext-link>] was previously submitted <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Identification of novel GiBV and GfBV viral segments</p>
            </st>
            <p>Previously, using MEME <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>, we discovered a highly conserved 6 bp DNA sequence embedded within an approximately 60 bp motif that appears to function as the site of excision and circularization of 8 GiBV proviral segment sequences <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. The analysis of such motifs was expanded to encompass all available viral and proviral sequence data for GiBV and GfBV. Viral, 5' proviral and 3' proviral excision motifs are shown in Figure <figr fid="F2">2</figr>. There are some differences, primarily outside the hexamer repeat, between the new consensus excision motifs for GiBV and those described previously <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. Additionally, the GfBV excision motif is highly similar to that of GiBV. As we demonstrated before for GiBV, differences between the extended sequence motifs at each end of a GfBV proviral segment indicate there is directionality to the mechanism of segment excision from the site of integration.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Nucleotide conservation extends around the proviral segment excision site</p>
               </caption>
               <text>
                  <p><b>Nucleotide conservation extends around the proviral segment excision site</b>. Viral, 5' proviral, and 3' proviral motifs are shown for the GiBV and GfBV genomes, with the excision site highlighted. For each proviral motif, underlined sequence represents non-encapsidated sequence while unmarked sequence represents proviral segment sequence. Following excision, DNA is circularized at the excision site forming the viral motif.</p>
               </text>
               <graphic file="gb-2008-9-12-r183-2"/>
            </fig>
            <p>Using the extended motifs and MAST <abbrgrp><abbr bid="B34">34</abbr></abbrgrp> we searched BAC sequences in order to detect the boundaries of proviral segment sequences for which we had partial viral segment sequence data, and we extended this search to all BACs. In addition to detecting some of the missing viral segment sequences, MAST predicted the presence of four novel proviral segments for GiBV (numbers 9, 12, 16 and 18) and one (number 8) for GfBV (Figure <figr fid="F1">1</figr>). All these potential proviral segments had exact sequence matches to unassembled sequences in the viral WGS sequence data. Sequence coverage in all cases was below one-fold and viral segment sequence versions of the novel proviral segments could not be assembled from the WGS sequence data alone. To determine whether these sequences represented potential false positives, we searched all inter-segmental and flanking non-segmental regions against the unassembled viral WGS sequence data and found no evidence for them in the WGS data. Thus, a combination of the viral and proviral sequence data predicts that GiBV and GfBV viral genomes each contain 29 segments, although 3 GiBV and 1 GfBV viral segments remain partially sequenced (Figure <figr fid="F1">1</figr>).</p>
         </sec>
         <sec>
            <st>
               <p>Loci encoding GiBV and GfBV proviral segments exhibit a high degree of synteny</p>
            </st>
            <p>Based on GiBV and GfBV proviral segment location and conservation of gene order and sequence similarity within proviral segments, 27 of the 29 proviral segments were classified into pairs of segment homologs (Figures <figr fid="F1">1</figr> and <figr fid="F3">3</figr>). Each member of a segment pair was assigned the same number. Segments 16 and 30 appear to be unique to GiBV, while segments 27 and 31 appear to be unique to GfBV (Figure <figr fid="F1">1</figr>). In addition to synteny between GiBV and GfBV proviral segments, there is clear evidence for conservation of gene order and identity of genes in wasp DNA flanking proviral segment sequences (Figure <figr fid="F3">3</figr>). These data depict the near entirety of the GiBV and GfBV proviral segments; loci encoding three GiBV and three GfBV proviral segments remain to be identified (Figure <figr fid="F1">1</figr>).</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Structural organization and synteny of proviral segments of GfBV and GiBV</p>
               </caption>
               <text>
                  <p><b>Structural organization and synteny of proviral segments of GfBV and GiBV</b>. Detailed diagrams of proviral loci for GfBV and GiBV are depicted. For each, the corresponding segment number of the encapsidated viral segment is given for each segment, with the > or &lt; symbol depicting the directionality of segment excision. Black boxes represent long tandem repeats, and three repeat classes are listed as A, B, and C. Regions of synteny between proviral segment and flanking DNA are shaded in gray. Strand-specific protein coding genes within proviral segments are depicted by green boxes, while genes encoded in flanking DNA at each locus are depicted by purple boxes. The length for each locus is shown in kbp.</p>
               </text>
               <graphic file="gb-2008-9-12-r183-3"/>
            </fig>
            <p>The largest region encoding proviral DNA in both species is represented by two linked proviral loci, 1 and 2. GiBV proviral locus 1 <abbrgrp><abbr bid="B15">15</abbr></abbrgrp> and GfBV locus 1 consist of 8 proviral segments each, while GiBV and GfBV proviral locus 2 consists of 12 and 13 proviral segments, respectively (Table <tblr tid="T1">1</tblr>). Although the BAC clones we sequenced did not overlap at these loci, consideration of synteny suggests that they are linked (Figure <figr fid="F3">3</figr>). Synthetic oligonucleotide primers were designed near the ends of GiBV proviral segment 17 and 18 to close the existing gap between BAC clones within GiBV locus 2. However, PCR analysis of pupal stage <it>G. indiensis </it>parasitoid DNA failed, possibly due the large size of the estimated gap of approximately 20 kbp. Additional primers were designed based on an inter-segmental parasitoid sodium:neurotransmitter symporter gene present in the homologous GfBV region (Figure <figr fid="F3">3</figr>), which were then used in appropriate combination with GiBV proviral segment 17 and 18 primers. An amplicon of approximately 3 kbp (symporter to GiBV proviral segment 18) was obtained and end-sequenced (data not shown), verifying the predicted linkage. We were not able to link the large gap from GiBV proviral segment 17 to the symporter, but the data strongly support linkage of GiBV proviral segment 17 and 18 as occurs in GfBV. Synthetic oligonucleotides designed to either side of the gap separating GiBV proviral locus 1 amplified an approximately 5 kbp product and end-sequence data verified physical linkage of the two loci (data not shown). The strong syntenic relationships between GiBV and GfBV proviral genomes argue for the correct assembly and representation of GiBV proviral locus 2 and its linkage to proviral locus 1 (Figure <figr fid="F3">3</figr>).</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Summary features of loci comprising proviral segments of GiBV and GfBV</p>
               </caption>
               <tblbdy cols="13">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="12" ca="center">
                        <p>Feature</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="12">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Number of proviral segments</p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Total length (inter-segmental length) in kbp*</p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Number of predicted genes</p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>% with signal peptides</p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Median number of exons/gene</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Locus</p>
                     </c>
                     <c ca="center">
                        <p>Gi</p>
                     </c>
                     <c ca="center">
                        <p>Gf</p>
                     </c>
                     <c ca="center">
                        <p>Gi</p>
                     </c>
                     <c ca="center">
                        <p>Gf</p>
                     </c>
                     <c ca="center">
                        <p>Gi</p>
                     </c>
                     <c ca="center">
                        <p>Gf</p>
                     </c>
                     <c ca="center">
                        <p>Gi</p>
                     </c>
                     <c ca="center">
                        <p>Gf</p>
                     </c>
                     <c ca="center">
                        <p>Gi</p>
                     </c>
                     <c ca="center">
                        <p>Gf</p>
                     </c>
                     <c ca="center">
                        <p>PTPs</p>
                     </c>
                     <c ca="center">
                        <p>anks</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="13">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>163 (11.7)</p>
                     </c>
                     <c ca="center">
                        <p>202 (9.5)</p>
                     </c>
                     <c ca="center">
                        <p>65</p>
                     </c>
                     <c ca="center">
                        <p>71</p>
                     </c>
                     <c ca="center">
                        <p>79</p>
                     </c>
                     <c ca="center">
                        <p>89</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                     <c ca="center">
                        <p>No</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                     <c ca="center">
                        <p>219+ (8.9+)</p>
                     </c>
                     <c ca="center">
                        <p>252+ (20.5+)</p>
                     </c>
                     <c ca="center">
                        <p>69</p>
                     </c>
                     <c ca="center">
                        <p>73</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>Yes<sup>&#8224;</sup></p>
                     </c>
                     <c ca="center">
                        <p>Yes<sup>&#8224;</sup></p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>37 (0.3)</p>
                     </c>
                     <c ca="center">
                        <p>34 (0.3)</p>
                     </c>
                     <c ca="center">
                        <p>18</p>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>37</p>
                     </c>
                     <c ca="center">
                        <p>37</p>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>19</p>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                     <c ca="center">
                        <p>10</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1<sup>&#8225;</sup></p>
                     </c>
                     <c ca="center">
                        <p>25</p>
                     </c>
                     <c ca="center">
                        <p>29<sup>2</sup></p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>1<sup>&#8225;</sup></p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>15<sup>2</sup></p>
                     </c>
                     <c ca="center">
                        <p>30 (0.5)</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Unknown</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>26+</p>
                     </c>
                     <c ca="center">
                        <p>22+</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>50</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                     <c ca="center">
                        <p>Yes</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="13">
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total</p>
                     </c>
                     <c ca="center">
                        <p>29</p>
                     </c>
                     <c ca="center">
                        <p>29</p>
                     </c>
                     <c ca="center">
                        <p>541+</p>
                     </c>
                     <c ca="center">
                        <p>619+</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*Measured from the 5' end of the first segment to the 3' end of the last segment. <sup>&#8224;</sup>Locus 2 contains a single segment with protein tyrosine phosphatases (PTPs) and two segments with ankyrins (anks). <sup>&#8225;</sup>Characteristics of regions of these loci that were not sequenced were hypothesized based on the equivalent locus in the other (GiBV or GfBV) genome.</p>
               </tblfn>
            </tbl>
            <p>The remaining GiBV and GfBV proviral loci (Table <tblr tid="T1">1</tblr>, Figure <figr fid="F3">3</figr>) contain either a single proviral segment (loci 4-6) or two proviral segments in tandem array (loci 3 and 7). Locus 6 and locus 7 sequences are only available for GiBV and GfBV, respectively, but must exist for both genomes based on viral segment sequence data (Figure <figr fid="F1">1</figr>). BAC clones containing loci 3-7 do not overlap with each other or with those encoding loci 1 and 2. The genomic context surrounding three proviral segment sequences from each virus remains unknown, and they could occur as single or tandemly linked sequences. Unless these proviral segments are linked to the loci we have already defined (in which case there would be seven loci), our current data indicate that GiBV and GfBV proviral segment sequences will occupy eight or nine loci. It remains possible that sequence analysis of the missing proviral loci may identify additional viral segment sequences.</p>
            <p>We previously described two different long (6-7 kbp) tandem repeats flanking GiBV proviral locus 1 (named L1R1 and L1R2) <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. These repeats were not found to universally flank the remaining GiBV proviral loci or to flank GfBV proviral locus 1. A long (7.5-8 kbp) tandem repeat similar to L1R1 was found in DNA adjacent to GiBV proviral loci 4 and 5 (Figure <figr fid="F3">3</figr>, A repeats) but these repeats were not found in the homologous GfBV proviral loci. An additional smaller (1 kbp) repeat similar to L1R1 was found on the 3' side of GiBV proviral locus 2. The L1R2 repeat was not found at any other GiBV proviral loci, although L1R2-like repeats (approximately 1.5 kbp) were found near GfBV proviral loci 4 and 7 (Figure <figr fid="F3">3</figr>, B repeats). GiBV proviral locus 6 does have a long (approximately 6 kbp) tandem repeat on the 3' side (Figure <figr fid="F3">3</figr>, C repeat), although it does not share sequence similarity to either L1R1 or L2R2.</p>
            <p>As found in GiBV proviral locus 1 <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>, inter-segmental regions separating tandemly arrayed proviral segments in both the GiBV and GfBV proviral genomes are generally small (&lt;1 kbp) and do not code for proteins. One exception is the approximately 9 kbp region separating GfBV proviral segments 17 and 18, which codes for a parasitoid sodium:neurotransmitter symporter. As described above, a similar host gene is likely to exist in the homologous region in <it>G. indiensis</it>.</p>
         </sec>
         <sec>
            <st>
               <p>Predicted characteristics of the GiBV and GfBV viral genomes</p>
            </st>
            <p>A summary of the major characteristics of the viral genomes of GiBV and GfBV is given in Table <tblr tid="T2">2</tblr>, and the segment sequences are visually depicted in Figure <figr fid="F1">1</figr>. These data are based on the combined sequences derived from BV viral and proviral segments, which predicts that both BV viral genomes contain 29 segments, with an aggregated genome size of approximately 503 and 594 kbp for GiBV and GfBV, respectively. GfBV viral segments are, on average, 12% larger than their homologous segment in GiBV, which appears to be due to GfBV-specific tandem duplications of gene clusters. Three GiBV and one GfBV viral segment sequence could not be finished with either viral WGS or BAC sequence data, and assuming a 12% size difference between GiBV and GfBV segment homologs, we estimate that we are missing approximately 14 kbp of GiBV and &lt;1 kbp GfBV viral genome sequence data. We thus estimate a cumulative viral genome size to be 517 kbp for GiBV and 594 kbp for GfBV.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Genome statistics of BV viral genomes</p>
               </caption>
               <tblbdy cols="5">
                  <r>
                     <c ca="left">
                        <p>Feature</p>
                     </c>
                     <c ca="center">
                        <p>GiBV</p>
                     </c>
                     <c ca="center">
                        <p>GfBV</p>
                     </c>
                     <c ca="center">
                        <p>CcBV*</p>
                     </c>
                     <c ca="center">
                        <p>MdBV<sup>&#8224;</sup></p>
                     </c>
                  </r>
                  <r>
                     <c cspan="5">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Current genome size (kbp)</p>
                     </c>
                     <c ca="center">
                        <p>503</p>
                     </c>
                     <c ca="center">
                        <p>594</p>
                     </c>
                     <c ca="center">
                        <p>568</p>
                     </c>
                     <c ca="center">
                        <p>189</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Estimated genome size (kbp)</p>
                     </c>
                     <c ca="center">
                        <p>517</p>
                     </c>
                     <c ca="center">
                        <p>594</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Segments</p>
                     </c>
                     <c ca="center">
                        <p>29</p>
                     </c>
                     <c ca="center">
                        <p>29</p>
                     </c>
                     <c ca="center">
                        <p>30</p>
                     </c>
                     <c ca="center">
                        <p>15</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>G+C content</p>
                     </c>
                     <c ca="center">
                        <p>36%</p>
                     </c>
                     <c ca="center">
                        <p>35%</p>
                     </c>
                     <c ca="center">
                        <p>34%</p>
                     </c>
                     <c ca="center">
                        <p>34%</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Predicted genes</p>
                     </c>
                     <c ca="center">
                        <p>197</p>
                     </c>
                     <c ca="center">
                        <p>193</p>
                     </c>
                     <c ca="center">
                        <p>156</p>
                     </c>
                     <c ca="center">
                        <p>61</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Coding density</p>
                     </c>
                     <c ca="center">
                        <p>33%</p>
                     </c>
                     <c ca="center">
                        <p>32%</p>
                     </c>
                     <c ca="center">
                        <p>27%</p>
                     </c>
                     <c ca="center">
                        <p>17%</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Predicted tRNAs</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Proviral loci</p>
                     </c>
                     <c ca="center">
                        <p>7-9<sup>&#8225;</sup></p>
                     </c>
                     <c ca="center">
                        <p>7-9<sup>&#8225;</sup></p>
                     </c>
                     <c ca="center">
                        <p>?</p>
                     </c>
                     <c ca="center">
                        <p>?</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>*Data from <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>. <sup>&#8224;</sup>Data from <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>. <sup>&#8225;</sup>While seven loci are described here, the two viral segments that were not found in the BAC sequence data are assumed to potentially represent one or two additional loci.</p>
               </tblfn>
            </tbl>
            <p>The GiBV and GfBV viral genomes are predicted to encode similar numbers of proteins, 197 versus 193, respectively, and 58% and 63%, respectively, of the genes are predicted to contain introns. Both genomes have a similar average G+C content (35-36%) and protein coding density (32-33%). The genomes contain many gene families found in other bracoviruses, including protein tyrosine phosphatases (PTPs), viral ankyrins, C-type lectins, and cystatins; features of these gene families are listed in Table <tblr tid="T3">3</tblr>. Encoded PTPs, ankyrins, and cystatins are mostly predicted to be single exon genes while C-type lectins are always predicted to be two-exon genes. PTPs and ankyrins are not predicted to encode signal peptides while C-type lectins and cystatins are often predicted to encode them. Additionally, as reported for CcBV and MdBV, the GfBV and GiBV genomes are predicted to encode a small number of tRNAs (Table <tblr tid="T2">2</tblr>).</p>
            <tbl id="T3">
               <title>
                  <p>Table 3</p>
               </title>
               <caption>
                  <p>Features of gene families of GiBV and GfBV</p>
               </caption>
               <tblbdy cols="10">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="9" ca="center">
                        <p>Feature</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="9">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Number of copies</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Number with signal peptide</p>
                     </c>
                     <c cspan="2" ca="center">
                        <p>Number of exons</p>
                     </c>
                     <c ca="center">
                        <p>Average</p>
                     </c>
                     <c ca="center">
                        <p>M-K test</p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c cspan="2">
                        <hr/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Gene family</p>
                     </c>
                     <c ca="center">
                        <p>GiBV</p>
                     </c>
                     <c ca="center">
                        <p>GfBV</p>
                     </c>
                     <c ca="center">
                        <p>Loci</p>
                     </c>
                     <c ca="center">
                        <p>Gi</p>
                     </c>
                     <c ca="center">
                        <p>Gf</p>
                     </c>
                     <c ca="center">
                        <p>Gi</p>
                     </c>
                     <c ca="center">
                        <p>Gf</p>
                     </c>
                     <c ca="center">
                        <p>dN/dS (n)</p>
                     </c>
                     <c ca="center">
                        <p><it>p</it>-value</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>PTPs</p>
                     </c>
                     <c ca="center">
                        <p>42</p>
                     </c>
                     <c ca="center">
                        <p>31</p>
                     </c>
                     <c ca="center">
                        <p>2-7</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1-2</p>
                     </c>
                     <c ca="center">
                        <p>0.80 (16)</p>
                     </c>
                     <c ca="center">
                        <p>&lt;0.001</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Ankyrins</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>2-7</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>0.59 (3)</p>
                     </c>
                     <c ca="center">
                        <p>NA</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>C-type lectins</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>1.09 (1)</p>
                     </c>
                     <c ca="center">
                        <p>NA</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Cystatins</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>2.23 (1)</p>
                     </c>
                     <c ca="center">
                        <p>NA</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Sugar transporters</p>
                     </c>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>6-7</p>
                     </c>
                     <c ca="center">
                        <p>7-8</p>
                     </c>
                     <c ca="center">
                        <p>0.23 (2)</p>
                     </c>
                     <c ca="center">
                        <p>NA</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>NA, not enough data for analysis.</p>
               </tblfn>
            </tbl>
            <p>A high degree of partitioning is seen between viral segment gene content when the segments are grouped by proviral locus membership (Table <tblr tid="T1">1</tblr>). The majority of genes in locus 1 are predicted to encode signal peptides, while few genes in any other loci are. Loci 1 and 2 both contain many proviral segments, most of which encode hypothetical proteins of unknown function and contain one intron. In contrast, the remaining loci contain only one or two proviral segments and predominantly encode PTPs and viral ankyrins that are not predicted to contain introns. A recent study of CiBV showed that genes on the same viral segment were generally expressed in the secondary host in the same time period <abbrgrp><abbr bid="B35">35</abbr></abbrgrp>. Since BV viral segments are present in virion DNA preparations in different abundances, the locus-specific partitioning of GiBV and GfBV proviral segments may represent some additional form of control over BV viral gene delivery.</p>
         </sec>
         <sec>
            <st>
               <p>Proviral segments and flanking regions show fundamental sequence differences</p>
            </st>
            <p>Annotation of non-encapsidated DNA sequences flanking GiBV and GfBV proviral segment sequences predicted the presence of 78 and 71 genes, respectively. Nine genes that flank GiBV proviral locus 1 were described previously <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. Very few flanking genes showed similarity to known virus (including PDV) genes; those that did are discussed below. However, many had a high sequence similarity with insect genes (78% for flanking genes and 29% for segment genes; BLASTP, E &lt; e-10). Additionally, flanking genes tended to have more exons per gene than proviral segment genes, although the difference was not statistically significant (2 &#177; 1 for segment genes and 3 &#177; 2 for flanking genes).</p>
            <p>Proviral segment and flanking DNA are distinct not only at the gene level, but on a nucleotide composition level as well. Previously, we demonstrated that for GiBV proviral locus 1, proviral segment sequences had nucleotide compositions similar to each other and distinct from flanking sequences <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. We extended the analysis of trinucleotide frequencies to encompass all available GiBV and GfBV proviral segment, flanking, and inter-segmental sequence data. The results are shown in Figure <figr fid="F4">4</figr>. The majority of proviral segment and flanking sequences cluster into distinct groups, and the short terminal-branch lengths indicate highly similar composition within these groups. Inter-segmental regions also tend to cluster together, although with a higher degree of variation, indicated by the longer terminal-branch lengths. This was expected as the generally shorter lengths of inter-segmental sequences make calculating trinucleotide frequencies less accurate. These results were consistent across both the GiBV and GfBV sequence data.</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Clustering diagram of proviral segments, flanking sequences, and inter-segmental sequences by nucleotide composition</p>
               </caption>
               <text>
                  <p><b>Clustering diagram of proviral segments, flanking sequences, and inter-segmental sequences by nucleotide composition</b>. The clustering was generated using the neighbor-joining algorithm on relative trinucleotide frequences for each sequence region. Inter-segmental sequences are shown in black (unlabeled), proviral segment sequences in red, flanking sequences in green, and the GiBV TE in blue.</p>
               </text>
               <graphic file="gb-2008-9-12-r183-4"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>GiBV and GfBV proviral segment genes are evolving rapidly</p>
            </st>
            <p>As koinobiont endoparasitoids, PDV-carrying wasps develop as larvae within caterpillars that are still undergoing development. Therefore, they are in an arms race with the caterpillars and PDVs contribute to survival against attacks by the immune system of a living caterpillar. Given this situation, it is plausible to hypothesize that PDV genes on a whole must evolve rapidly, particularly since conserved genes that typically control viral replication and particle formation appear to be absent from the viral genome. We utilized sequence divergence between GiBV and GfBV genes to test this hypothesis. All genes described here were divided into two sets: one encompassing genes encoded by proviral segments, and one including flanking genes. Genes were considered orthologs if they had reciprocal best BLAST hits to each other and appeared in syntenic positions. Using these criteria, we identified 72 orthologous gene pairs in the proviral segment gene set and 41 in the flanking gene set.</p>
            <p>In order to examine the strength and direction of selection acting on these genes, the ratio of non-synonymous to synonymous substitutions (dN/dS) was calculated and a histogram summarizing the results is shown in Figure <figr fid="F5">5</figr>. Detailed results for each gene pair are shown in Additional data file 1. Flanking wasp genes predominantly have dN/dS values near 0 (median = 0.23, average = 0.38), indicating that they are under strong negative selection, which is expected for genes involved in essential cellular processes. On the other hand, proviral segment genes have dN/dS values centered near 1 (median = 0.92, average = 0.96), suggesting that many of these genes are under neutral or positive selection. Analysis with the Mann-Whitney U test shows that, overall, segment genes are evolving at significantly different rates than flanking genes (<it>p </it>&lt; 0.001).</p>
            <fig id="F5">
               <title>
                  <p>Figure 5</p>
               </title>
               <caption>
                  <p>Histogram of dN/dS values for viral and flanking genes in GiBV and GfBV proviral sequences</p>
               </caption>
               <text>
                  <p><b>Histogram of dN/dS values for viral and flanking genes in GiBV and GfBV proviral sequences</b>. dN/dS values were calculated for 72 and 41 homologous pairs of viral genes in flanking DNA, respectively. Genes in flanking DNA have dN/dS values centered near 0 while viral genes have dN/dS values centered near 1.</p>
               </text>
               <graphic file="gb-2008-9-12-r183-5"/>
            </fig>
            <p>An alternative explanation for the dN/dS distribution of proviral segment genes centered around 1 could be that we predicted a large number of pseudo-genes, which would be evolving neutrally; this would spike the dN/dS distribution near 1. To test this possibility and more accurately assess positive selection, we conducted a more powerful test of selection, the McDonald-Kreitman (M-K) test <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>, by comparing divergence between the 72 orthologous gene pairs to polymorphisms within those genes in the GiBV viral shotgun sequence data. Results of the test (Table <tblr tid="T4">4</tblr>) show significant evidence for positive selection across GiBV genes as a whole (<it>p </it>= 3 &#215; 10<sup>-8</sup>), indicating that most of our gene models are not false predictions and that many GiBV genes are under positive selection. Criticism of the M-K test suggests that a spurious significant result can be produced by purifying selection acting on slightly deleterious mutations within a species rather than positive selection between species <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>. However, it is highly unlikely that slightly deleterious mutations alone could account for the level of significance found in this analysis.</p>
            <tbl id="T4">
               <title>
                  <p>Table 4</p>
               </title>
               <caption>
                  <p>McDonald-Kreitman test for selection</p>
               </caption>
               <tblbdy cols="4">
                  <r>
                     <c ca="left">
                        <p>Differences</p>
                     </c>
                     <c ca="center">
                        <p>S</p>
                     </c>
                     <c ca="center">
                        <p>N</p>
                     </c>
                     <c ca="center">
                        <p>N/S</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Polymorphic</p>
                     </c>
                     <c ca="center">
                        <p>240</p>
                     </c>
                     <c ca="center">
                        <p>319</p>
                     </c>
                     <c ca="center">
                        <p>1.33</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Fixed</p>
                     </c>
                     <c ca="center">
                        <p>1,472.5</p>
                     </c>
                     <c ca="center">
                        <p>3,262.5</p>
                     </c>
                     <c ca="center">
                        <p>2.22</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p>The number of synonymous (S) and non-synonymous (N) substitutions within GiBV (polymorphic) and between GiBV and GfBV (fixed) are shown. <it>p </it>= 3 &#215; 10<sup>-8</sup>, Fisher's exact test.</p>
               </tblfn>
            </tbl>
            <p>Closer examination of specific GiBV and GfBV gene families also revealed evidence of potential positive selection, particularly within PTPs, cystatins, and C-type lectins (Table <tblr tid="T3">3</tblr>). PTPs showed a highly significant pattern of positive selection (<it>p </it>&lt; 0.0001) using the M-K test, despite having an average dN/dS below 1. Additionally, the C-type lectin and cystatin analyzed had dN/dS ratios above 1, suggesting that these genes are also under positive selection. While it is plausible that gene families that had uniformly low dN/dS values might be involved in core viral functions such as replication or encapsidation, the only gene family found with such a dN/dS distribution was the sugar transporters (average dN/dS = 0.23). As these genes are specific to GiBV and GfBV and not found in other sequenced BVs, it seems unlikely that they serve a core viral function.</p>
            <p>In contrast to the high levels of positive selection detected within proviral segment protein coding sequences, we previously reported that, within GiBV proviral locus 1, non-coding segment DNA appeared to be under purifying selection <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. However, when the analysis was extended to include all sequence data, non-coding sites were evolving at comparable rates to synonymous sites (data not shown). This suggests that this conservation of non-coding DNA is either restricted to GiBV proviral locus 1 or that previous results were affected by limited sample size.</p>
         </sec>
         <sec>
            <st>
               <p>A wasp origin of GiBV and GfBV sugar transporter genes</p>
            </st>
            <p>Little is known about the origins of PDV genes. Genes that have sequence similarity to known eukaryotic genes, such as those encoding PTPs, are thought to have eukaryotic origins (see <abbrgrp><abbr bid="B38">38</abbr></abbrgrp> for review). However, these gene families have such diverse sequences within a single PDV genome that phylogenetic analyses have thus far been unable to determine an exact origin of these genes. Recently, in an analysis of genes from previously published BV genomes, Bezier <it>et al</it>. <abbrgrp><abbr bid="B39">39</abbr></abbrgrp> found that no BV genes were more similar to their insect homologs than their vertebrate homologs, and phylogenetic analysis did not suggest an insect (or any other) origin for any BV genes.</p>
            <p>Annotation of two pairs of GiBV and GfBV segment homologs (segments 17 and 18) revealed a novel family of 8 genes with a surprisingly complex intron-exon structure, consisting of 6-8 exons in each gene as opposed to an average of 2 &#177; 1 exons in other viral genes. The eight genes are predicted to encode major facilitator superfamily (MFS) transporter proteins, which in general transport a wide variety of small solutes across membranes <abbrgrp><abbr bid="B40">40</abbr></abbrgrp>. The best BLASTP hits for all eight proteins were matches to predicted insect sugar transporters, particularly one from the honey bee <it>Apis mellifera </it>and one from the parasitic wasp <it>Nasonia vitripennis </it>(approximately 45% amino acid identity to both). Such genes have not been described within PDV genomes sequenced to date.</p>
            <p>Bayesian phylogenetic analysis using a GTR+gamma+I model was conducted on the 8 GiBV and GiBV sugar transporters and the 16 most similar transporters in insects. Three sugar transporters from vertebrates were chosen as outgroups, as no other arthropod sugar transporters were present in the GenBank protein database. The resulting phylogram is shown in Figure <figr fid="F6">6</figr>, with posterior probabilities given above branches. The GiBV and GfBV sugar transporters group strongly with an orthologous pair of sugar transporters from <it>Nasonia </it>and <it>Apis</it>, suggesting that these genes share a common hymenopteran ancestry. The sugar transporters did not group with that of the silk moth, <it>Bombyx mori</it>, suggesting that these genes were not acquired from the secondary host genome. The similarity of these genes to hymenopteran sugar transporters is likely not due to convergence, as if the genes were acquired from the secondary host genome, they would most likely be expressed in the caterpillar host, and therefore convergence should not drive the genes toward wasp sugar transporters. The low dN/dS values calculated for the sugar transporters (Table <tblr tid="T3">3</tblr>) suggest that they are under purifying selection. We hypothesize that this, coupled with a recent acquisition event, is why these genes still so closely resemble their ancestral wasp genes. It is unclear why the BV transporters would be under different selective pressures than other described virus gene families such as PTPs. Nevertheless, this finding provides support for the hypothesis that a large number of PDV genes have been acquired from their primary host, but have diverged to such an extent through positive selection that limited similarity remains with their ancestral wasp genes.</p>
            <fig id="F6">
               <title>
                  <p>Figure 6</p>
               </title>
               <caption>
                  <p>Bayesian phylogram of sugar transporter gene sequences from GiBV, GfBV and various insects</p>
               </caption>
               <text>
                  <p><b>Bayesian phylogram of sugar transporter gene sequences from GiBV, GfBV and various insects</b>. Mammal sugar transporters were used as an outgroup. Posterior probabilities >80% are listed above the corresponding branches, and higher taxonomic classification is shown to the right of the tree.</p>
               </text>
               <graphic file="gb-2008-9-12-r183-6"/>
            </fig>
         </sec>
         <sec>
            <st>
               <p>A transposable element in GiBV proviral segment 11</p>
            </st>
            <p>The GiBV proviral locus 2 sequence was generated by merging sequences from overlapping BAC clones. One BAC clone contained an 11,578 bp insertion in proviral segment 11 [GenBank:<ext-link ext-link-type="gen" ext-link-id="EU822800">EU822800</ext-link>], which was not present in the other BAC clone in the region of overlap. The insertion sequence in BAC clone 1C20 is predicted to encode a single gene with sequence similarity to transposase and was bounded by a perfect 8 bp direct repeat with perfect 49 bp inverted repeats internal to the direct repeats, suggesting that the sequence is a TE. Analysis of the transposase using ProteinRepeatMask <abbrgrp><abbr bid="B41">41</abbr></abbrgrp> and CENSOR <abbrgrp><abbr bid="B42">42</abbr></abbrgrp> classified this transposase as <it>Drosophila </it>p-element-like. However, the 8 bp direct repeat (AAATTCCA) is different from that typical of p-elements (GGCCAGAC), and the TE is much larger, overall, than typical p-elements, which are only approximately 3 kbp in size. A single copy of the 8 bp direct repeat exists in BAC clone 2C5, which lacks the TE and most likely represents a point of replicative insertion for this class II transposon. The TE insertion does not disrupt a gene. Inclusion of the TE in the nucleotide composition analysis shows that the TE strongly groups with flanking sequences, rather than the segment sequence in which it is inserted (Figure <figr fid="F4">4</figr>).</p>
            <p>The TE sequence is not depicted in the proviral locus 2 sequence presented here (Figure <figr fid="F3">3</figr>) as BAC clone 2C5 contained a complete sequence of proviral segment 11 while clone 1C20 did not. In addition, the consensus sequence derived for GiBV viral segment 11 did not contain the TE. A BLAST search of the TE against the unassembled GiBV viral WGS sequence reads revealed four matching reads. These reads matched internal parts of the TE and the junction between one of the TE ends and viral segment 11, suggesting the TE is found in some GiBV viral genomes at a low frequency. We hypothesize that this TE was recently acquired from the wasp genome, and has not yet been lost or gone to fixation in the GiBV genome. If the TE was highly deleterious to the BV genome, it would be unlikely to be present in the population. While this TE does not encode any genes other than a transposase, it does suggest that TEs can enter a BV genome and become packaged successfully. No evidence of this TE was found in either viral or proviral GfBV sequence data.</p>
         </sec>
         <sec>
            <st>
               <p>CcBV-like genes are linked with GfBV proviral locus 7 and appear to be derived from <it>Maverick </it>TEs</p>
            </st>
            <p>GfBV proviral locus 7 contains proviral segment 28 and a partial sequence of proviral segment 27, and is flanked on one side by approximately 95 kbp of non-segment DNA (Figures <figr fid="F3">3</figr> and <figr fid="F7">7</figr>). The latter encodes some common TE elements (<it>Gypsy </it>retrotransposon and <it>Mariner</it>-like) and, remarkably, genes with sequence similarity to genes identified in the CcBV viral genome (Figure <figr fid="F7">7</figr>). Additionally, this region encodes a PTP gene, which is identical in nucleotide sequence to a PTP gene at the 3' end of GfBV proviral segment 28 (asterisks in Figure <figr fid="F7">7</figr>). MAST searches of this region using the GfBV proviral excision motifs did not reveal any potential excision motifs, and BLAST searches of the region against the unassembled GfBV viral sequence reads did not reveal any matching hits, suggesting that this region does not contain novel GfBV proviral segments.</p>
            <fig id="F7">
               <title>
                  <p>Figure 7</p>
               </title>
               <caption>
                  <p>Detailed view of GfBV proviral locus 7</p>
               </caption>
               <text>
                  <p><b>Detailed view of GfBV proviral locus 7</b>. Genes are labeled by strand, and genes identical in nucleotide sequences are indicated by asterisks. TE classification and CcBV homologs are shown above the genes. The directionality of segment excision is indicated by an arrowhead next to the segment number.</p>
               </text>
               <graphic file="gb-2008-9-12-r183-7"/>
            </fig>
            <p>The genes similar to those in CcBV include one that has strong sequence similarity to CcBV hypothetical protein 30.5 and a block of three genes that are homologous to, and in the same order as, CcBV segment 31 genes 31.1, 31.2, and 31.3 (Figure <figr fid="F7">7</figr>). The gene homologous to CcBV 31.1 contains a DNA Pol B2 domain, which in CcBV was annotated as a pseudogene due to a premature translational stop codon <abbrgrp><abbr bid="B11">11</abbr><abbr bid="B43">43</abbr></abbrgrp>. The second and third genes in the block contain an integrase core domain and a poxvirus-like DNA packaging domain, respectively. The CcBV genes were previously considered 'virus-like' and were hypothesized to represent ancestral virus genes within the BV genome <abbrgrp><abbr bid="B43">43</abbr></abbrgrp>.</p>
            <p>However, ProteinRepeatMasker <abbrgrp><abbr bid="B41">41</abbr></abbrgrp> and CENSOR <abbrgrp><abbr bid="B42">42</abbr></abbrgrp> identified the block of three genes and the next two downstream genes (Figure <figr fid="F7">7</figr>) as components of a <it>Maverick </it>TE. <it>Mavericks </it>are a novel class of giant TEs <abbrgrp><abbr bid="B44">44</abbr></abbrgrp>, also known as <it>Polintons </it><abbrgrp><abbr bid="B45">45</abbr></abbrgrp>. BLAST searches revealed homologs of all five genes to be common components of <it>Maverick </it>TEs present in the recently released genome sequence of the parasitic wasp <it>Nasonia vitripennis</it>. <it>Nasonia </it>belongs to a lineage of wasps separate from those carrying PDVs, suggesting that these proteins are not of BV origin. Based on these results, we hypothesize that the tandem array of three genes in CcBV segment 31 represents remnants of a <it>Maverick </it>TE that was transferred to the CcBV proviral genome and has since become fixed.</p>
            <p>The <it>Maverick</it>-like array of proteins in the GfBV flanking DNA is missing two components common to all <it>Maverick </it>TEs: a coiled-coiled domain protein and terminal repeats. The complete absence of terminal repeats coupled with the maintenance of open reading frames is particularly unusual. Since TEs cannot function without terminal repeats, TE open reading frames typically degrade rapidly after their terminal repeats are lost. This suggests that selection on the wasp genome is maintaining these open reading frames, although their potential function is unknown. The abundance of both TEs and BV-like genes encoded in DNA flanking GfBV proviral locus 7 may indicate that this region is a 'hotspot' for the movement of DNA between proviral and flanking sequences. It will be of interest to determine if similar sequences are present in the homologous GiBV locus.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>Here we provide a comprehensive sequence and computational analysis of the viral genome of BVs isolated from two different <it>Glyptapanteles </it>species, <it>G. indiensis </it>and <it>G. flavicoxis</it>, and an analysis of proviral sequences from which encapsidated viral genomes are derived. The sequencing of both BV genomic forms, that is, viral and proviral segments, was critical in developing a more complete definition of both the viral genome as well as the structural organization of a large component of the proviral genome, given that the latter unexpectedly led to the discovery of four GiBV and one GfBV viral segment not evident from sequencing the viral genome.</p>
         <p>Although GiBV and GfBV proviral segments are not all tandemly arrayed, synteny between the two sets of sequences and preliminary linkage data for GiBV suggest that approximately 70% of the 29 proviral segments in each genome are clustered in a single genomic region consisting of two proviral loci that span a region of approximately 580 kbp. Each locus contains tandemly arrayed proviral segments separated from each other by a short stretch of non-segment DNA (Figure <figr fid="F3">3</figr>). The remaining GiBV and GfBV proviral loci identified contain either one or two proviral segments. Most of the seven characterized loci are flanked by long stretches of non-segment DNA that encode insect proteins. Not every proviral locus is flanked by long tandem repeats, as was reported for proviral locus 1 <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. So it is presently unclear how proviral loci are demarcated within the wasp genome sequence. Qualitative and quantitative studies of proviral sequences at the time of production of viral segments will be needed to accurately delineate the boundaries of amplified proviral sequences. Our sequence data are not incompatible with the hypothesis that all proviral loci are linked in a macrolocus, as suggested for CcBV proviral segments <abbrgrp><abbr bid="B25">25</abbr><abbr bid="B27">27</abbr></abbrgrp>. Additional mapping experiments, for example, fluorescence <it>in situ </it>hybridization analysis using segment-specific probes or generation of a BAC tiling path among loci should resolve the spatial relationships among the GiBV and GfBV proviral loci. If present, a macrolocus encoding proviral segments would exceed 1 Mbp in size.</p>
         <p>BVs are thought to have a monophyletic origin about 100 million years ago <abbrgrp><abbr bid="B46">46</abbr></abbrgrp>, a hypothesis supported by the high degree of synteny between GiBV and GfBV proviral loci and flanking DNA, as well as the highly conserved proviral segment excision motif among BVs <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. The compositional difference in sequences at proviral loci could be indicative of independent origins of BVs, but they could also be the result of selective pressures from the primary and or secondary host environment. It will be of interest to compare proviral loci from basal micrograstrines, such as <it>Microplitis</it>, to those of more derived miscogastrines such as <it>Glyptapanteles</it>. Such comparisons could determine if there was an ancient site for BV integration and, if such a site exists, the extent to which it has been conserved. In addition, whole host genome sequence data are likely to contribute to a more complete understanding of the evolution of BVs.</p>
         <p>The functions and origins of PDV genes are often difficult to define. Comparative sequence analyses revealed widespread positive selection across a large number of GiBV and GfBV genes, which supports their role in an 'arms race' between virus and caterpillar. This rapid evolution may help to obscure the origins of many PDV genes. However, GiBV and GfBV both encode a gene family of sugar transporters not found in other sequenced PDV genomes. Phylogenetic analyses suggest that these were wasp genes that were moved into the proviral genome, providing evidence for an insect origin for these BV genes. This suggests that the proviral BV genome may be at least partially derived from the wasp genome, and possibly represents a mosaic of an ancestral virus and more recently inserted host genes.</p>
         <p>Transposable elements represent a plausible mechanism for acquiring virulence or other desirable genes from the host <abbrgrp><abbr bid="B27">27</abbr><abbr bid="B47">47</abbr></abbrgrp>. Our evidence shows a p-element like and a <it>Maverick</it>-like element associated with BV genomes. Whether the latter plays a role in BV biology is unknown, although it is interesting to note the similarities between the proposed methods of replication in <it>Mavericks </it><abbrgrp><abbr bid="B45">45</abbr></abbrgrp> and PDVs, as both are hypothesized to replicate extrachromosomally from a circular or stem-loop molecule. Both described TEs, the former recently acquired and the latter ancient, could have served to move core viral genes out of the ancestral BV genome to the host genome and virulence genes into it. Alternatively, genes could have moved out of the proviral genome by the degradation of excision motifs of proviral segments, thereby creating 'pseudo-segments' that are no longer encapsidated.</p>
      </sec>
      <sec>
         <st>
            <p>Materials and methods</p>
         </st>
         <sec>
            <st>
               <p>Rearing of parasitoid wasps</p>
            </st>
            <p>Outbred populations of <it>G. indiensis </it>and <it>G. flavicoxis</it>, solitary and gregarious endoparasitoids of gypsy moths (<it>Lymantria dispar</it>), respectively, were maintained at the USDA-ARS-Beneficial Insects Introduction Research Unit, Newark, Delaware, until they were moved to Beltsville, Maryland in 2007. The maintenance protocol and history of the <it>G. indiensis </it>colony was described previously <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. <it>G. flavicoxis </it>was reared under the same protocol with the exception that <it>G. flavicoxis </it>parasitizes late third instar gypsy moth larvae. Cocoons formed from parasitized hosts were stored at 24&#176;C until adult parasitoid emergence and then separated by sex. For BAC library material, <it>G. flavicoxis </it>larvae were dissected from parasitized gypsy moth larvae 10 days post-parasitization, briefly rinsed in phosphate buffered saline, flash frozen in liquid nitrogen and stored frozen at -80&#176;C.</p>
         </sec>
         <sec>
            <st>
               <p>Virion purification and DNA extraction</p>
            </st>
            <p>Virions were purified from <it>G. indiensis </it>and <it>G. flavicoxis </it>females using established protocols <abbrgrp><abbr bid="B48">48</abbr></abbrgrp>. Briefly, female wasps were anaesthetized in 75% ethanol and rinsed in phosphate buffered saline. Ovaries were dissected from the females in a drop of phosphate buffered saline and ruptured, draining the calyx fluid. Pooled calyx fluid was subsequently filtered through a 0.45 &#956;m filter to remove eggs and cellular debris <abbrgrp><abbr bid="B49">49</abbr></abbrgrp>. Viral DNA was extracted according to established protocols <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Identification of BAC clones containing proviral segment DNA</p>
            </st>
            <p>BAC libraries of <it>G. indiensis </it>and <it>G. flavicoxis </it>with a 120 kb average insert size were constructed by Amplicon Express (Pullman, WA, USA), using a partial <it>Bam</it>HI digest inserted into an <it>Mbo</it>I site of a pECBAC1 vector. A nylon filter arrayed with 9,216 BAC clones was created from each library. In order to identify BAC clones containing proviral segment DNA, BV encapsidated viral DNA from each was radioactively labeled with <sup>32</sup>P-labeled &#945;-dCTP (NEN/Perkin-Elmer, Waltham, MA, USA) using the Redi-prime II DNA labeling kit (Amersham Biosciences, Piscataway, NJ, USA). Labeled DNA was then purified using a QIAquick PCR purification kit (Qiagen, Valencia, CA, USA). The filter was pre-hybridized at 65&#176;C for at least 3 hours with Rapid-hyb Buffer (Amersham Biosciences) and 500 &#956;g of salmon testes DNA (denatured at 100&#176;C; Sigma-Aldritch, St. Louis, MO, USA). The probe was added and allowed to hybridize overnight at 65&#176;C. The filter was then washed 2 times for 60 minutes each at 65&#176;C with a 0.1 &#215; SSC/0.1% SDS solution, wrapped in plastic wrap, and autoradiographed using Kodac BioMax MS film.</p>
         </sec>
         <sec>
            <st>
               <p>Viral and BAC clone sequencing</p>
            </st>
            <p>Approximately 7.5 &#956;g of BV encapsidated DNA was sheared and DNA fragments in the size range 3.5-4.5 kbp purified after separation by agarose gel electrophoresis. The fragments were blunt ended and, after addition of <it>Bst</it>XI adaptors, cloned into the <it>Bst</it>XI site of pHOS2. Shotgun libraries were similarly made for each BAC clone. Celera Assembler <abbrgrp><abbr bid="B50">50</abbr></abbrgrp> and TIGR Assembler <abbrgrp><abbr bid="B51">51</abbr></abbrgrp> were used to assemble random sequence data for BV and BAC clones. Gap closure was assisted by a closure editor tool called Cloe that also permits the manual inspection and editing of sequence data. A variety of methods were used to close gaps, including re-sequencing the ends of random clones, transposon assisted sequencing (GPS, New England Biolabs&#8482;, Ipswitch, MA, USA) or 'micro-library' construction of single or pooled templates, and conversion of physical gaps to sequence gaps using 'POMP' (pipette optimal multiplex PCR) <abbrgrp><abbr bid="B52">52</abbr></abbrgrp> and or/a 'Genome Walker' kit (Invitrogen&#8482;).</p>
         </sec>
         <sec>
            <st>
               <p>Viral segment-specific PCRs and hybridizations</p>
            </st>
            <p>Primers were developed specific to individual identified GiBV and GfBV viral segment sequences as described in <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. PCR was performed in a 10 &#956;l solution that included 0.1 &#956;l template DNA, 0.3 &#956;l 50 mM MgCl<sub>2</sub>, 1 &#956;l 10&#215; PCR buffer, 0.2 &#956;l 10 mM dNTPs, 7.9 &#956;l H<sub>2</sub>O, 0.1 &#956;l Platinum Taq (Invitrogen), 0.2 &#956;l F primer (20 pm/&#956;l), and 0.2 &#956;l RC primer (20 pm/&#956;l). The PCR protocol was 94&#176; for 2 minutes; 35 cycles of 94&#176; for 30 s, 58&#176; for 30 s, 72&#176; for 45 s; followed by 72&#176; for 7 minutes. PCR products to be used for hybridizations were purified using a QIAquick PCR purification kit (Qiagen). Segment-specific hybridizations were done as described above for total viral DNA hybridizations.</p>
         </sec>
         <sec>
            <st>
               <p>Derivation of consensus segment sequences for GiBV and GfBV</p>
            </st>
            <p>Because individual sequence reads could not be associated with individual wasps, a conical consensus sequence was generated for each BV segment using the SliceTools package <abbrgrp><abbr bid="B53">53</abbr></abbrgrp>. At a given position in a conical consensus, all bases with a cumulative quality value within 50% of the highest cumulative quality value were assigned to that position.</p>
         </sec>
         <sec>
            <st>
               <p>Annotation</p>
            </st>
            <p>A combination of SoftBerry's FGENESH <abbrgrp><abbr bid="B54">54</abbr></abbrgrp> using the honey bee (<it>A. mellifera</it>) training set, and the Beijing Genome Institute's BGF <abbrgrp><abbr bid="B55">55</abbr></abbrgrp> trained on the silkmoth (<it>B. mori</it>) were used for gene prediction, in addition to the AAT package <abbrgrp><abbr bid="B56">56</abbr></abbrgrp>, which allows spliced alignment of proteins to genomic DNA, thereby revealing potential exon-intron boundaries. Gene models from FGENESH were generally accepted except when multiple other sources of information contradicted those models. SignalP <abbrgrp><abbr bid="B57">57</abbr><abbr bid="B58">58</abbr></abbrgrp> and tRNAScan-SE <abbrgrp><abbr bid="B59">59</abbr></abbrgrp> were used to predict signal peptides and tRNAs, respectively. Transposable elements were annotated using ProteinRepeatMasker <abbrgrp><abbr bid="B41">41</abbr></abbrgrp> and CENSOR <abbrgrp><abbr bid="B42">42</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Motif analyses</p>
            </st>
            <p>Excision motifs were generated by cutting out a sequence extending 30 bp upstream and downstream from the GCT excision site at the 5' and 3' boundaries of proviral segments and at the GCT circularization site of viral segments for both GiBV and GfBV. No additional alignment was conducted on the sequences. All motifs were visualized using WebLogo <abbrgrp><abbr bid="B60">60</abbr><abbr bid="B61">61</abbr></abbrgrp>. Proviral excision motifs were also generated with these sequences using MEME <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>, and the resulting motifs were used to search BAC sequences for potential additional proviral segments using MAST <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Comparative genomic analyses</p>
            </st>
            <p>Jaccard orthologous gene clusters between GiBV and GfBV were calculated using Sybil <abbrgrp><abbr bid="B62">62</abbr></abbrgrp>. Syntenic blocks were defined as two or more adjacent orthologous gene clusters, and the results were visualized using Sybil <abbrgrp><abbr bid="B62">62</abbr></abbrgrp>. This information, in addition to conserved location (locus and position within that locus) of proviral segments, was used to define homologous segments between GiBV and GfBV.</p>
         </sec>
         <sec>
            <st>
               <p>Phylogenetic and compositional analyses</p>
            </st>
            <p>For the phylogenetic analysis, GiBV and GfBV MFS transporter genes were searched against the GenBank non-redundant protein database using BLASTP. The top 18 hits from unique organisms were downloaded from GenBank (<it>N. vitripennis</it>, [GenBank:<ext-link ext-link-type="gen" ext-link-id="XP_001607065">XP_001607065</ext-link>; <ext-link ext-link-type="gen" ext-link-id="XP_001602960">XP_001602960</ext-link>]; <it>A. mellifera</it>, [GenBank:<ext-link ext-link-type="gen" ext-link-id="XP_001120868">XP_001120868</ext-link>; <ext-link ext-link-type="gen" ext-link-id="XP_395522">XP_395522</ext-link>]; <it>Tribolium castaneum</it>, [GenBank:<ext-link ext-link-type="gen" ext-link-id="XP_973694">XP_973694</ext-link>; <ext-link ext-link-type="gen" ext-link-id="XP_973659">XP_973659</ext-link>], [GenBank:<ext-link ext-link-type="gen" ext-link-id="XP_966705">XP_966705</ext-link>; <ext-link ext-link-type="gen" ext-link-id="XP_966524">XP_966524</ext-link>]; <it>Anopheles gambiae</it>, [GenBank:<ext-link ext-link-type="gen" ext-link-id="XP_311836">XP_311836</ext-link>]; <it>Aedes egypti</it>, [GenBank:<ext-link ext-link-type="gen" ext-link-id="XP_001649205">XP_001649205</ext-link>]; <it>Drosophila melanogaster</it>, [GenBank:<ext-link ext-link-type="gen" ext-link-id="NP_611451">NP_611451</ext-link>; <ext-link ext-link-type="gen" ext-link-id="NP_524479">NP_524479</ext-link>; <ext-link ext-link-type="gen" ext-link-id="CAA73031">CAA73031</ext-link>; <ext-link ext-link-type="gen" ext-link-id="XP_001361445">XP_001361445</ext-link>]; <it>Drosophila pseudoobscura</it>, [GenBank:<ext-link ext-link-type="gen" ext-link-id="XP_001358762">XP_001358762</ext-link>]; <it>Mus musculus</it>, [GenBank:<ext-link ext-link-type="gen" ext-link-id="NP_035525">NP_035525</ext-link>; <ext-link ext-link-type="gen" ext-link-id="CAC36405">CAC36405</ext-link>]; and <it>Rattus norvegicus</it>, [GenBank:<ext-link ext-link-type="gen" ext-link-id="NP_062103">NP_062103</ext-link>]). Additionally, the single GfBV MFS transporter gene was searched against <it>B. mori </it>expressed sequence tags in GenBank, and the single strong hit (E = e-61; [Genbank:<ext-link ext-link-type="gen" ext-link-id="BJ985900">BJ985900</ext-link>]) was downloaded from GenBank and translated. These sequences, in addition to the eight MFS transporters predicted for GiBV and GfBV, were aligned using ClustalW <abbrgrp><abbr bid="B63">63</abbr></abbrgrp>, and regions of ambiguous alignment were removed using Seaview <abbrgrp><abbr bid="B64">64</abbr></abbrgrp>, resulting in an alignment of 448 amino acids. The phylogenetic analysis was conducted using MrBayes 3.1.2 <abbrgrp><abbr bid="B65">65</abbr><abbr bid="B66">66</abbr></abbrgrp>, sampling every 1,000 generations for 1 &#215; 10<sup>7 </sup>generations. The first 50% of generations were discarded as burn-in, and posterior probabilities were calculated from the remaining 501 sampled generations.</p>
            <p>For the nucleotide composition analysis, relative trinucleotide frequencies <abbrgrp><abbr bid="B67">67</abbr></abbrgrp> were calculated for all segment, inter-segmental, and flanking sequences. A Euclidean distance matrix was then constructed from those frequencies. The sequences were then clustered using the neighbor-joining algorithm in PAUP* <abbrgrp><abbr bid="B68">68</abbr></abbrgrp> and the resulting tree was visualized with Treeview <abbrgrp><abbr bid="B69">69</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Molecular evolution analyses</p>
            </st>
            <p>All proteins described here for each genome were divided into two sets: those encoded by proviral segments and flanking genes. For each set, BLASTP in WU-BLAST <abbrgrp><abbr bid="B70">70</abbr></abbrgrp> was used to search the GiBV (or Gi) proteins against the GfBV (or Gf) proteins and vice versa. Nucleotide sequences of reciprocal best hit pairs that appeared in syntenic regions (in the same segment for proviral genes and in the same region for flanking genes) were aligned using the cdna_fast_pair method in T-Coffee <abbrgrp><abbr bid="B71">71</abbr></abbrgrp>, and pairs with ambiguous or frameshifted alignments were removed. The codeml program in PAML <abbrgrp><abbr bid="B72">72</abbr><abbr bid="B73">73</abbr></abbrgrp> was used to calculate dN/dS (Ka/Ks) for the remaining gene pair alignments. Pairs of proviral genes were further analyzed by using codeml in PAML <abbrgrp><abbr bid="B72">72</abbr><abbr bid="B73">73</abbr></abbrgrp> to calculate the number of silent and replacement substitutions. The number of silent and replacement polymorphisms within the GiBV shotgun sequence data for these genes with at least 3&#215; coverage were then calculated using previously described methods <abbrgrp><abbr bid="B15">15</abbr></abbrgrp>. The M-K test <abbrgrp><abbr bid="B36">36</abbr></abbrgrp> was then utilized to test gene pairs for evidence of positive or negative selection.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Abbreviations</p>
         </st>
         <p>BAC: bacterial artificial chromosome; BV: bracovirus; CcBV: <it>Cotesia congregata </it>bracovirus; CiBV: <it>Chelonus inanitus </it>bracovirus; CsIV: <it>Campoletis sonorensis </it>ichnovirus; dN/dS: ratio of non-synonymous to synonymous substitutions; GfBV: <it>Glyptapanteles flavicoxis </it>bracovirus; GiBV: <it>Glyptapanteles indiensis </it>bracovirus; IV: ichnovirus; MdBV: <it>Microplitis demolitor </it>bracovirus; MFS: major facilitator superfamily; M-K: McDonald-Kreitman; PDV: polydnavirus; PTP: protein tyrosine phosphatase; TE: transposable element; WGS: whole genome shotgun.</p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>VN and DEGR conceived the project. VN, CAD, and DEGR coordinated the project. CAD, DEGR, VN, and MJP designed and performed laboratory procedures and experiments. CAD, MCS, JC, and VN designed and performed computational analyses. CAD, VN, and DEGR wrote the manuscript. CAD and BJH conducted genome annotation. JBH, LJT, and KMJ conducted genome closure. RWF reared parasitoids. DWF and HF conducted library construction. All authors read and approved this manuscript.</p>
      </sec>
      <sec>
         <st>
            <p>Additional data files</p>
         </st>
         <p>The following additional data are available with the online version of this article. Additional data file <supplr sid="S1">1</supplr> is a table showing the molecular evolutionary analyses of GiBV and GfBV.</p>
         <suppl id="S1">
            <title>
               <p>Additional data file 1</p>
            </title>
            <caption>
               <p>Molecular evolutionary analyses of GiBV and GfBV</p>
            </caption>
            <text>
               <p>Molecular evolutionary analyses of GiBV and GfBV.</p>
            </text>
            <file name="gb-2008-9-12-r183-S1.doc">
               <p>Click here for file</p>
            </file>
         </suppl>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>We would like to thank Teresa Utterback, Tamara Feldblyum, and the staff at J Craig Venter Institute's Joint Technology Center for sequencing and viral library construction, and the JCVI IT department for general support. We would also like to thank Jessica Vamathevan and Mihai Pop for initial work on viral genome closure and analysis, Hean Koo and Jessica Chen for handling sequence submissions, Linda Hannick for help with gene family computation, and Daven Presgraves for advice on SNP analysis. Funding for this study was provided by the National Science Foundation (0413618) and United States Department of Agriculture (2004-35600-15032).</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Polydnaviridae.</p>
            </title>
            <aug>
               <au>
                  <snm>Stoltz</snm>
                  <fnm>DB</fnm>
               </au>
               <au>
                  <snm>Beckage</snm>
                  <fnm>NE</fnm>
               </au>
               <au>
                  <snm>Blissard</snm>
                  <fnm>GW</fnm>
               </au>
               <au>
                  <snm>Fleming</snm>
                  <fnm>JGW</fnm>
               </au>
               <au>
                  <snm>Krell</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Theilmann</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Summers</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Webb</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>Virus Taxonomy Sixth Report of the International Committee on Taxonomy of Viruses</source>
            <publisher>Vienna: Springer Verlag</publisher>
            <editor>Murphy FA, Fauquet CM, Bishop DHL, Ghabrial SA, Jarvis AW, Martelli GP, Mayo MA, Summers MD</editor>
            <pubdate>1995</pubdate>
            <fpage>143</fpage>
            <lpage>147</lpage>
         </bibl>
         <bibl id="B2">
            <title>
               <p>The integration of polydnavirus genomes in parasitoid genomes: implications for biocontrol and genetic analyses of parasitoid wasps.</p>
            </title>
            <aug>
               <au>
                  <snm>Fleming</snm>
                  <fnm>JA</fnm>
               </au>
            </aug>
            <source>Biol Control</source>
            <pubdate>1991</pubdate>
            <volume>1</volume>
            <fpage>127</fpage>
            <lpage>135</lpage>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Polydnavirus DNA of the braconid wasp <it>Chelonus inanitus </it>is integrated in the wasp's genome and excised only in later pupal and adult stages of the female.</p>
            </title>
            <aug>
               <au>
                  <snm>Gruber</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Stettler</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Heiniger</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Schumperli</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Lanzrein</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>J Gen Virol</source>
            <pubdate>1996</pubdate>
            <volume>77</volume>
            <fpage>2873</fpage>
            <lpage>2879</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">8922483</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Molecular analysis of <it>Campoletis sonorensis </it>virus DNA in the lepidopteran host <it>Heliothis virescens</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Theilmann</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Summers</snm>
                  <fnm>MD</fnm>
               </au>
            </aug>
            <source>J Gen Virol</source>
            <pubdate>1986</pubdate>
            <volume>67</volume>
            <fpage>1961</fpage>
            <lpage>1969</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">3746255</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Correlating the initiation of virus replication with a specific phase of pupal development in an ichneumonid parasitoid.</p>
            </title>
            <aug>
               <au>
                  <snm>Norton</snm>
                  <fnm>WN</fnm>
               </au>
               <au>
                  <snm>Vinson</snm>
                  <fnm>SB</fnm>
               </au>
            </aug>
            <source>Cell Tissue Res</source>
            <pubdate>1983</pubdate>
            <volume>231</volume>
            <fpage>387</fpage>
            <lpage>398</lpage>
            <xrefbib>
               <pubid idtype="pmpid">6850807</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Fate of polydnavirus DNA of the egg-larval parasitoid <it>Chelonus inanitus </it>in the host <it>Spodoptera littoralis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Wyder</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Blank</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Lanzrein</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>J Insect Physiol</source>
            <pubdate>2003</pubdate>
            <volume>49</volume>
            <fpage>491</fpage>
            <lpage>500</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12770628</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Polydnaviruses: potent mediators of host insect immune dysfunction.</p>
            </title>
            <aug>
               <au>
                  <snm>Lavine</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Beckage</snm>
                  <fnm>NE</fnm>
               </au>
            </aug>
            <source>Parasitol Today</source>
            <pubdate>1995</pubdate>
            <volume>11</volume>
            <fpage>368</fpage>
            <lpage>378</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15275399</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Hormonal interactions between insect endoparasites and their host insects.</p>
            </title>
            <aug>
               <au>
                  <snm>Lawrence</snm>
                  <fnm>PO</fnm>
               </au>
               <au>
                  <snm>Lanzrein</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Parasites and Pathogens of Insects. Parasites</source>
            <publisher>New York: Academic Press</publisher>
            <editor>Beckage NE, Thompson SN, Federici BA</editor>
            <pubdate>1993</pubdate>
            <volume>1</volume>
            <fpage>59</fpage>
            <lpage>86</lpage>
         </bibl>
         <bibl id="B9">
            <title>
               <p>The biology and genomics of polydnaviruses.</p>
            </title>
            <aug>
               <au>
                  <snm>Webb</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Strand</snm>
                  <fnm>MR</fnm>
               </au>
            </aug>
            <source>Comprehensive Molecular Insect Science</source>
            <publisher>San Diego: Elsevier</publisher>
            <editor>Gilbert LI, I I, Gill S</editor>
            <pubdate>2005</pubdate>
            <volume>6</volume>
            <fpage>323</fpage>
            <lpage>360</lpage>
         </bibl>
         <bibl id="B10">
            <title>
               <p>Estimating the age of the polydnavirus/braconid wasp symbiosis.</p>
            </title>
            <aug>
               <au>
                  <snm>Whitfield</snm>
                  <fnm>JB</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2002</pubdate>
            <volume>99</volume>
            <fpage>7508</fpage>
            <lpage>7513</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">124262</pubid>
                  <pubid idtype="pmpid" link="fulltext">12032313</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>Genome sequence of a polydnavirus: insights into symbiotic virus evolution.</p>
            </title>
            <aug>
               <au>
                  <snm>Espagne</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Dupuy</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Huguet</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Cattolico</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Provost</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Martins</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Poirie</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Periquet</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Drezen</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2004</pubdate>
            <volume>306</volume>
            <fpage>286</fpage>
            <lpage>289</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15472078</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Polydnavirus genomes reflect their dual roles as mutualists and pathogens.</p>
            </title>
            <aug>
               <au>
                  <snm>Webb</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Strand</snm>
                  <fnm>MR</fnm>
               </au>
               <au>
                  <snm>Dickey</snm>
                  <fnm>SE</fnm>
               </au>
               <au>
                  <snm>Beck</snm>
                  <fnm>MH</fnm>
               </au>
               <au>
                  <snm>Hilgarth</snm>
                  <fnm>RS</fnm>
               </au>
               <au>
                  <snm>Barney</snm>
                  <fnm>WE</fnm>
               </au>
               <au>
                  <snm>Kadash</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Kroemer</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Lindstrom</snm>
                  <fnm>KG</fnm>
               </au>
               <au>
                  <snm>Rattanadechakul</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Shelby</snm>
                  <fnm>KS</fnm>
               </au>
               <au>
                  <snm>Thoetkiattikul</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Turnbull</snm>
                  <fnm>MW</fnm>
               </au>
               <au>
                  <snm>Witherell</snm>
                  <fnm>RA</fnm>
               </au>
            </aug>
            <source>Virology</source>
            <pubdate>2006</pubdate>
            <volume>347</volume>
            <fpage>160</fpage>
            <lpage>174</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16380146</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Shared and species-specific features among ichnovirus genomes.</p>
            </title>
            <aug>
               <au>
                  <snm>Tanaka</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Lapointe</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Barney</snm>
                  <fnm>WE</fnm>
               </au>
               <au>
                  <snm>Makkay</snm>
                  <fnm>AM</fnm>
               </au>
               <au>
                  <snm>Stoltz</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Cusson</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Webb</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>Virology</source>
            <pubdate>2007</pubdate>
            <volume>363</volume>
            <fpage>26</fpage>
            <lpage>35</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17306851</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Genomic and morphological features of a banchine polydnavirus: comparison with bracoviruses and ichnoviruses.</p>
            </title>
            <aug>
               <au>
                  <snm>Lapointe</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Tanaka</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Barney</snm>
                  <fnm>WE</fnm>
               </au>
               <au>
                  <snm>Whitfield</snm>
                  <fnm>JB</fnm>
               </au>
               <au>
                  <snm>Banks</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Beliveau</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Stoltz</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Webb</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Cusson</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>J Virol</source>
            <pubdate>2007</pubdate>
            <volume>81</volume>
            <fpage>6491</fpage>
            <lpage>6501</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1900126</pubid>
                  <pubid idtype="pmpid" link="fulltext">17428854</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Structure and evolution of a proviral locus of <it>Glyptapanteles indiensis </it>bracovirus.</p>
            </title>
            <aug>
               <au>
                  <snm>Desjardins</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Gundersen-Rindal</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Hostetler</snm>
                  <fnm>JB</fnm>
               </au>
               <au>
                  <snm>Tallon</snm>
                  <fnm>LJ</fnm>
               </au>
               <au>
                  <snm>Fuester</snm>
                  <fnm>RW</fnm>
               </au>
               <au>
                  <snm>Schatz</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Pedroni</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Fadrosh</snm>
                  <fnm>DW</fnm>
               </au>
               <au>
                  <snm>Haas</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Toms</snm>
                  <fnm>BS</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Nene</snm>
                  <fnm>V</fnm>
               </au>
            </aug>
            <source>BMC Microbiol</source>
            <pubdate>2007</pubdate>
            <volume>7</volume>
            <fpage>61</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1919376</pubid>
                  <pubid idtype="pmpid" link="fulltext">17594494</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Polydnavirus genes and genomes: emerging gene families and new insights into polydnavirus replication.</p>
            </title>
            <aug>
               <au>
                  <snm>Kroemer</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Webb</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>Annu Rev Entomol</source>
            <pubdate>2004</pubdate>
            <volume>49</volume>
            <fpage>431</fpage>
            <lpage>456</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">14651471</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>A gene encoding a polydnavirus structural polypeptide is not encapsidated.</p>
            </title>
            <aug>
               <au>
                  <snm>Deng</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Stoltz</snm>
                  <fnm>DB</fnm>
               </au>
               <au>
                  <snm>Webb</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>Virology</source>
            <pubdate>2000</pubdate>
            <volume>269</volume>
            <fpage>440</fpage>
            <lpage>450</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10753722</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Origin and evolution of polydnaviruses by symbiogenesis of insect DNA viruses in endoparasitic wasps.</p>
            </title>
            <aug>
               <au>
                  <snm>Federici</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Bigot</snm>
                  <fnm>Y</fnm>
               </au>
            </aug>
            <source>J Insect Physiol</source>
            <pubdate>2003</pubdate>
            <volume>49</volume>
            <fpage>419</fpage>
            <lpage>432</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12770621</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Virus or not? Phylogenetics of polydnaviruses and their wasp carriers.</p>
            </title>
            <aug>
               <au>
                  <snm>Whitfield</snm>
                  <fnm>JB</fnm>
               </au>
               <au>
                  <snm>Asgari</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>J Insect Physiol</source>
            <pubdate>2003</pubdate>
            <volume>49</volume>
            <fpage>397</fpage>
            <lpage>405</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12770619</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Polydnavirus DNA is integrated in the DNA of its parasitoid wasp host.</p>
            </title>
            <aug>
               <au>
                  <snm>Fleming</snm>
                  <fnm>JG</fnm>
               </au>
               <au>
                  <snm>Summers</snm>
                  <fnm>MD</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1991</pubdate>
            <volume>88</volume>
            <fpage>9770</fpage>
            <lpage>9774</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">52802</pubid>
                  <pubid idtype="pmpid" link="fulltext">1946402</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>Homologous sequences in the <it>Campoletis sonorensis </it>polydnavirus genome are implicated in replication and nesting of the W segment family.</p>
            </title>
            <aug>
               <au>
                  <snm>Cui</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Webb</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>J Virol</source>
            <pubdate>1997</pubdate>
            <volume>71</volume>
            <fpage>8504</fpage>
            <lpage>8513</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">192314</pubid>
                  <pubid idtype="pmpid" link="fulltext">9343208</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Characterization of <it>Campoletis sonorensis </it>ichnovirus unique segment B and excision locus structure.</p>
            </title>
            <aug>
               <au>
                  <snm>Rattanadechakul</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Webb</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>J Insect Physiol</source>
            <pubdate>2003</pubdate>
            <volume>49</volume>
            <fpage>523</fpage>
            <lpage>532</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12770631</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>Excision of the polydnavirus chromosomal integrated EP1 sequence of the parasitoid wasp <it>Cotesia congregata </it>(Braconidae, Microgastinae) at potential recombinase binding sites.</p>
            </title>
            <aug>
               <au>
                  <snm>Savary</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Beckage</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Tan</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Periquet</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Drezen</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>J Gen Virol</source>
            <pubdate>1997</pubdate>
            <volume>78</volume>
            <fpage>3125</fpage>
            <lpage>3134</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9400960</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Characterization of <it>Chelonus inanitus </it>polydnavirus segments: sequences and analysis, excision site and demonstration of clustering.</p>
            </title>
            <aug>
               <au>
                  <snm>Wyder</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Tschannen</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Hochuli</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Gruber</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Saladin</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Zumbach</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lanzrein</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>J Gen Virol</source>
            <pubdate>2002</pubdate>
            <volume>83</volume>
            <fpage>247</fpage>
            <lpage>256</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11752722</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>Visualization of polydnavirus sequences in a parasitoid wasp chromosome.</p>
            </title>
            <aug>
               <au>
                  <snm>Belle</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Beckage</snm>
                  <fnm>NE</fnm>
               </au>
               <au>
                  <snm>Rousselet</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Poirie</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Lemeunier</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Drezen</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>J Virol</source>
            <pubdate>2002</pubdate>
            <volume>76</volume>
            <fpage>5793</fpage>
            <lpage>5796</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">137038</pubid>
                  <pubid idtype="pmpid" link="fulltext">11992007</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Polydnavirus replication: the EP1 segment of the parasitoid wasp <it>Cotesia congregata </it>is amplified within a larger precursor molecule.</p>
            </title>
            <aug>
               <au>
                  <snm>Pasquier-Barre</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Dupuy</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Huguet</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Monteiro</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Moreau</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Poirie</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Drezen</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>J Gen Virol</source>
            <pubdate>2002</pubdate>
            <volume>83</volume>
            <fpage>2035</fpage>
            <lpage>2045</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12124468</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>Polydnavirus genome: integrated vs. free virus.</p>
            </title>
            <aug>
               <au>
                  <snm>Drezen</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Provost</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Espagne</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Cattolico</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Dupuy</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Poirie</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Periquet</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Huguet</snm>
                  <fnm>E</fnm>
               </au>
            </aug>
            <source>J Insect Physiol</source>
            <pubdate>2003</pubdate>
            <volume>49</volume>
            <fpage>407</fpage>
            <lpage>417</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12770620</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Ovary development and polydnavirus morphogenesis in the parasitic wasp <it>Chelonus inanitus</it>. I. Ovary morphogenesis, amplification of viral DNA and ecdysteroid titres.</p>
            </title>
            <aug>
               <au>
                  <snm>Marti</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Grossniklaus-Burgin</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wyder</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Wyler</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Lanzrein</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>J Gen Virol</source>
            <pubdate>2003</pubdate>
            <volume>84</volume>
            <fpage>1141</fpage>
            <lpage>1150</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12692279</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Genome organization of the <it>Chelonus inanitus </it>polydnavirus: excision sites, spacers and abundance of proviral and excised segments.</p>
            </title>
            <aug>
               <au>
                  <snm>Annaheim</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Lanzrein</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>J Gen Virol</source>
            <pubdate>2007</pubdate>
            <volume>88</volume>
            <fpage>450</fpage>
            <lpage>457</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17251562</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Morphological and genomic characterization of the polydnavirus associated with the parasitoid wasp <it>Glyptapanteles indiensis </it>(Hymenoptera: Braconidae).</p>
            </title>
            <aug>
               <au>
                  <snm>Chen</snm>
                  <fnm>YP</fnm>
               </au>
               <au>
                  <snm>Gundersen-Rindal</snm>
                  <fnm>DE</fnm>
               </au>
            </aug>
            <source>J Gen Virol</source>
            <pubdate>2003</pubdate>
            <volume>84</volume>
            <fpage>2051</fpage>
            <lpage>2060</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12867635</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Evidence for integration of <it>Glyptapanteles indiensis </it>polydnavirus DNA into the chromosome of <it>Lymantria dispar in vitro</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Gundersen-Rindal</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Dougherty</snm>
                  <fnm>EM</fnm>
               </au>
            </aug>
            <source>Virus Res</source>
            <pubdate>2000</pubdate>
            <volume>66</volume>
            <fpage>27</fpage>
            <lpage>37</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10653915</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Characterization and transcriptional analysis of protein tyrosine phosphatase genes and an ankyrin repeat gene of the parasitoid <it>Glyptapanteles indiensis </it>polydnavirus in the parasitized host.</p>
            </title>
            <aug>
               <au>
                  <snm>Gundersen-Rindal</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Pedroni</snm>
                  <fnm>MJ</fnm>
               </au>
            </aug>
            <source>J Gen Virol</source>
            <pubdate>2006</pubdate>
            <volume>87</volume>
            <fpage>311</fpage>
            <lpage>322</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16432017</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>Fitting a mixture model by expectation maximization to discover motifs in biopolymers.</p>
            </title>
            <aug>
               <au>
                  <snm>Bailey</snm>
                  <fnm>TL</fnm>
               </au>
               <au>
                  <snm>Elkan</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Proceedings of the Second International Conference on Intelligent Systems for Molecular Biology</source>
            <publisher>Menlo Park, California: AAAI Press</publisher>
            <pubdate>1994</pubdate>
            <fpage>28</fpage>
            <lpage>36</lpage>
         </bibl>
         <bibl id="B34">
            <title>
               <p>Combining evidence using p-values: application to sequence homology searches.</p>
            </title>
            <aug>
               <au>
                  <snm>Bailey</snm>
                  <fnm>TL</fnm>
               </au>
               <au>
                  <snm>Gribskov</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>1998</pubdate>
            <volume>14</volume>
            <fpage>48</fpage>
            <lpage>54</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9520501</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>Transcriptional analysis of polydnaviral genes in the course of parasitization reveals segment-specific patterns.</p>
            </title>
            <aug>
               <au>
                  <snm>Weber</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Annaheim</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Lanzrein</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Arch Insect Biochem Physiol</source>
            <pubdate>2007</pubdate>
            <volume>66</volume>
            <fpage>9</fpage>
            <lpage>22</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17694561</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>Adaptive protein evolution at the Adh locus in <it>Drosophila</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>McDonald</snm>
                  <fnm>JH</fnm>
               </au>
               <au>
                  <snm>Kreitman</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>1991</pubdate>
            <volume>351</volume>
            <fpage>652</fpage>
            <lpage>654</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">1904993</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Looking for Darwin in all the wrong places: the misguided quest for positive selection at the nucleotide sequence level.</p>
            </title>
            <aug>
               <au>
                  <snm>Hughes</snm>
                  <fnm>AL</fnm>
               </au>
            </aug>
            <source>Heredity</source>
            <pubdate>2007</pubdate>
            <volume>99</volume>
            <fpage>364</fpage>
            <lpage>373</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17622265</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>Unfolding the evolutionary story of polydnaviruses.</p>
            </title>
            <aug>
               <au>
                  <snm>Dupuy</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Huguet</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Drezen</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Virus Res</source>
            <pubdate>2006</pubdate>
            <volume>117</volume>
            <fpage>81</fpage>
            <lpage>89</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16460826</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>Bracovirus gene products are highly divergent from insect proteins.</p>
            </title>
            <aug>
               <au>
                  <snm>Bezier</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Herbiniere</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Serbielle</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Lesobre</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wincker</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Huguet</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Drezen</snm>
                  <fnm>JM</fnm>
               </au>
            </aug>
            <source>Arch Insect Biochem Physiol</source>
            <pubdate>2008</pubdate>
            <volume>67</volume>
            <fpage>172</fpage>
            <lpage>187</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18348209</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B40">
            <title>
               <p>Major facilitator superfamily.</p>
            </title>
            <aug>
               <au>
                  <snm>Pao</snm>
                  <fnm>SS</fnm>
               </au>
               <au>
                  <snm>Paulsen</snm>
                  <fnm>IT</fnm>
               </au>
               <au>
                  <snm>Saier</snm>
                  <fnm>MH</fnm>
                  <suf>Jr</suf>
               </au>
            </aug>
            <source>Microbiol Mol Biol Rev</source>
            <pubdate>1998</pubdate>
            <volume>62</volume>
            <fpage>1</fpage>
            <lpage>34</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">98904</pubid>
                  <pubid idtype="pmpid" link="fulltext">9529885</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>RepeatMasker Open-3.0</p>
            </title>
            <url>http://www.repeatmasker.org</url>
         </bibl>
         <bibl id="B42">
            <title>
               <p>Annotation, submission and screening of repetitive elements in Repbase: RepbaseSubmitter and Censor.</p>
            </title>
            <aug>
               <au>
                  <snm>Kohany</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Gentles</snm>
                  <fnm>AJ</fnm>
               </au>
               <au>
                  <snm>Hankus</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Jurka</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>BMC Bioinformatics</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <fpage>474</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1634758</pubid>
                  <pubid idtype="pmpid" link="fulltext">17064419</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B43">
            <title>
               <p>The few virus-like genes of <it>Cotesia congregata </it>bracovirus.</p>
            </title>
            <aug>
               <au>
                  <snm>Drezen</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Bezier</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lesobre</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Huguet</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Cattolico</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Periquet</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Dupuy</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Arch Insect Biochem Physiol</source>
            <pubdate>2006</pubdate>
            <volume>61</volume>
            <fpage>110</fpage>
            <lpage>122</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16482582</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B44">
            <title>
               <p><it>Mavericks</it>, a novel class of giant transposable elements widespread in eukaryotes and related to DNA viruses.</p>
            </title>
            <aug>
               <au>
                  <snm>Pritham</snm>
                  <fnm>EJ</fnm>
               </au>
               <au>
                  <snm>Putliwala</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Feschotte</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>2007</pubdate>
            <volume>390</volume>
            <fpage>3</fpage>
            <lpage>17</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17034960</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>Self-synthesizing DNA transposons in eukaryotes.</p>
            </title>
            <aug>
               <au>
                  <snm>Kapitonov</snm>
                  <fnm>VV</fnm>
               </au>
               <au>
                  <snm>Jurka</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>2006</pubdate>
            <volume>103</volume>
            <fpage>4540</fpage>
            <lpage>4545</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1450207</pubid>
                  <pubid idtype="pmpid" link="fulltext">16537396</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B46">
            <title>
               <p>Phylogeny of the parasitic microgastroid subfamilies (Hymenoptera: Braconidae) based on sequence data from seven genes, with an improved time estimate of the origin of the lineage.</p>
            </title>
            <aug>
               <au>
                  <snm>Murphy</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Banks</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Whitfield</snm>
                  <fnm>JB</fnm>
               </au>
               <au>
                  <snm>Austin</snm>
                  <fnm>AD</fnm>
               </au>
            </aug>
            <source>Mol Phylogenet Evol</source>
            <pubdate>2008</pubdate>
            <volume>47</volume>
            <fpage>378</fpage>
            <lpage>395</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">18325792</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B47">
            <title>
               <p>Polydnavirus biology, genome structure, and evolution.</p>
            </title>
            <aug>
               <au>
                  <snm>Webb</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>The Insect Viruses</source>
            <publisher>New York: Plenum Press</publisher>
            <editor>Miller LK, Ball LA</editor>
            <pubdate>1998</pubdate>
            <fpage>105</fpage>
            <lpage>139</lpage>
         </bibl>
         <bibl id="B48">
            <title>
               <p>Virus with a multipartite superhelical DNA genome from the Ichneumonid parasitoid <it>Campoletis sonorensis</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Krell</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Summers</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Vinson</snm>
                  <fnm>SB</fnm>
               </au>
            </aug>
            <source>J Virol</source>
            <pubdate>1982</pubdate>
            <volume>43</volume>
            <fpage>859</fpage>
            <lpage>870</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">256196</pubid>
                  <pubid idtype="pmpid" link="fulltext">16789230</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B49">
            <title>
               <p>Characterization and biological effects of <it>Cotesia congregata </it>polydnavirus on host larvae of the tobacco hornworm, <it>Manduca sexta</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Beckage</snm>
                  <fnm>NE</fnm>
               </au>
               <au>
                  <snm>Tan</snm>
                  <fnm>FF</fnm>
               </au>
               <au>
                  <snm>Schleifer</snm>
                  <fnm>KW</fnm>
               </au>
               <au>
                  <snm>Lane</snm>
                  <fnm>RD</fnm>
               </au>
               <au>
                  <snm>Cherubin</snm>
                  <fnm>LL</fnm>
               </au>
            </aug>
            <source>Arch Insect Biochem Physiol</source>
            <pubdate>1994</pubdate>
            <volume>26</volume>
            <fpage>165</fpage>
            <lpage>195</lpage>
         </bibl>
         <bibl id="B50">
            <title>
               <p>A whole-genome assembly of <it>Drosophila</it>.</p>
            </title>
            <aug>
               <au>
                  <snm>Myers</snm>
                  <fnm>EW</fnm>
               </au>
               <au>
                  <snm>Sutton</snm>
                  <fnm>GG</fnm>
               </au>
               <au>
                  <snm>Delcher</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Dew</snm>
                  <fnm>IM</fnm>
               </au>
               <au>
                  <snm>Fasulo</snm>
                  <fnm>DP</fnm>
               </au>
               <au>
                  <snm>Flanigan</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Kravitz</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Mobarry</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>Reinert</snm>
                  <fnm>KH</fnm>
               </au>
               <au>
                  <snm>Remington</snm>
                  <fnm>KA</fnm>
               </au>
               <au>
                  <snm>Anson</snm>
                  <fnm>EL</fnm>
               </au>
               <au>
                  <snm>Bolanos</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Chou</snm>
                  <fnm>HH</fnm>
               </au>
               <au>
                  <snm>Jordan</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>Halpern</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Lonardi</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Beasley</snm>
                  <fnm>EM</fnm>
               </au>
               <au>
                  <snm>Brandon</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Dunn</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Lai</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Liang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Nusskern</snm>
                  <fnm>DR</fnm>
               </au>
               <au>
                  <snm>Zhan</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Rubin</snm>
                  <fnm>GM</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Venter</snm>
                  <fnm>JC</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2000</pubdate>
            <volume>287</volume>
            <fpage>2196</fpage>
            <lpage>2204</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10731133</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B51">
            <title>
               <p>TIGR Assembler: A new tool for assembling large shotgun sequencing projects.</p>
            </title>
            <aug>
               <au>
                  <snm>Sutton</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kerlavage</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Genome Sci Technol</source>
            <pubdate>1995</pubdate>
            <volume>1</volume>
            <fpage>9</fpage>
            <lpage>19</lpage>
         </bibl>
         <bibl id="B52">
            <title>
               <p>Optimized multiplex PCR: efficiently closing a whole-genome shotgun sequencing project.</p>
            </title>
            <aug>
               <au>
                  <snm>Tettelin</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Radune</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Kasif</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Khouri</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
            </aug>
            <source>Genomics</source>
            <pubdate>1999</pubdate>
            <volume>62</volume>
            <fpage>500</fpage>
            <lpage>507</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10644449</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B53">
            <title>
               <p>Slice Tools</p>
            </title>
            <url>http://slicetools.sourceforge.net</url>
         </bibl>
         <bibl id="B54">
            <title>
               <p>SoftBerry - FGENESH</p>
            </title>
            <url>http://www.softberry.com</url>
         </bibl>
         <bibl id="B55">
            <title>
               <p>Beijing Gene Finder</p>
            </title>
            <url>http://bgf.genomics.org.cn</url>
         </bibl>
         <bibl id="B56">
            <title>
               <p>A tool for analyzing and annotating genomic sequences.</p>
            </title>
            <aug>
               <au>
                  <snm>Huang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Zhou</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Kerlavage</snm>
                  <fnm>AR</fnm>
               </au>
            </aug>
            <source>Genomics</source>
            <pubdate>1997</pubdate>
            <volume>46</volume>
            <fpage>37</fpage>
            <lpage>45</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9403056</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B57">
            <title>
               <p>Identification of prokaryotic and eukaryotic signal peptides and prediction of their cleavage sites.</p>
            </title>
            <aug>
               <au>
                  <snm>Nielsen</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Engelbrecht</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Brunak</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>von Heijne</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>Protein Eng</source>
            <pubdate>1997</pubdate>
            <volume>10</volume>
            <fpage>1</fpage>
            <lpage>6</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9051728</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B58">
            <title>
               <p>Improved prediction of signal peptides: SignalP 3.0.</p>
            </title>
            <aug>
               <au>
                  <snm>Bendtsen</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Nielsen</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>von Heijne</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Brunak</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>2004</pubdate>
            <volume>340</volume>
            <fpage>783</fpage>
            <lpage>795</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">15223320</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B59">
            <title>
               <p>tRNAscan-SE: a program for improved detection of transfer RNA genes in genomic sequence.</p>
            </title>
            <aug>
               <au>
                  <snm>Lowe</snm>
                  <fnm>TM</fnm>
               </au>
               <au>
                  <snm>Eddy</snm>
                  <fnm>SR</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1997</pubdate>
            <volume>25</volume>
            <fpage>955</fpage>
            <lpage>964</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">146525</pubid>
                  <pubid idtype="pmpid" link="fulltext">9023104</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B60">
            <title>
               <p>WebLogo: a sequence logo generator.</p>
            </title>
            <aug>
               <au>
                  <snm>Crooks</snm>
                  <fnm>GE</fnm>
               </au>
               <au>
                  <snm>Hon</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Chandonia</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Brenner</snm>
                  <fnm>SE</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2004</pubdate>
            <volume>14</volume>
            <fpage>1188</fpage>
            <lpage>1190</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">419797</pubid>
                  <pubid idtype="pmpid" link="fulltext">15173120</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B61">
            <title>
               <p>Sequence logos: a new way to display consensus sequences.</p>
            </title>
            <aug>
               <au>
                  <snm>Schneider</snm>
                  <fnm>TD</fnm>
               </au>
               <au>
                  <snm>Stephens</snm>
                  <fnm>RM</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>1990</pubdate>
            <volume>18</volume>
            <fpage>6097</fpage>
            <lpage>6100</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">332411</pubid>
                  <pubid idtype="pmpid" link="fulltext">2172928</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B62">
            <title>
               <p>Sybil: methods and software for multiple genome comparison and visualization.</p>
            </title>
            <aug>
               <au>
                  <snm>Crabtree</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Angiuoli</snm>
                  <fnm>SV</fnm>
               </au>
               <au>
                  <snm>Wortman</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>White</snm>
                  <fnm>OR</fnm>
               </au>
            </aug>
            <source>Methods Mol Biol</source>
            <pubdate>2007</pubdate>
            <volume>408</volume>
            <fpage>93</fpage>
            <lpage>108</lpage>
            <xrefbib>
               <pubid idtype="pmpid">18314579</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B63">
            <title>
               <p>Multiple sequence alignment with the Clustal series of programs.</p>
            </title>
            <aug>
               <au>
                  <snm>Chenna</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Sugawara</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Koike</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Lopez</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Gibson</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Higgins</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Thompson</snm>
                  <fnm>JD</fnm>
               </au>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2003</pubdate>
            <volume>31</volume>
            <fpage>3497</fpage>
            <lpage>3500</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">168907</pubid>
                  <pubid idtype="pmpid" link="fulltext">12824352</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B64">
            <title>
               <p>SEAVIEW and PHYLO_WIN: two graphic tools for sequence alignment and molecular phylogeny.</p>
            </title>
            <aug>
               <au>
                  <snm>Galtier</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Gouy</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Gautier</snm>
                  <fnm>C</fnm>
               </au>
            </aug>
            <source>Comput Appl Biosci</source>
            <pubdate>1996</pubdate>
            <volume>12</volume>
            <fpage>543</fpage>
            <lpage>548</lpage>
            <xrefbib>
               <pubid idtype="pmpid">9021275</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B65">
            <title>
               <p>MrBayes 3: Bayesian phylogenetic inference under mixed models.</p>
            </title>
            <aug>
               <au>
                  <snm>Ronquist</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Huelsenbeck</snm>
                  <fnm>JP</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2003</pubdate>
            <volume>19</volume>
            <fpage>1572</fpage>
            <lpage>1574</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12912839</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B66">
            <title>
               <p>MRBAYES: Bayesian inference of phylogenetic trees.</p>
            </title>
            <aug>
               <au>
                  <snm>Huelsenbeck</snm>
                  <fnm>JP</fnm>
               </au>
               <au>
                  <snm>Ronquist</snm>
                  <fnm>F</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2001</pubdate>
            <volume>17</volume>
            <fpage>754</fpage>
            <lpage>755</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">11524383</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B67">
            <title>
               <p>Comparisons of eukaryotic genomic sequences.</p>
            </title>
            <aug>
               <au>
                  <snm>Karlin</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Ladunga</snm>
                  <fnm>I</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1994</pubdate>
            <volume>91</volume>
            <fpage>12832</fpage>
            <lpage>12836</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">45534</pubid>
                  <pubid idtype="pmpid" link="fulltext">7809130</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B68">
            <aug>
               <au>
                  <snm>Swofford</snm>
                  <fnm>DL</fnm>
               </au>
            </aug>
            <source>Phylogenetic Analysis Using Parsimony (*and Other Methods). Version</source>
            <publisher>Sunderland, Massachusetts: Sinauer Associates</publisher>
            <edition>4</edition>
            <pubdate>2003</pubdate>
         </bibl>
         <bibl id="B69">
            <title>
               <p>TreeView: an application to display phylogenetic trees on personal computers.</p>
            </title>
            <aug>
               <au>
                  <snm>Page</snm>
                  <fnm>RD</fnm>
               </au>
            </aug>
            <source>Comput Appl Biosci</source>
            <pubdate>1996</pubdate>
            <volume>12</volume>
            <fpage>357</fpage>
            <lpage>358</lpage>
            <xrefbib>
               <pubid idtype="pmpid">8902363</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B70">
            <title>
               <p>WU-BLAST</p>
            </title>
            <url>http://blast.wustl.edu</url>
         </bibl>
         <bibl id="B71">
            <title>
               <p>T-Coffee: A novel method for fast and accurate multiple sequence alignment.</p>
            </title>
            <aug>
               <au>
                  <snm>Notredame</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Higgins</snm>
                  <fnm>DG</fnm>
               </au>
               <au>
                  <snm>Heringa</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>2000</pubdate>
            <volume>302</volume>
            <fpage>205</fpage>
            <lpage>217</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">10964570</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B72">
            <title>
               <p>PAML 4: phylogenetic analysis by maximum likelihood.</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>Z</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2007</pubdate>
            <volume>24</volume>
            <fpage>1586</fpage>
            <lpage>1591</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">17483113</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B73">
            <title>
               <p>PAML: a program package for phylogenetic analysis by maximum likelihood.</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>Z</fnm>
               </au>
            </aug>
            <source>Comput Appl Biosci</source>
            <pubdate>1997</pubdate>
            <volume>13</volume>
            <fpage>555</fpage>
            <lpage>556</lpage>
            <xrefbib>
               <pubid idtype="pmpid">9367129</pubid>
            </xrefbib>
         </bibl>
      </refgrp>
   </bm>
</art>
