<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1471-2164-8-330</ui>
   <ji>1471-2164</ji>
   <fm>
      <dochead>Research article</dochead>
      <bibl>
         <title>
            <p>Gene duplication and paleopolyploidy in soybean and the implications for whole genome sequencing</p>
         </title>
         <aug>
            <au id="A1">
               <snm>Schlueter</snm>
               <mi>A</mi>
               <fnm>Jessica</fnm>
               <insr iid="I1"/>
               <email>acissej@purdue.edu</email>
            </au>
            <au id="A2">
               <snm>Lin</snm>
               <fnm>Jer-Young</fnm>
               <insr iid="I2"/>
               <email>lin51@purdue.edu</email>
            </au>
            <au id="A3">
               <snm>Schlueter</snm>
               <mi>D</mi>
               <fnm>Shannon</fnm>
               <insr iid="I1"/>
               <email>sds@purdue.edu</email>
            </au>
            <au id="A4">
               <snm>Vasylenko-Sanders</snm>
               <mi>F</mi>
               <fnm>Iryna</fnm>
               <insr iid="I3"/>
               <email>Iryna.F.Sanders-1@ou.edu</email>
            </au>
            <au id="A5">
               <snm>Deshpande</snm>
               <fnm>Shweta</fnm>
               <insr iid="I3"/>
               <email>shweta@ou.edu</email>
            </au>
            <au id="A6">
               <snm>Yi</snm>
               <fnm>Jing</fnm>
               <insr iid="I3"/>
               <email>Jing.Yi-1@ou.edu</email>
            </au>
            <au id="A7">
               <snm>O'Bleness</snm>
               <fnm>Majesta</fnm>
               <insr iid="I3"/>
               <email>stardust@ou.edu</email>
            </au>
            <au id="A8">
               <snm>Roe</snm>
               <mi>A</mi>
               <fnm>Bruce</fnm>
               <insr iid="I3"/>
               <email>broe@ou.edu</email>
            </au>
            <au id="A9">
               <snm>Nelson</snm>
               <mi>T</mi>
               <fnm>Rex</fnm>
               <insr iid="I4"/>
               <email>nelsonrt@iastate.edu</email>
            </au>
            <au id="A10">
               <snm>Scheffler</snm>
               <mi>E</mi>
               <fnm>Brian</fnm>
               <insr iid="I5"/>
               <email>bscheffler@msa-stoneville.ars.usda.gov</email>
            </au>
            <au id="A11">
               <snm>Jackson</snm>
               <mi>A</mi>
               <fnm>Scott</fnm>
               <insr iid="I1"/>
               <email>sjackson@purdue.edu</email>
            </au>
            <au id="A12" ca="yes">
               <snm>Shoemaker</snm>
               <mi>C</mi>
               <fnm>Randy</fnm>
               <insr iid="I4"/>
               <email>rcsshoe@iastate.edu</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Department of Agronomy, Purdue University, West Lafayette, IN 47907, USA</p>
            </ins>
            <ins id="I2">
               <p>Purdue Genetics Program, Purdue University, West Lafayette, IN 47907, USA</p>
            </ins>
            <ins id="I3">
               <p>Department of Chemistry and Biochemistry, University of Oklahoma, Norman, OK 73019, USA</p>
            </ins>
            <ins id="I4">
               <p>USDA-ARS, Corn Insect and Crop Genetics Research Unit, and Department of Agronomy, Iowa State University, Ames, IA 50011, USA</p>
            </ins>
            <ins id="I5">
               <p>USDA-ARS-MSA Genomics Laboratory, Stoneville, MS 38776, USA</p>
            </ins>
         </insg>
         <source>BMC Genomics</source>
         <issn>1471-2164</issn>
         <pubdate>2007</pubdate>
         <volume>8</volume>
         <issue>1</issue>
         <fpage>330</fpage>
         <url>http://www.biomedcentral.com/1471-2164/8/330</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">17880721</pubid>
               <pubid idtype="doi">10.1186/1471-2164-8-330</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>09</day>
               <month>2</month>
               <year>2007</year>
            </date>
         </rec>
         <acc>
            <date>
               <day>19</day>
               <month>9</month>
               <year>2007</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>19</day>
               <month>9</month>
               <year>2007</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2007</year>
         <collab>Schlueter et al; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>Soybean, <it>Glycine max </it>(L.) Merr., is a well documented paleopolyploid. What remains relatively under characterized is the level of sequence identity in retained homeologous regions of the genome. Recently, the Department of Energy Joint Genome Institute and United States Department of Agriculture jointly announced the sequencing of the soybean genome. One of the initial concerns is what effect sequence identity in homeologous regions would have on whole genome shotgun sequence assembly.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>Seventeen BACs representing ~2.03 Mb were sequenced as representative potential homeologous regions from the soybean genome. Genetic mapping of each BAC shows that 11 of the 20 chromosomes are represented. Sequence comparisons between homeologous BACs show that the soybean genome is a mosaic of retained paleopolyploid regions. Some regions appear to be highly conserved while other regions have diverged significantly. Large-scale "batch" reassembly of all 17 BACs combined showed that even the most homeologous BACs with upwards of 95% sequence identity resolve into their respective homeologous sequences. Potential assembly errors were generated by tandemly duplicated pentatricopeptide repeat containing genes and long simple sequence repeats. Analysis of a whole-genome shotgun assembly of 80,000 randomly chosen JGI-DOE sequence traces reveals some new soybean-specific repeat sequences.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>This analysis investigated both the structure of the paleopolyploid soybean genome and the potential effects retained homeology will have on assembling the whole genome shotgun sequence. Based upon these results, homeologous regions similar to those characterized here will not cause major assembly issues.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>The vast majority of flowering plants likely have a polyploid origin <abbrgrp><abbr bid="B1">1</abbr><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr></abbrgrp>. The homeologous chromosomal regions resulting from these large-scale duplication events are subject to a wide range of structural changes including accumulation of indels <abbrgrp><abbr bid="B4">4</abbr><abbr bid="B5">5</abbr></abbrgrp>, illegitimate recombination <abbrgrp><abbr bid="B6">6</abbr><abbr bid="B7">7</abbr></abbrgrp>, gene loss, rearrangements, gene duplications and nucleotide divergence <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. In addition, they are also subject to gene conservation <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. Analyses of homeologous regions in maize provide clear evidence of fractionation following duplication <abbrgrp><abbr bid="B5">5</abbr><abbr bid="B7">7</abbr><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr></abbrgrp>. However, this is not clearly the case for cotton. An analysis of homologous regions in cotton found extensive genic and intergenic conservation with differences found only in transposable elements and small indels <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>.</p>
         <p>Soybean (<it>Glycine max </it>(L.) Merr.) was characterized early as an ancient polyploid through genetic mapping studies that identified homeologous chromosome regions based upon duplicate RFLP markers <abbrgrp><abbr bid="B12">12</abbr><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr></abbrgrp>. In addition to mapping studies, analysis of BAC-end sequences has suggested that the retained duplicate regions of the soybean genome still share sequence homeology <abbrgrp><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr></abbrgrp>. Similarly, hybridization based approaches showed fairly extensive sequence identity between RFLP anchored paralogous BACs <abbrgrp><abbr bid="B17">17</abbr><abbr bid="B18">18</abbr></abbrgrp>. Approximately 275 duplicate genes were identified in the soybean EST collections and estimates of synonymous distances between gene pairs suggested that soybean has undergone at least two rounds of large-scale duplication at approximately 14 and 42 million years ago (Mya)<abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr></abbrgrp>. Although the origin of the duplications giving rise to homeologous genes is difficult to determine <abbrgrp><abbr bid="B21">21</abbr></abbrgrp> it was assumed that they arose through large-scale duplication events such as polyploidy. Cytogenetic studies have shown that the 'diploid' <it>Glycine </it>have 2n = 40 chromosomes while other papilionoids have 2n = 10 or 11 suggesting at least one large-scale genome duplication <abbrgrp><abbr bid="B22">22</abbr></abbrgrp>. In addition, segmental duplications in soybean were observed using fluorescence in situ hybridization (FISH)<abbrgrp><abbr bid="B23">23</abbr></abbrgrp> and a more recent FISH analysis reveals near chromosomal-level homeology along chromosome 19 (linkage group L) and another unidentified chromosome, with only a few instances of disrupted colinearity <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>.</p>
         <p>Limited sequence comparisons have been conducted from homeologous regions of the soybean genome. Schlueter et al. <abbrgrp><abbr bid="B25">25</abbr></abbrgrp> compared BAC sequences containing &#969;-6 fatty acid desaturase (FAD2) genes and found extensive gene conservation in both order and orientation between two BACs from homeologous regions with only one large inversion to distinguish their structures. Another study involving homeologous regions containing an N-hydroxycinnamoyl/benzoyltransferase (HCBT) gene cluster gave similar results with nucleotide identity between most genes upwards of 95% <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. These high levels of sequence identity between homeologous regions have been suggested as a potential source of error during whole genome shotgun sequence assembly in a paleopolyploid species.</p>
         <p>Recently, the DOE-JGI and the USDA jointly announced that the soybean genome was to be sequenced through a whole-genome shotgun (WGS) approach <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>. Since little is known about the structure, organization, similarity and full extent of the duplications within the soybean genome, questions remain about the efficacy of a resulting assembly of these sequences. In this study, we identified, sequenced and characterized 11 BAC clones representing 5 distinct homeologous regions of the genome. In addition, 6 BACs previously characterized for homeology were included <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B25">25</abbr></abbrgrp> in the assembly analysis for a total of 17 BAC clones representing 7 homeologous soybean genomic regions. This collection of BACs was identified as containing genes that anchor potential homeologous regions of the genome. Duplicate genes were identified from ESTs by using TBLASTX and building contigs as previously described <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. Each new "anchor gene" was chosen due to a related role in seed development of soybean. Duplicate BACs were sequenced and analyzed to determine the amount of genic homeology. In addition, the ability to distinguish homeologous sequences as will be expected for assembly of WGS was evaluated by merging sequence traces for all 17 BACs and reassembling with varying parameters. Each assembly was evaluated against the original individual BAC assemblies. Our results indicate that the paleopolyploid soybean genome is a mosaic of homeologous sequences ranging from instances of high gene conservation to regions with extremely limited conservation. Except for tandem duplications and long simple sequence repeats, adequate nucleotide differences exist between even the most conserved homeologous regions to completely distinguish them during sequence assembly.</p>
      </sec>
      <sec>
         <st>
            <p>Results</p>
         </st>
         <sec>
            <st>
               <p>Duplicate soybean BACs: sequencing, assembly and homeology</p>
            </st>
            <p>Shotgun sequencing of 17 soybean BACs selected for containing retained duplicate loci yielded a total of 36,873 sequence traces and a total of 2,028,159 bp of assembled soybean genomic sequence (Table <tblr tid="T1">1</tblr>). Six BACs (768,449 bp) have previously been shown to represent homeologous regions of the soybean genome anchored by either N-hydroxycinnamoyl/benzoyltransferase genes (HCBT; gmw1-74i13 and gmw1-52d3; <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>) or &#969;-6 fatty acid desaturase genes (FAD2; gmw1-105h23, gmw1-15k6, gmw1-11j16, gmw1-45m6; <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>). The 11 additional sequenced BACs were anchored by either RFLP clones (A711; UMb001-24d13 and Umb001-5f5) or by the duplicate transcripts cellulose synthase (gmw2-133d1 and gmw1-93l19), galactinol synthase (gmw1-5g16 and gmw1-103e11), raffinose synthase (gmw1-13o17 and gmw1-8g7) and caffeoyl-CoA O-methyltransferase (gmw1-58k3, gmw1-57d24 and gmw1-27d20). To date, this is the largest analysis of homeologous regions from the soybean genome. Although most of the BACs were sequenced to completion (phase III), seven remaining BACs contained a small number of ordered contigs with fewer than three gaps (phase II) and one BAC (gmw1-27d20) was phase I with five ordered contigs (Table <tblr tid="T1">1</tblr>).</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>General BAC information</p>
               </caption>
               <tblbdy cols="12">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>Ratio<sup>e </sup>of</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="12">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>BAC</p>
                     </c>
                     <c ca="center">
                        <p>Linkage group</p>
                     </c>
                     <c ca="center">
                        <p>Genbank accession</p>
                     </c>
                     <c ca="center">
                        <p>SNP ID<sup>b</sup></p>
                     </c>
                     <c ca="center">
                        <p>Length (bp)</p>
                     </c>
                     <c ca="center">
                        <p>Phase</p>
                     </c>
                     <c ca="center">
                        <p>Gap</p>
                     </c>
                     <c ca="center">
                        <p>ORFs<sup>c</sup></p>
                     </c>
                     <c ca="center">
                        <p>Average<sup>d </sup>EST coverage</p>
                     </c>
                     <c ca="center">
                        <p>EST- based coverage</p>
                     </c>
                     <c ca="center">
                        <p>Overall gene homeology<sup>f</sup></p>
                     </c>
                     <c ca="center">
                        <p>Gene density<sup>g</sup></p>
                     </c>
                  </r>
                  <r>
                     <c cspan="12">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw2-133d1</p>
                     </c>
                     <c ca="center">
                        <p>F</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC158503">AC158503</ext-link>
                        </p>
                     </c>
                     <c ca="center">
                        <p>8001</p>
                     </c>
                     <c ca="center">
                        <p>117591</p>
                     </c>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>13</p>
                     </c>
                     <c ca="center">
                        <p>32.6</p>
                     </c>
                     <c ca="center">
                        <p>38.2</p>
                     </c>
                     <c ca="center">
                        <p>3 of 13</p>
                     </c>
                     <c ca="center">
                        <p>1/9.05</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-93l19</p>
                     </c>
                     <c ca="center">
                        <p>M</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC166092">AC166092</ext-link>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>51037</p>
                     </c>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>62.4</p>
                     </c>
                     <c ca="center">
                        <p>50.5</p>
                     </c>
                     <c ca="center">
                        <p>3 of 5</p>
                     </c>
                     <c ca="center">
                        <p>1/10.2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-105h23</p>
                     </c>
                     <c ca="center">
                        <p>O</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC187294">AC187294</ext-link>
                        </p>
                     </c>
                     <c ca="center">
                        <p>30491</p>
                     </c>
                     <c ca="center">
                        <p>134287</p>
                     </c>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>18</p>
                     </c>
                     <c ca="center">
                        <p>82.0</p>
                     </c>
                     <c ca="center">
                        <p>76.4</p>
                     </c>
                     <c ca="center">
                        <p>18 of 18</p>
                     </c>
                     <c ca="center">
                        <p>1/7.46</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-15k6</p>
                     </c>
                     <c ca="center">
                        <p>I</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC160454">AC160454</ext-link>
                        </p>
                     </c>
                     <c ca="center">
                        <p>26051</p>
                     </c>
                     <c ca="center">
                        <p>148858</p>
                     </c>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>22</p>
                     </c>
                     <c ca="center">
                        <p>77.0</p>
                     </c>
                     <c ca="center">
                        <p>71.1</p>
                     </c>
                     <c ca="center">
                        <p>18 of 22</p>
                     </c>
                     <c ca="center">
                        <p>1/6.77</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-11j16</p>
                     </c>
                     <c ca="center">
                        <p>L</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC166091">AC166091</ext-link>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>69947</p>
                     </c>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>82.2</p>
                     </c>
                     <c ca="center">
                        <p>83.0</p>
                     </c>
                     <c ca="center">
                        <p>2 of 9</p>
                     </c>
                     <c ca="center">
                        <p>1/7.77</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-45m6</p>
                     </c>
                     <c ca="center">
                        <p>
                           <sup>a</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC166742">AC166742</ext-link>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>143028</p>
                     </c>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>53.6</p>
                     </c>
                     <c ca="center">
                        <p>53.0</p>
                     </c>
                     <c ca="center">
                        <p>1 of 7</p>
                     </c>
                     <c ca="center">
                        <p>1/20.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-5g16</p>
                     </c>
                     <c ca="center">
                        <p>O</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC169184">AC169184</ext-link>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>115953</p>
                     </c>
                     <c ca="center">
                        <p>II</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>11</p>
                     </c>
                     <c ca="center">
                        <p>74.0</p>
                     </c>
                     <c ca="center">
                        <p>68.8</p>
                     </c>
                     <c ca="center">
                        <p>4 of 11</p>
                     </c>
                     <c ca="center">
                        <p>1/9.66</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-103e11</p>
                     </c>
                     <c ca="center">
                        <p>I</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC166090">AC166090</ext-link>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>89397</p>
                     </c>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>12</p>
                     </c>
                     <c ca="center">
                        <p>78.6</p>
                     </c>
                     <c ca="center">
                        <p>81.3</p>
                     </c>
                     <c ca="center">
                        <p>4 of 12</p>
                     </c>
                     <c ca="center">
                        <p>1/7.45</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-58k3</p>
                     </c>
                     <c ca="center">
                        <p>O</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC185959">AC185959</ext-link>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>177331</p>
                     </c>
                     <c ca="center">
                        <p>II</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>50.7</p>
                     </c>
                     <c ca="center">
                        <p>47.5</p>
                     </c>
                     <c ca="center">
                        <p>3 of 8</p>
                     </c>
                     <c ca="center">
                        <p>1/22.2</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-57d24</p>
                     </c>
                     <c ca="center">
                        <p>D1a</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC170860">AC170860</ext-link>
                        </p>
                     </c>
                     <c ca="center">
                        <p>20113</p>
                     </c>
                     <c ca="center">
                        <p>162359</p>
                     </c>
                     <c ca="center">
                        <p>II</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>19</p>
                     </c>
                     <c ca="center">
                        <p>75.0</p>
                     </c>
                     <c ca="center">
                        <p>71.5</p>
                     </c>
                     <c ca="center">
                        <p>3 of 19</p>
                     </c>
                     <c ca="center">
                        <p>1/9.02</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-27d20</p>
                     </c>
                     <c ca="center">
                        <p>D1b</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC173959">AC173959</ext-link>
                        </p>
                     </c>
                     <c ca="center">
                        <p>16079</p>
                     </c>
                     <c ca="center">
                        <p>227022</p>
                     </c>
                     <c ca="center">
                        <p>I</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>24</p>
                     </c>
                     <c ca="center">
                        <p>65.4</p>
                     </c>
                     <c ca="center">
                        <p>61.9</p>
                     </c>
                     <c ca="center">
                        <p>3 of 24</p>
                     </c>
                     <c ca="center">
                        <p>1/9.46</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-74i13</p>
                     </c>
                     <c ca="center">
                        <p>C1</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="DQ336954">DQ336954</ext-link>
                        </p>
                     </c>
                     <c ca="center">
                        <p>5981</p>
                     </c>
                     <c ca="center">
                        <p>173654</p>
                     </c>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>18</p>
                     </c>
                     <c ca="center">
                        <p>68.3</p>
                     </c>
                     <c ca="center">
                        <p>70.4</p>
                     </c>
                     <c ca="center">
                        <p>13 of 18</p>
                     </c>
                     <c ca="center">
                        <p>1/9.65</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-52d3</p>
                     </c>
                     <c ca="center">
                        <p>C2</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="DQ336955">DQ336955</ext-link>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>98675</p>
                     </c>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>10</p>
                     </c>
                     <c ca="center">
                        <p>59.2</p>
                     </c>
                     <c ca="center">
                        <p>62.1</p>
                     </c>
                     <c ca="center">
                        <p>9 of 10</p>
                     </c>
                     <c ca="center">
                        <p>1/9.87</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-13o17</p>
                     </c>
                     <c ca="center">
                        <p>D1a</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC196857">AC196857</ext-link>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>89030</p>
                     </c>
                     <c ca="center">
                        <p>II</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>41.5</p>
                     </c>
                     <c ca="center">
                        <p>48.0</p>
                     </c>
                     <c ca="center">
                        <p>1 of 9</p>
                     </c>
                     <c ca="center">
                        <p>1/11.1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-8g7</p>
                     </c>
                     <c ca="center">
                        <p>
                           <sup>a</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="AC196858">AC196858</ext-link>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>53292</p>
                     </c>
                     <c ca="center">
                        <p>III</p>
                     </c>
                     <c ca="center">
                        <p>0</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>32.6</p>
                     </c>
                     <c ca="center">
                        <p>30.7</p>
                     </c>
                     <c ca="center">
                        <p>1 of 4</p>
                     </c>
                     <c ca="center">
                        <p>1/13.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>UMb001-24d13</p>
                     </c>
                     <c ca="center">
                        <p>E</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="DQ347960">DQ347960</ext-link>
                        </p>
                     </c>
                     <c ca="center">
                        <p>13567</p>
                     </c>
                     <c ca="center">
                        <p>111223</p>
                     </c>
                     <c ca="center">
                        <p>II</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>84.0</p>
                     </c>
                     <c ca="center">
                        <p>79.3</p>
                     </c>
                     <c ca="center">
                        <p>3 of 8</p>
                     </c>
                     <c ca="center">
                        <p>1/13.9</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>UMb001-5f5</p>
                     </c>
                     <c ca="center">
                        <p>A2</p>
                     </c>
                     <c ca="center">
                        <p>
                           <ext-link ext-link-type="gen" ext-link-id="DQ347961">DQ347961</ext-link>
                        </p>
                     </c>
                     <c ca="center">
                        <p>42937</p>
                     </c>
                     <c ca="center">
                        <p>65475</p>
                     </c>
                     <c ca="center">
                        <p>II</p>
                     </c>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>91.9</p>
                     </c>
                     <c ca="center">
                        <p>94.6</p>
                     </c>
                     <c ca="center">
                        <p>3 of 5</p>
                     </c>
                     <c ca="center">
                        <p>1/10.9</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Average</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>119303</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                     <c ca="center">
                        <p>59.1</p>
                     </c>
                     <c ca="center">
                        <p>59.05</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>1/11.1</p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p><sup>a </sup>Unmappable; no polymorphic SSRs identified or any matches of CDS to SNP data</p>
                  <p><sup>b </sup>SNP Ids are taken directly from Choi et al. (2007). The EST sequences from which the SNPs were derived are given in Methods and Materials.</p>
                  <p><sup>c </sup>Does not include ORFs that are alternatively spliced</p>
                  <p><sup>d </sup>An average across the BAC of the number of bp supported by an EST or cDNA divided by the total number of bp for each annotation</p>
                  <p><sup>e </sup>A ratio of the total number of bp on the BAC that are annotated divided by the total number of bases that have EST or cDNA support</p>
                  <p><sup>f </sup>Count is based upon the number of homeologs shared between BACs out of the total number of genes</p>
                  <p><sup>g </sup>Gene density is in 1 gene per X number of kilobases</p>
               </tblfn>
            </tbl>
            <p>With the exception of BACs UMb001-24d13 and UMb001-5f5 that were already mapped by an RFLP marker (A711), all but two of the remaining BACs were mapped by either BLAST-based identity of predicted coding sequence (CDS) to previously mapped transcript-based single nucleotide polymorphisms (SNPs) <abbrgrp><abbr bid="B27">27</abbr></abbrgrp> or simple sequence repeats (SSRs) identified from each BAC sequence. Eight SNP markers were identified. Six of these markers confirmed already known map positions for gmw1-105h23, gmw1-15k6 <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>, gmw1-74i13 <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>, UMb001-24d13, UMb001-5f5 (RFLP marker A711) and gmw2-133d1 (mapped by SSR as described below). The final two SNPs provided map positions for gmw1-57d24 and gmw1-27d20 (Table <tblr tid="T1">1</tblr>). In addition to SNPs, SSRs derived from BACs were identified, tested for polymorphisms and mapped. Only two BACs, gmw1-8g7 and gmw1-45m6, showed no polymorphisms in the mapping population or any matches to mapped transcript-based SNPs <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. Although there are multiple BACs on linkage groups I and O, eleven linkage groups are represented in this analysis (Table <tblr tid="T1">1</tblr>).</p>
            <p>A total of 238 genes were predicted across the ~2.03 Mb of soybean sequence for an average gene density of 1 gene/11.1 Kb (Table <tblr tid="T1">1</tblr>), slightly less than previous estimates <abbrgrp><abbr bid="B28">28</abbr><abbr bid="B29">29</abbr><abbr bid="B8">8</abbr><abbr bid="B25">25</abbr></abbrgrp>. All gene structure predictions as well as the annotations, <it>ab initio </it>predictions and EST-based support for each structure can be viewed at the following website <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>. On average, 59.06% of the predicted gene structures had either EST or cDNA based support, regardless of whether coverage was normalized for gene size (average EST coverage) or not (ratio of EST coverage; Table <tblr tid="T1">1</tblr>).</p>
            <p>Levels of gene conservation between BACs varied from being gene for gene in both order and orientation, with the exception of an eight-gene block inversion, for BACs gmw1-15k6 and gmw1-105h23 <abbrgrp><abbr bid="B25">25</abbr></abbrgrp> to very weak homeology anchored by only a single gene (gmw1-13o17 and gmw1-8g7; Table <tblr tid="T1">1</tblr>; Figure <figr fid="F1">1</figr>). While both of these extremes were observed, more often, homeologous BACs showed mid-range homeology; i.e. approximately 25 to 50% of genes in overlapping regions are retained. In those cases, most retained homeologs had 90% or greater sequence identity (Table <tblr tid="T2">2</tblr>) with a few extremes. The average nucleotide identity between homeologs ranged from 53.7 to 97.4% with an average of 86.6% while average protein similarity ranged from 53.3 to 99.0% with an average of 88.8% (Table <tblr tid="T2">2</tblr>). It should be noted that when homeologs were also tandemly duplicated on a BAC, they were not included in these estimates due to the inability to accurately determine which gene copy was the true ancestral homeolog between BACs.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>Duplicate gene homeology/paralogy between BAC pairs</p>
               </caption>
               <tblbdy cols="10">
                  <r>
                     <c ca="left">
                        <p>BAC homeologs</p>
                     </c>
                     <c ca="center">
                        <p>Putative function</p>
                     </c>
                     <c ca="center">
                        <p># of exons</p>
                     </c>
                     <c ca="center">
                        <p>Coding length<sup>a</sup></p>
                     </c>
                     <c ca="center">
                        <p>Nucleotide identity</p>
                     </c>
                     <c ca="center">
                        <p>Protein identity</p>
                     </c>
                     <c ca="center">
                        <p>Protein similarity</p>
                     </c>
                     <c ca="center">
                        <p>Ks</p>
                     </c>
                     <c ca="center">
                        <p>Ka</p>
                     </c>
                     <c ca="center">
                        <p>Date (Mya)</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-74i13 gmw1-52d3</p>
                     </c>
                     <c ca="center">
                        <p>
                           <sup>b</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <sup>b</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <sup>b</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>89.8</p>
                     </c>
                     <c ca="center">
                        <p>88.0</p>
                     </c>
                     <c ca="center">
                        <p>90.7</p>
                     </c>
                     <c ca="center">
                        <p>0.1490</p>
                     </c>
                     <c ca="center">
                        <p>0.0335</p>
                     </c>
                     <c ca="center">
                        <p>12.2</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-105h23 gmw1-15k6</p>
                     </c>
                     <c ca="center">
                        <p>
                           <sup>d</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <sup>d</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <sup>d</sup>
                        </p>
                     </c>
                     <c ca="center">
                        <p>90.7</p>
                     </c>
                     <c ca="center">
                        <p>88.9</p>
                     </c>
                     <c ca="center">
                        <p>90.4</p>
                     </c>
                     <c ca="center">
                        <p>0.1061</p>
                     </c>
                     <c ca="center">
                        <p>0.0326</p>
                     </c>
                     <c ca="center">
                        <p>8.70</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>UMb001-24d13</p>
                     </c>
                     <c ca="center">
                        <p>DNA binding</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>1338</p>
                     </c>
                     <c ca="center">
                        <p>92.7</p>
                     </c>
                     <c ca="center">
                        <p>88.7</p>
                     </c>
                     <c ca="center">
                        <p>92.2</p>
                     </c>
                     <c ca="center">
                        <p>0.1177</p>
                     </c>
                     <c ca="center">
                        <p>0.0468</p>
                     </c>
                     <c ca="center">
                        <p>9.65</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>UMb001-5f5</p>
                     </c>
                     <c ca="center">
                        <p>DNA binding</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>1473</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>UMb001-24d13</p>
                     </c>
                     <c ca="center">
                        <p>Gamma response I</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>987</p>
                     </c>
                     <c ca="center">
                        <p>95.9</p>
                     </c>
                     <c ca="center">
                        <p>95.7</p>
                     </c>
                     <c ca="center">
                        <p>96.3</p>
                     </c>
                     <c ca="center">
                        <p>0.1405</p>
                     </c>
                     <c ca="center">
                        <p>0.0152</p>
                     </c>
                     <c ca="center">
                        <p>11.52</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>UMb001-5f5</p>
                     </c>
                     <c ca="center">
                        <p>Gamma response I</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>984</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>UMb001-24d13</p>
                     </c>
                     <c ca="center">
                        <p>Selenium binding</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>1881</p>
                     </c>
                     <c ca="center">
                        <p>56.3</p>
                     </c>
                     <c ca="center">
                        <p>54.6</p>
                     </c>
                     <c ca="center">
                        <p>56.4</p>
                     </c>
                     <c ca="center">
                        <p>0.1709</p>
                     </c>
                     <c ca="center">
                        <p>0.0575</p>
                     </c>
                     <c ca="center">
                        <p>14.01</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>UMb001-5f5</p>
                     </c>
                     <c ca="center">
                        <p>Selenium binding</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>585</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-103e11</p>
                     </c>
                     <c ca="center">
                        <p><it>A. thaliana</it>-like NAP</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>510</p>
                     </c>
                     <c ca="center">
                        <p>96.4</p>
                     </c>
                     <c ca="center">
                        <p>95.8</p>
                     </c>
                     <c ca="center">
                        <p>97.2</p>
                     </c>
                     <c ca="center">
                        <p>0.0933</p>
                     </c>
                     <c ca="center">
                        <p>0.0188</p>
                     </c>
                     <c ca="center">
                        <p>7.65</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-5g16</p>
                     </c>
                     <c ca="center">
                        <p><it>A. thaliana</it>-like NAP</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>1002</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-103e11</p>
                     </c>
                     <c ca="center">
                        <p>Beta-fructofuranosidase</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>1944</p>
                     </c>
                     <c ca="center">
                        <p>94.4</p>
                     </c>
                     <c ca="center">
                        <p>92.7</p>
                     </c>
                     <c ca="center">
                        <p>94.1</p>
                     </c>
                     <c ca="center">
                        <p>0.0716</p>
                     </c>
                     <c ca="center">
                        <p>0.0276</p>
                     </c>
                     <c ca="center">
                        <p>5.87</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-5g16</p>
                     </c>
                     <c ca="center">
                        <p>Beta-fructofuranosidase</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>1956</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-103e11</p>
                     </c>
                     <c ca="center">
                        <p>Galactinol synthase</p>
                     </c>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>732</p>
                     </c>
                     <c ca="center">
                        <p>90.5</p>
                     </c>
                     <c ca="center">
                        <p>93.5</p>
                     </c>
                     <c ca="center">
                        <p>94.7</p>
                     </c>
                     <c ca="center">
                        <p>0.3208</p>
                     </c>
                     <c ca="center">
                        <p>0.0316</p>
                     </c>
                     <c ca="center">
                        <p>26.30</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-5g16</p>
                     </c>
                     <c ca="center">
                        <p>Galactinol synthase</p>
                     </c>
                     <c ca="center">
                        <p>3/4</p>
                     </c>
                     <c ca="center">
                        <p>669/987</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-103e11</p>
                     </c>
                     <c ca="center">
                        <p>RAD-like protein</p>
                     </c>
                     <c ca="center">
                        <p>6/7</p>
                     </c>
                     <c ca="center">
                        <p>564/900</p>
                     </c>
                     <c ca="center">
                        <p>96.9</p>
                     </c>
                     <c ca="center">
                        <p>92.9</p>
                     </c>
                     <c ca="center">
                        <p>97.6</p>
                     </c>
                     <c ca="center">
                        <p>0.0432</p>
                     </c>
                     <c ca="center">
                        <p>0.0442</p>
                     </c>
                     <c ca="center">
                        <p>3.54</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-5g16</p>
                     </c>
                     <c ca="center">
                        <p>RAD-like protein</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>240</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw2-133d1</p>
                     </c>
                     <c ca="center">
                        <p>GTPase</p>
                     </c>
                     <c ca="center">
                        <p>14</p>
                     </c>
                     <c ca="center">
                        <p>3183</p>
                     </c>
                     <c ca="center">
                        <p>96.9</p>
                     </c>
                     <c ca="center">
                        <p>98.1</p>
                     </c>
                     <c ca="center">
                        <p>99.1</p>
                     </c>
                     <c ca="center">
                        <p>0.1055</p>
                     </c>
                     <c ca="center">
                        <p>0.0084</p>
                     </c>
                     <c ca="center">
                        <p>8.65</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-93l19</p>
                     </c>
                     <c ca="center">
                        <p>GTPase</p>
                     </c>
                     <c ca="center">
                        <p>16</p>
                     </c>
                     <c ca="center">
                        <p>3480</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw2-133d1</p>
                     </c>
                     <c ca="center">
                        <p>Cellulose synthase</p>
                     </c>
                     <c ca="center">
                        <p>9</p>
                     </c>
                     <c ca="center">
                        <p>2211</p>
                     </c>
                     <c ca="center">
                        <p>67.6</p>
                     </c>
                     <c ca="center">
                        <p>65.1</p>
                     </c>
                     <c ca="center">
                        <p>67.0</p>
                     </c>
                     <c ca="center">
                        <p>0.1109</p>
                     </c>
                     <c ca="center">
                        <p>0.0438</p>
                     </c>
                     <c ca="center">
                        <p>9.09</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-93l19</p>
                     </c>
                     <c ca="center">
                        <p>Cellulose synthase</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>924</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw2-133d1</p>
                     </c>
                     <c ca="center">
                        <p>Chain A protein</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1608</p>
                     </c>
                     <c ca="center">
                        <p>81.1</p>
                     </c>
                     <c ca="center">
                        <p>76.4</p>
                     </c>
                     <c ca="center">
                        <p>80.1</p>
                     </c>
                     <c ca="center">
                        <p>0.1856</p>
                     </c>
                     <c ca="center">
                        <p>0.077</p>
                     </c>
                     <c ca="center">
                        <p>15.21</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-93l19</p>
                     </c>
                     <c ca="center">
                        <p>Chain A protein</p>
                     </c>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>1452</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-13o17</p>
                     </c>
                     <c ca="center">
                        <p>Raffinose synthase</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>2277</p>
                     </c>
                     <c ca="center">
                        <p>66.4</p>
                     </c>
                     <c ca="center">
                        <p>71.5</p>
                     </c>
                     <c ca="center">
                        <p>81.5</p>
                     </c>
                     <c ca="center">
                        <p>2.5495</p>
                     </c>
                     <c ca="center">
                        <p>0.2051</p>
                     </c>
                     <c ca="center">
                        <p>208.98</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-8g7</p>
                     </c>
                     <c ca="center">
                        <p>Raffinose synthase</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>2190</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-57d24</p>
                     </c>
                     <c ca="center">
                        <p>Phospholipase C</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>1308</p>
                     </c>
                     <c ca="center">
                        <p>80.5</p>
                     </c>
                     <c ca="center">
                        <p>78.7</p>
                     </c>
                     <c ca="center">
                        <p>87.6</p>
                     </c>
                     <c ca="center">
                        <p>0.5457</p>
                     </c>
                     <c ca="center">
                        <p>0.114</p>
                     </c>
                     <c ca="center">
                        <p>44.73</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-58k3</p>
                     </c>
                     <c ca="center">
                        <p>Phospholipase C</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>1299</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-57d24</p>
                     </c>
                     <c ca="center">
                        <p>COMT</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>747</p>
                     </c>
                     <c ca="center">
                        <p>79.7</p>
                     </c>
                     <c ca="center">
                        <p>79.0</p>
                     </c>
                     <c ca="center">
                        <p>88.3</p>
                     </c>
                     <c ca="center">
                        <p>0.6442</p>
                     </c>
                     <c ca="center">
                        <p>0.1204</p>
                     </c>
                     <c ca="center">
                        <p>52.80</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-58k3</p>
                     </c>
                     <c ca="center">
                        <p>COMT</p>
                     </c>
                     <c ca="center">
                        <p>4/5</p>
                     </c>
                     <c ca="center">
                        <p>615/354</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-58k3</p>
                     </c>
                     <c ca="center">
                        <p>COMT</p>
                     </c>
                     <c ca="center">
                        <p>4/5</p>
                     </c>
                     <c ca="center">
                        <p>615/354</p>
                     </c>
                     <c ca="center">
                        <p>73.6</p>
                     </c>
                     <c ca="center">
                        <p>76.3</p>
                     </c>
                     <c ca="center">
                        <p>87.7</p>
                     </c>
                     <c ca="center">
                        <p>1.7076</p>
                     </c>
                     <c ca="center">
                        <p>0.1667</p>
                     </c>
                     <c ca="center">
                        <p>139.97</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-27d20</p>
                     </c>
                     <c ca="center">
                        <p>COMT</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>744</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-58k3</p>
                     </c>
                     <c ca="center">
                        <p>Otubain</p>
                     </c>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>1992</p>
                     </c>
                     <c ca="center">
                        <p>53.7</p>
                     </c>
                     <c ca="center">
                        <p>42.5</p>
                     </c>
                     <c ca="center">
                        <p>53.3</p>
                     </c>
                     <c ca="center">
                        <p>4.024</p>
                     </c>
                     <c ca="center">
                        <p>0.3023</p>
                     </c>
                     <c ca="center">
                        <p>329.84</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-27d20</p>
                     </c>
                     <c ca="center">
                        <p>Otubain</p>
                     </c>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>1860</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-57d24</p>
                     </c>
                     <c ca="center">
                        <p>CBS</p>
                     </c>
                     <c ca="center">
                        <p>6/8</p>
                     </c>
                     <c ca="center">
                        <p>399/687</p>
                     </c>
                     <c ca="center">
                        <p>74.9</p>
                     </c>
                     <c ca="center">
                        <p>73.7</p>
                     </c>
                     <c ca="center">
                        <p>89.5</p>
                     </c>
                     <c ca="center">
                        <p>2.0095</p>
                     </c>
                     <c ca="center">
                        <p>0.1562</p>
                     </c>
                     <c ca="center">
                        <p>164.71</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-27d20</p>
                     </c>
                     <c ca="center">
                        <p>CBS</p>
                     </c>
                     <c ca="center">
                        <p>8</p>
                     </c>
                     <c ca="center">
                        <p>678</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-57d24</p>
                     </c>
                     <c ca="center">
                        <p>COMT</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>747</p>
                     </c>
                     <c ca="center">
                        <p>74.1</p>
                     </c>
                     <c ca="center">
                        <p>81.6</p>
                     </c>
                     <c ca="center">
                        <p>91.0</p>
                     </c>
                     <c ca="center">
                        <p>1.5875</p>
                     </c>
                     <c ca="center">
                        <p>0.1196</p>
                     </c>
                     <c ca="center">
                        <p>130.12</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>gmw1-27d20</p>
                     </c>
                     <c ca="center">
                        <p>COMT</p>
                     </c>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>744</p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
                  <r>
                     <c cspan="10">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>Average</b>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <b>
                              <it>86.6</it>
                           </b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>
                              <it>85.4</it>
                           </b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>
                              <it>88.8</it>
                           </b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>
                              <it>0.4239</it>
                           </b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>
                              <it>0.0577</it>
                           </b>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <b>
                              <it>34.75</it>
                           </b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <it>Recalculated average 1</it>
                           <sup>d</sup>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <it>89.8</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>88.2</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>90.1</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.1179</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.0341</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>9.665</it>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <it>Recalculated average 2</it>
                           <sup>e</sup>
                        </p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c ca="center">
                        <p>
                           <it>71.8</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>71.9</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>82.7</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>1.8668</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>0.1691</it>
                        </p>
                     </c>
                     <c ca="center">
                        <p>
                           <it>153</it>
                        </p>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p><sup>a </sup>Coding length in base pairs based upon CDS (from start to stop not including introns).</p>
                  <p><sup>b </sup>The values for homeologs between gmw1-74i13 and gmw1-52d3 are previously reported (Schlueter et al. 2006). Identity, similarity, Ks, Ka and Dates shown are average across BACs.</p>
                  <p><sup>c </sup>The values for homeologs between gmw1-105h23 and gmw1-15k6 are previously reported (Schlueter et al. 2007). Identity, similarity, Ks, Ka and Dates shown are average across BACs.</p>
                  <p><sup>d </sup>Recalculated average not including the highly divergent homeologs from gmw1-13o17, gmw1-8g7, gmw1-57d24, gmw1-58k3 and gmw1-27d20.</p>
                  <p><sup>e </sup>Recalculated average for just the highly divergent homeologs from gmw1-13o17, gmw1-8g7, gmw1-57d24, gmw1-58k3 and gmw1-27d20.</p>
               </tblfn>
            </tbl>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Summary of genic conservation from putative homeologous BACs in soybean</p>
               </caption>
               <text>
                  <p><b>Summary of genic conservation from putative homeologous BACs in soybean</b>. Duplicate genes from six soybean BACs (3 different pairs) show the range of gene conservation found in the soybean genome. Each block-arrow represents a predicted gene structure. Black arrows are genes with no homeolog. Colored arrows are genes with a homeolog. A heat map for percent nucleotide identity shows the average nucleotide identity between duplicate genes for each conserved homeolog. Gray boxes between structures show homeologous relationships. All gene structure predictions are available online [30]. The first BAC pair has been reprinted with permission from The Plant Genome [19].</p>
               </text>
               <graphic file="1471-2164-8-330-1"/>
            </fig>
            <p>To visualize the level of nucleotide identity between BACs, VISTA plots for BACs anchored by the RFLP A711, cellulose synthase, galactinol synthase, raffinose synthase and caffeoyl-CoA O-methyltransferase (COMT) were generated [see Additional Files <supplr sid="S1">1</supplr>, <supplr sid="S2">2</supplr>, <supplr sid="S3">3</supplr>, <supplr sid="S4">4</supplr>, <supplr sid="S5">5</supplr>]. VISTA identity plots as well as values for nucleotide identity, protein identity and protein similarity for HCBT and FAD2-anchored BACs have been previously reported [8,25 respectively]. Nucleotide identity between BACs is strongest in the coding regions and extends both 5' and 3' from predicted genes before dropping to below 50% between BACs with more duplicate gene conservation <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B25">25</abbr></abbrgrp>. This is likely due to retained non-coding sequences such as promoter elements between homeologous regions. However, as the level of gene conservation drops, so does the nucleotide identity beyond duplicate genes.</p>
            <suppl id="S1">
               <title>
                  <p>Additional file 1</p>
               </title>
               <text>
                  <p><b>Supplemental Figure 1</b>. VISTA identity plot between BACs GM_UMb001_24d13 and GM_UMb001_5f5. Each colored block represents a predicted gene structure from start to stop including introns with gray boxes between genes showing homeologous relationships. The identity plots above and below each BAC structure show the nucleotide identity between each BAC based upon an annotation anchored global-pairwise alignment. The light purple boxes above each VISTA correspond to annotated exon positions. The GM_UMb001-24d13 selenium-binding gene appears shorter due to the coding region being in only exon 1; whereas the coding region of GM_UMb001-5f5 selenium-binding gene includes intronic sequence.</p>
               </text>
               <file name="1471-2164-8-330-S1.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S2">
               <title>
                  <p>Additional file 2</p>
               </title>
               <text>
                  <p><b>Supplemental Figure 2</b>. VISTA identity plot between BACs gmw2-133d1 and gmw1-93l19. Each colored block represents a predicted gene structure from start to stop including introns with gray boxes between genes showing homeologous relationships. The identity plots above and below each BAC structure show the nucleotide identity between each BAC based upon an annotation anchored global-pairwise alignment. The light purple boxes above each VISTA correspond to annotated exon positions.</p>
               </text>
               <file name="1471-2164-8-330-S2.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S3">
               <title>
                  <p>Additional file 3</p>
               </title>
               <text>
                  <p><b>Supplemental Figure 3</b>. VISTA identity plot between BACs gmw1-103e11 and gmw1-5g16. Each colored block represents a predicted gene structure from start to stop including introns with gray boxes between genes showing homeologous relationships. The identity plots above and below each BAC structure show the nucleotide identity between each BAC based upon an annotation anchored global-pairwise alignment. The light purple boxes above each VISTA correspond to annotated exon positions. The gmw1-5g16 RAD1-like gene is truncated relative to the gmw1-103e11 copy by a stop codon in the third exon. Both RAD1-like genes have complete EST support for gene structures. Similarly, the gmw1-5g16 galactinol synthase gene is truncated due to an EST supported alternative splicing event relative to the gmw1-103e11 copy. The gmw1-103e11 <it>A. thaliana</it>-like NAP gene covers only 5 of the 7 predicted exons with almost full EST support whereas the gmw1-5g16 copy covers all 7 exons with 100% EST support.</p>
               </text>
               <file name="1471-2164-8-330-S3.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S4">
               <title>
                  <p>Additional file 4</p>
               </title>
               <text>
                  <p><b>Supplemental Figure 4</b>. VISTA identity plot between BACs gmw1-8g7 and gmw1-13o17. Each colored block represents a predicted gene structure from start to stop including introns with gray boxes between genes showing homeologous relationships. The identity plots above and below each BAC structure show the nucleotide identity between each BAC based upon an annotation anchored global-pairwise alignment. The light purple boxes above each VISTA correspond to annotated exon positions.</p>
               </text>
               <file name="1471-2164-8-330-S4.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <suppl id="S5">
               <title>
                  <p>Additional file 5</p>
               </title>
               <text>
                  <p><b>Supplemental Figure 5</b>. VISTA identity plot between BACs gmw1-57d24 and gmw1-58k3. Each colored block represents a predicted gene structure from start to stop including introns with gray boxes between genes showing homeologous relationships. The identity plots above and below each BAC structure show the nucleotide identity between each BAC based upon an annotation anchored global-pairwise alignment. The light purple boxes above each VISTA correspond to annotated exon positions. A third BAC gmw1-27d20 is shown with homeologs to gmw1-57d24 and gmw1-58k3 but because this BAC is phase I (unordered contigs) no identity plots are shown because the order of the contigs is unknown.</p>
               </text>
               <file name="1471-2164-8-330-S5.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>In a number of cases, homeologs appear to have varying gene lengths such as the selenium-binding protein found on BACs UMb001-24d13 and UMb001-5f5 (Figure <figr fid="F1">1</figr>, third homeolog) [see Additional file <supplr sid="S1">1</supplr>]. The exon number for this gene varies and a stop codon in the first exon of the UMb001-24d13 encoded selenium-binding protein truncates the resulting transcript (Table <tblr tid="T2">2</tblr>). There is however, EST-based support for the mRNA on UMb001-24d13 extending further 3' but the alignment is not a perfect match (92% identity). Other cases of variation in exon number between duplicate genes are observed (Table <tblr tid="T2">2</tblr>). Most of the differences can be accounted for in two ways: 1) <it>ab initio </it>based prediction of gene structures with little to no EST support vary between BACs and/or 2) truncation of one of the predicted genes due to an encoded stop codon. Reliance on <it>ab initio </it>predictions for gene structures combined with the lack of EST-based support can lead to differences between homeologs in exon number. In many cases, even alignment to putative orthologs could not verify the gene structure.</p>
            <p>Synonymous (Ks) and nonsynonymous (Ka) substitutions between all of the duplicate genes were calculated (Table <tblr tid="T2">2</tblr>). The average Ks value was 0.42398 and average Ka value was 0.05775. Again, the Ks and Ka values for HCBT and FAD2 BACs are previously reported <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B25">25</abbr></abbrgrp>. All Ks values gave an average divergence estimate of 34.75 Mya. This value likely is inflated due to the extensive divergence between the duplicate genes identified on gmw1-57d24, gmw1-58k3 and gmw1-27d20 and between raffinose synthase on gmw1-13o17 and gmw1-8g7. When these duplicate genes were excluded from the calculation, the average divergence estimate was 9.665 Mya, similar to previous estimates <abbrgrp><abbr bid="B25">25</abbr></abbrgrp> but still more recent than EST-based estimates <abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr></abbrgrp>. When only the most divergent duplicate genes are used for coalescence estimates, a date of 153 Mya was obtained. Two caveats to divergence estimates should be noted: 1) The Ks values for the most divergent duplicate genes were for the most part well past saturation (greater than 1) and 2) in the most divergent regions, we cannot be certain that we are comparing homeologs and not paralogs (segmental or single gene duplications) without the context of the whole genome or more sequence in these regions. Only two pairs of homeologs showed evidence for positive selection; a ribonuclease HII encoding gene on gmw1-15k6 and gmw1-105h23 with a Ka/Ks ratio of 2.078 <abbrgrp><abbr bid="B25">25</abbr></abbrgrp> and the RAD-like encoding gene from gmw1-103e11 and gmw1-5g16 with a Ka/Ks ratio of 1.023. All other retained homeologs appear to be under purifying selection for retained function.</p>
         </sec>
         <sec>
            <st>
               <p>Reassembly of paleoduplicate regions</p>
            </st>
            <p>To quantify the potential confounding effects of paleopolyploidy on soybean whole-genome shotgun sequence assembly (WGS), all of the sequencing traces for the 17 BACs discussed above were used in large-scale or batch assemblies. The goal was to determine what effect homeology between duplicated regions will have as the soybean genome is reconstructed. Base-calling and assemblies were performed using Phred and Phrap, respectively <abbrgrp><abbr bid="B31">31</abbr><abbr bid="B32">32</abbr><abbr bid="B33">33</abbr></abbrgrp> with default parameters and viewed in Consed <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>.</p>
            <p>To first test if standard assembly parameters could distinguish between the most conserved homeologous BACs, sequence trace files for gmw1-105h23 and gmw1-15k6 were combined into a single "batch" assembly. Figure <figr fid="F2">2</figr> shows that there is no cross assembly and no inclusion of sequencing traces between BACs. Assemblies were analyzed both manually and based upon BAC-specific tags to determine that sequence traces were assembled into the correct BAC contig. There are obvious regions with high levels of sequence identity between the BACs as determined by Crossmatch (Figure <figr fid="F2">2</figr>). Even with upwards of 97% sequence identity in exonic regions, sequence traces resolved into their correct "original" BACs. Quantification of the "batch-based" reassemblies against the original single-BAC assemblies was done using Vmatch <abbrgrp><abbr bid="B35">35</abbr></abbrgrp>. The three reassembled contigs for gmw1-105h23 had 99.58% sequence identity with 99.06% coverage to the original BAC assembly. Likewise, for gmw1-15k6 the resulting reassembly contigs had 99.80% sequence identity with 99.44% sequence coverage. As these results show, the assemblies were nearly identical to the original BAC assembly with the exception of small sequence gaps between the contigs, although clone pair ends clearly order and orient the contigs (Figure <figr fid="F2">2</figr>). Extrapolated to a whole-genome scale assembly, this shows that for soybean, unless there are regions of the genome that have higher levels of homeology than has been observed, the conserved paleopolyploidy of soybean will not have a substantial effect on the genome assembly.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Reassembly of highly identical homeologous soybean BACs</p>
               </caption>
               <text>
                  <p><b>Reassembly of highly identical homeologous soybean BACs</b>. Output of Phred/Phrap batch re-assembly of traces from gmw1-105h23 and gmw1-15k6 as viewed using Consed. Grey boxes represent the assembled contigs and are scaled in base pairs across each contig. Contig numbers are shown in pink boxes and are arbitrarily assigned by Phred/Phrap during sequence assembly. The blue and green boxes above each assembly show the predicted gene positions for gmw1-15k6 and gmw1-105h23, respectively. The green line-plot above each contig shows the average clone pair consistency. Sequence matches within and between contigs were determined with Cross-Match as part of Consed. Black lines within and between contigs show sequence matches that are in reverse orientation, while the orange lines show sequence matches in the same orientation. The bars between sequence matches correspond to the length of the match. Purple peak-shaped lines between contigs show clone pairs that span a gap. Below each contig is a purple line containing either blue (gmw1-15k6) or green (gmw1-105h23) tick marks; these are the tags that distinguish between traces from each BAC.</p>
               </text>
               <graphic file="1471-2164-8-330-2"/>
            </fig>
            <p>All of the 38,673 traces from all 17 BACs were then combined into a single assembly using both standard assembly parameters as well as various other parameter sets. Assemblies were quantified using three measures: 1) the number of contigs containing greater than 100 traces versus the original 35 contigs from individual BAC assemblies 2) average percent coverage of the reassembled contigs to original contigs and 3) average percent nucleotide identity of the reassembled contigs to the original contigs (Table <tblr tid="T3">3</tblr>). These last two values were determined by Vmatch analysis that performed a global pair-wise alignment between all of the reassembled contigs and original assembly contigs as described in materials and methods. Under all of the parameter sets, some contigs were split into multiple contigs thereby increasing the contig number to greater than the original 35.</p>
            <tbl id="T3">
               <title>
                  <p>Table 3</p>
               </title>
               <caption>
                  <p>Assessment and quantification of reassembly of duplicate BAC sequences</p>
               </caption>
               <tblbdy cols="8">
                  <r>
                     <c ca="center">
                        <p>Assembly number</p>
                     </c>
                     <c ca="center">
                        <p>Parameters</p>
                     </c>
                     <c ca="center">
                        <p>Total # contigs</p>
                     </c>
                     <c ca="center">
                        <p># contigs (> 100)<sup>a</sup></p>
                     </c>
                     <c ca="center">
                        <p>% Coverage of old contigs<sup>b</sup></p>
                     </c>
                     <c ca="center">
                        <p>% Identity to old contigs<sup>c</sup></p>
                     </c>
                     <c ca="center">
                        <p>% Coverage +103e11<sup>d</sup></p>
                     </c>
                     <c ca="center">
                        <p>% Identity +103e11<sup>d</sup></p>
                     </c>
                  </r>
                  <r>
                     <c cspan="8">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>1</p>
                     </c>
                     <c ca="center">
                        <p>standard</p>
                     </c>
                     <c ca="center">
                        <p>551</p>
                     </c>
                     <c ca="center">
                        <p>44</p>
                     </c>
                     <c ca="center">
                        <p>98.52%</p>
                     </c>
                     <c ca="center">
                        <p>99.07%</p>
                     </c>
                     <c ca="center">
                        <p>98.44%</p>
                     </c>
                     <c ca="center">
                        <p>97.39%</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>2</p>
                     </c>
                     <c ca="center">
                        <p>revise_greedy</p>
                     </c>
                     <c ca="center">
                        <p>2538</p>
                     </c>
                     <c ca="center">
                        <p>45</p>
                     </c>
                     <c ca="center">
                        <p>91.41%</p>
                     </c>
                     <c ca="center">
                        <p>99.08%</p>
                     </c>
                     <c ca="center">
                        <p>92.74%</p>
                     </c>
                     <c ca="center">
                        <p>98.43%</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>3</p>
                     </c>
                     <c ca="center">
                        <p>forcelevel 5</p>
                     </c>
                     <c ca="center">
                        <p>2140</p>
                     </c>
                     <c ca="center">
                        <p>40</p>
                     </c>
                     <c ca="center">
                        <p>96.13%</p>
                     </c>
                     <c ca="center">
                        <p>99.21%</p>
                     </c>
                     <c ca="center">
                        <p>95.56%</p>
                     </c>
                     <c ca="center">
                        <p>98.52%</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>4</p>
                     </c>
                     <c ca="center">
                        <p>minmatch 30</p>
                     </c>
                     <c ca="center">
                        <p>2184</p>
                     </c>
                     <c ca="center">
                        <p>50</p>
                     </c>
                     <c ca="center">
                        <p>94.77%<sup>e</sup></p>
                     </c>
                     <c ca="center">
                        <p>98.92%<sup>e</sup></p>
                     </c>
                     <c ca="center">
                        <p>95.51%</p>
                     </c>
                     <c ca="center">
                        <p>97.91%</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>5</p>
                     </c>
                     <c ca="center">
                        <p>forcelevel 3</p>
                     </c>
                     <c ca="center">
                        <p>2326</p>
                     </c>
                     <c ca="center">
                        <p>43</p>
                     </c>
                     <c ca="center">
                        <p>98.40%</p>
                     </c>
                     <c ca="center">
                        <p>98.60%</p>
                     </c>
                     <c ca="center">
                        <p>97.74%</p>
                     </c>
                     <c ca="center">
                        <p>97.96%</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>6</p>
                     </c>
                     <c ca="center">
                        <p>forcelevel 5 minmatch 30</p>
                     </c>
                     <c ca="center">
                        <p>1781</p>
                     </c>
                     <c ca="center">
                        <p>43</p>
                     </c>
                     <c ca="center">
                        <p>88.75%<sup>e</sup></p>
                     </c>
                     <c ca="center">
                        <p>99.18%<sup>e</sup></p>
                     </c>
                     <c ca="center">
                        <p>86.17%</p>
                     </c>
                     <c ca="center">
                        <p>98.04%</p>
                     </c>
                  </r>
                  <r>
                     <c ca="center">
                        <p>7</p>
                     </c>
                     <c ca="center">
                        <p>forcelevel 3 minmatch 30</p>
                     </c>
                     <c ca="center">
                        <p>1950</p>
                     </c>
                     <c ca="center">
                        <p>46</p>
                     </c>
                     <c ca="center">
                        <p>93.38%<sup>f</sup></p>
                     </c>
                     <c ca="center">
                        <p>99.18%<sup>f</sup></p>
                     </c>
                     <c>
                        <p/>
                     </c>
                     <c>
                        <p/>
                     </c>
                  </r>
               </tblbdy>
               <tblfn>
                  <p><sup>a </sup>Total number of contigs that contain greater than 100 sequence traces</p>
                  <p><sup>b </sup>Total length of the resulting contigs (not including any overlapping regions) divided by the length of the originally assembled BAC</p>
                  <p><sup>c </sup>Percent identity as calculated from Vmatch</p>
                  <p><sup>d </sup>Recalculated percent coverage and percent identity to include contigs containing traces from gmw1-103e11; these contigs did not meet the 80% sequence identity cutoff for Vmatch</p>
                  <p><sup>e </sup>One contig from gmw1-103e11 met the cutoff criteria of 80% sequence identity for Vmatch and was included in this estimation. The second contig was included in the +103e11 calculations</p>
                  <p><sup>f </sup>This parameter set matches the parameter set that was determined to give the best reassembly of gmw1-103e11 as a single BAC reassembly. Both resulting contigs met the 80% sequence identity cutoff for Vmatch and are included in these averages.</p>
               </tblfn>
            </tbl>
            <p>Experimental parameters were varied in an attempt to increase the percent coverage and percent nucleotide identity of the batch assemblies. The first parameter, revise_greedy, split initial contig assemblies at weak joins (regions that may be misassembled between duplicate regions due to sequence identity) and then attempted to reattach them for a higher overall alignment score. While only barely increasing the percent identity score, the percent coverage score was reduced by just over 7%. The forcelevel flag specifically reduced the stringency during the final contigs merge pass with 0 being most stringent and 10 least stringent, standard parameters using 0. When the forcelevel was relaxed slightly to 3, the percent coverage was nearly the same with only a slight drop in percent identity. However, increasing forcelevel to 5 decreased the percent coverage by just over 2% but increased the percent identity by over a full percent. It also had the effect of reducing the number of contigs from 44 at forcelevel 0 to 40 at forcelevel 5. Finally, the minmatch value was adjusted from 14 (standard) to 30 to increase the assembly stringency, a modification that dramatically increased the number of contigs to 50, as expected, and dropped the overall percent coverage. Combinations of these parameter changes also were investigated and the results are given as assemblies 6 and 7. Overall, it appears that standard Phred/Phrap assembly parameters return the greatest percent coverage out of all assemblies as well as the nearly best percent identity to the original contig assemblies.</p>
         </sec>
         <sec>
            <st>
               <p>Sources of potential assembly errors</p>
            </st>
            <p>Two potential sources of assembly error were identified in this analysis. First, under the last three assembly conditions (assemblies 5&#8211;7, Table <tblr tid="T3">3</tblr>) a contig from gmw1-27d20 and from GM_UMb-5f5 were incorrectly merged at a large (TATA)<sub>n </sub>simple sequence repeat region. The resulting contig clearly shows the transition from one BAC to the other across the TA repeat with low quality sequences and low sequence coverage flanking the repeat. Lower quality sequences are not uncommon with simple sequence repeats that are large in length as these regions are difficult to sequence through. Secondly, the assembly of BAC gmw1-103e11 was especially troublesome in both the "batch" assembly of all of the BACs and on an individual assembly scale. Table <tblr tid="T3">3</tblr> shows how the inclusion of the 103e11 contigs (which in most cases did not meet the Vmatch parsing criteria as is noted in Table <tblr tid="T3">3</tblr>) lowers both the average percent coverage and percent identity across the assembly.</p>
            <p>Under standard assembly conditions, the 89,397 bp BAC gmw1-103e11 is fragmented into two contigs, a 19,452 bp contig with clone pair matches to the middle of the larger 69,905 bp contig. Clearly, a region from the middle of gmw1-103e11 is misassembled into a separate contig. This region can be partially resolved without manual reassembly by changing the forcelevel to 3 and minmatch to 30. The assembly still results in two contigs, but this is due to a gap in the middle of the contig and not exclusion of a region in the middle of the contig as with standard assembly parameters. The overall sequence coverage is 84.7% and sequence identity of 82.49% to the original BAC sequence. When this parameter set is used to reassemble all of the BACs however, it reduces the percent coverage by just over 5% but does increase the percent identity by almost 2% (Table <tblr tid="T3">3</tblr>).</p>
            <p>This then raised the question as to what in the gmw1-103e11 sequence could be causing the re-assembly (both individual BAC and in the context of all BACs) to generate a second contig from the middle of the BAC. Utilizing Vmatch to identify sequence matches within the region being misassembled, non-retroelement, highly identical unique repeats (blue rectangles on Figure <figr fid="F3">3</figr>) were identified. Two major repeats occur in tandem in this region; a 566 bp repeat that is 96% identical (labelled as A and A' on Figure <figr fid="F3">3</figr>) and a 1,198 bp repeat that is 95% identical (labelled as B and B' on Figure <figr fid="F3">3</figr>). Repeat A is present in the first unknown gene, repeat B in the pentatricopeptide repeat (PPR)-like 1 gene and both of the secondary repeat copies, A' and B' are contained within the PPR-like 2 gene (Figure <figr fid="F3">3</figr>).</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Repetitive sequences in BAC gmw1-103e11</p>
               </caption>
               <text>
                  <p><b>Repetitive sequences in BAC gmw1-103e11</b>. Gene positions and repetitive sequences found in the region of 30,000 bp to 53,000 bp on gmw1-103e11. Predicted gene structures are shown as green boxes and arrows, with the boxes representing exons and lines being introns. Black tick marks on a gene show the start position of a repeated PPR domain within the gene. The blue boxes show the repetitive sequences identified by Vmatch. Orange gene alignments reflect the realignment of predicted gene structures back to the genomic sequence.</p>
               </text>
               <graphic file="1471-2164-8-330-3"/>
            </fig>
            <p>GeneSeqer alignments <abbrgrp><abbr bid="B36">36</abbr></abbrgrp> were generated of each predicted gene structure from this region realigned to the gmw1-103e11 BAC sequence. A portion of the PPR-like 2 gene aligns to the region predicted to contain the PPR-like 1 and unknown genes (Figure <figr fid="F3">3</figr>; orange gene structures). Similarly, the PPR-like 1 gene aligns to a portion of PPR-like 2. All of these alignments were using the "moderate" stringency function of GeneSeqer. The two predicted PPR-like genes in this region vary greatly in their structures and lengths. As discussed above, often there is little to no EST support and <it>ab initio </it>predictions must be relied upon. For this region, the first unknown gene has 7 ESTs with only 90% sequence identity that support the last exon, the rest of the gene is based upon <it>ab initio </it>predictions. The phosphotransferase and second unknown gene have nearly full EST support. Both of the PPR-like genes, however, are completely <it>ab initio </it>predicted.</p>
            <p>Although there is variation in the predicted structures of the PPR-like genes, BLASTP annotation identified conserved pentatricopeptide repeat (PPR) repeats in both. PPR repeats are a degenerate ~30 amino acid motif that occur tandemly multiple times within a protein <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>. To identify potential PPR repeats across this region, MEME and MAST were used to generate PPR motifs and search the gmw1-103e11 BAC sequence for all possible occurrences of the motif <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. Two PPR repeats were found in the first intron of the predicted unknown gene, at least six PPR repeats were identified in the PPR-like 1 gene and eleven repeats were identified in the PPR-like 2 gene. These PPR repeats are 81&#8211;99 nucleotides in length that range from 25&#8211;100% similar at the amino acid level and 33&#8211;95.8% similar at the nucleotide level (within and between both PPR-like genes). The black lines on Figure <figr fid="F3">3</figr> show the start location of the PPR domains that are located end to end within the coding sequence. These repeats account for the Vmatch identified repeat sequences A/A' and B/B'. The similarity of a portion of PPR-like 2 to both the first unknown gene and PPR-like 1 suggests two scenarios: 1) PPR-like 2 is incorrectly predicted and should be two separate genes or 2) PPR-like 2 is incorrectly predicted and should be fused with the first unknown gene. In either case, these PPR containing genes and repeats are the source of assembly error, as discussed below.</p>
            <p>Identified repeats A/A', B/B' and all of the predicted genes from this region of gmw1-103e11 were re-aligned using GeneSeqer to the Phred/Phrap re-assembled gmw1-103e11 contigs. Both of the PPR-like gene structure predictions as well as the repeat A containing unknown gene align to a ~3,500 bp region in the middle of the 69,905 bp major contig. This region also contains clone pair matches to both ends of the 19,452 bp secondary contig. What has occurred is the PPR-containing regions are above the threshold of distinguishing one copy from another and have collapsed into a single structure in the larger contig. The phosphotransferase gene and second unknown gene are excluded from this region and placed in the separate contig. These results show that highly identical tandemly duplicated genes, especially those genes that themselves contain repetitive domains will be a potential source of assembly errors. In this case, the structure of the PPR repeats across the PPR-like genes cannot be resolved without manual curation of the assembly.</p>
         </sec>
         <sec>
            <st>
               <p>Composition of whole-genome shotgun sequence assembly</p>
            </st>
            <p>To determine how well our assemblies were screening for highly repetitive sequence, a preliminary assembly using standard Phred/Phrap parameters of 80,000 randomly chosen JGI trace files was done. Contigs containing greater than 15 traces were considered highly represented even after initial trace screening against known repetitive sequences. Each of these contigs was subject to a BLAST-based annotation against the NCBI nonredundant database and then clustered into groups based upon that annotation (Figure <figr fid="F4">4</figr>). Surprisingly, 23% of the JGI contigs showed no sequence identity to anything in the NCBI nonredundant database. However, when the contigs comprising this 23% are BLASTed against the repetitive database generated by Gill et al. <abbrgrp><abbr bid="B39">39</abbr></abbrgrp> only 5 contigs out of 44 had no match and 7 contigs had a bit-score less than 90 and were considered poor matches. Forty thousand randomly chosen JGI trace files were combined with the 36,978 BAC generated trace files in a standard Phred/Phrap assembly. The addition of the JGI whole-genome shotgun generated trace files had no effect on either the percent identity of the reassembled contigs (99.07%) or on the percent coverage (98.52%).</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Sequence composition of highly represented sequences in a small-subset of JGI sequence traces</p>
               </caption>
               <text>
                  <p><b>Sequence composition of highly represented sequences in a small-subset of JGI sequence traces</b>. A pie-chart representation of repetitive sequences from assembly of 80,000 JGI soybean whole-genome shotgun trace files. BAC corresponds to any contig that showed greatest identity to already assembled soybean BAC sequence. Mdh refers to a previously sequenced region of soybean containing repetitive sequence. No hit means that there was no blast-based match to the nonredundant database. Other was a best match to a sequence (BAC or genomic) from another organism that was not characterized. Satellite refers to known Sb92 or Str120 centromeric repeat sequences. The rest of the categories are as described in the figure legend.</p>
               </text>
               <graphic file="1471-2164-8-330-4"/>
            </fig>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Discussion</p>
         </st>
         <p>In this analysis, we have characterized homeologous sequences from the paleopolyploid soybean genome and studied the effect of conserved duplicate regions on sequence assembly. Identified BACs map to 11 of the 20 soybean linkage groups representing a broad sampling of potential homeologous regions across the soybean genome. Previous analyses have shown fairly extensive sequence conservation between homeologous blocks in soybean <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B25">25</abbr></abbrgrp>. Sequenced BACs identified as containing transcribed duplicate genes show a range of gene conservation (Figure <figr fid="F1">1</figr>; Additional Files <supplr sid="S1">1</supplr>, <supplr sid="S2">2</supplr>, <supplr sid="S3">3</supplr>, <supplr sid="S4">4</supplr>, <supplr sid="S5">5</supplr>: Supplemental Figures <figr fid="F1">1</figr>, <figr fid="F2">2</figr>, <figr fid="F3">3</figr>, <figr fid="F4">4</figr>).</p>
         <p>Early analyses of the structure and organization of a paleopolyploid genome have been in maize. The "maize model" suggests that the present maize genome is a result of extensive reciprocal deletions as well as major transposable element insertions causing genome expansion and contraction resulting in homeologous regions that are not well conserved <abbrgrp><abbr bid="B5">5</abbr><abbr bid="B7">7</abbr><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr></abbrgrp>. Conversely, in cotton, a relatively recent allotetraploid, the homologs studied were highly conserved with only small indels and transposable element insertions differing between regions <abbrgrp><abbr bid="B11">11</abbr></abbrgrp>. The "cotton model" suggests strong duplicate gene conservation that extends well into the intergenic regions. In this analysis we find that the soybean genome is a mosaic of these two models with a range of conservation spanning from gene for gene retention <abbrgrp><abbr bid="B25">25</abbr></abbrgrp> to moderately conserved regions with 25 to 50% gene retention <abbrgrp><abbr bid="B8">8</abbr></abbrgrp> and highly divergent regions with a single gene conserved (Figure <figr fid="F1">1</figr>).</p>
         <p>Coalescence estimates suggest that most of the regions diverged approximately 9.6 Mya. This value falls within the range of what has previously been observed <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B25">25</abbr></abbrgrp>. On the extreme end, however, five BACs contain highly divergent duplicate genes. These may indeed be the result of gene translocation, segmental or single gene duplication and not the result of polyploidy. While in the absence of the whole genome sequence we cannot be certain of the mechanism by which these genes duplicated, some support for at least a larger duplication event is found from the genetic map. Mapping of duplicate RFLP markers in soybean provided early evidence for a major genome duplication event <abbrgrp><abbr bid="B12">12</abbr></abbrgrp>. Utilizing the most recent genetic map <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>, linkage groups D1a and D1b (where gmw1-57d24 and gmw1-27d20 map, respectively) were found to contain an RFLP A725 that is duplicated between these linkage groups. In addition, D1b and O (where gmw1-27d20 and gmw1-58k3 map, respectively) both contain the RFLP K011 duplicated between linkage groups. While the linkage positions of these markers are separated by many centimorgans (data not shown), it does lend credence to these linkage groups having a shared ancestry. A similar comparison for gmw1-13o17 and gmw1-8g7 could not be done because gmw1-8g7 is unmapped. Regardless of the mechanism, in soybean, there are regions of paleoduplicated chromosomes that have diverged greatly since duplication while others have not (Figure <figr fid="F1">1</figr>) [see Additional files <supplr sid="S1">1</supplr>, <supplr sid="S2">2</supplr>, <supplr sid="S3">3</supplr>, <supplr sid="S4">4</supplr>, <supplr sid="S5">5</supplr>].</p>
         <p>Size differences between duplicate genes were observed on many of the BACs (Table <tblr tid="T2">2</tblr>). Even though on average 59% of the predicted genes had some EST support, the reliance on <it>ab initio </it>predictions results in variation between duplicate genes in gene structure predictions. A similar issue is observed with the PPR-like genes on gmw1-103e11 that are a potential source of batch assembly error. In addition, the varying levels of protein identity in homeologous regions may be the result of unsupported gene structure predictions. This analysis clearly shows that for improved annotation of the whole genome assembly, more transcript (EST, cDNA, etc.) sequences will be necessary to verify predicted gene structures.</p>
         <p>Most plant genome sequencing efforts have been BAC-based using highly inbred plants with pseudo-monoploid genomes (diploid or polyploid plants with identical paleoduplicated genomes). As a result, plant genome assemblies have not been confounded by the effects of retained homeology in paleopolyploid regions of the genome. Conversely, many of the non-plant eukaryotic sequencing efforts have been WGS such as <it>Fugu rubripes </it><abbrgrp><abbr bid="B40">40</abbr></abbrgrp>, mouse <abbrgrp><abbr bid="B41">41</abbr><abbr bid="B42">42</abbr></abbrgrp>, and the Celera version of the human genome <abbrgrp><abbr bid="B43">43</abbr><abbr bid="B44">44</abbr></abbrgrp> to name only a few. Comparisons between the WGS project and BAC-based sequencing project in humans have found that while the WGS provides more accurate gene coverage more quickly, the BAC-based sequencing has much better coverage of repetitive sequences, especially highly conserved repeats and in the long run is more accurate in both order and orientation of genes <abbrgrp><abbr bid="B44">44</abbr><abbr bid="B45">45</abbr><abbr bid="B46">46</abbr><abbr bid="B47">47</abbr></abbrgrp>. A somewhat similar comparison between the <it>Oryza sativa </it>L. ssp. <it>indica </it><abbrgrp><abbr bid="B48">48</abbr></abbrgrp> and <it>Oryza sativa </it>L. ssp. <it>japonica </it><abbrgrp><abbr bid="B49">49</abbr></abbrgrp> sequencing projects concluded that the major differences in sequence assemblies are due to regions with large transposable elements <abbrgrp><abbr bid="B50">50</abbr></abbrgrp>.</p>
         <p>The soybean genome is a well-documented paleopolyploid <abbrgrp><abbr bid="B12">12</abbr><abbr bid="B51">51</abbr></abbrgrp> as are all sequenced plants, e.g., Arabidopsis <abbrgrp><abbr bid="B52">52</abbr></abbrgrp>, rice <abbrgrp><abbr bid="B48">48</abbr><abbr bid="B49">49</abbr><abbr bid="B53">53</abbr><abbr bid="B54">54</abbr></abbrgrp> and most recently Poplar <abbrgrp><abbr bid="B55">55</abbr></abbrgrp>. Although homeologous blocks could be identified in each of these species, even the most recent polyploidy events are thought to be more ancient than what has been described in soybean <abbrgrp><abbr bid="B19">19</abbr><abbr bid="B20">20</abbr></abbrgrp>. The often high levels of sequence conservation in homeologous regions in soybean <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B25">25</abbr></abbrgrp> have raised the question of what effect this will have on the assembly of the whole-genome shotgun sequence effort (WGS) currently underway.</p>
         <p>The reassembly of 17 homeologous BACs in soybean provides the first look at the effects of a relatively conserved paleopolyploid genome on WGS assembly. The most identical homeologous BACs sequenced, gmw1-105h23 and gmw1-15k6, are just under 95% identical across both the BAC coding and noncoding regions (Table <tblr tid="T2">2</tblr>) <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. Reassembly of these two BACs showed no misassembly of the BACs and no cross-assembly of trace files from one BAC in the other BAC (Figure <figr fid="F2">2</figr>). In the context of the WGS assembly, this is good news for homeologous regions that share less than 95% sequence identity. Under standard assembly parameters using Phred/Phrap, paleoduplicate homeologous regions should be resolvable.</p>
         <p>When all 17 BACs are reassembled in batch, observed assembly errors are the results of tandem duplications and simple sequence repeats. Analysis of the re-assembled BAC gmw1-103e11 shows that tandem duplications of genes such as the PPR-like genes with sequence identity greater than 95% may cause assembly issues. Using a standard set of parameters, clone pairs cannot be distinguished, especially when the repeat is larger than the sequence reads (generally over 500 bp). The parameter set that better resolves tandem repeats may not be the appropriate parameter set for all assemblies; as a result, hand assembly of these regions may be necessary for completion of genome assembly. Similarly, large simple sequence repeats may cause incorrect merging of regions. It should be noted, however, that if there are homeologous regions of the soybean genome that are conserved with greater than 95% sequence identity, they will likely behave in a manner similar to tandem duplications and may be more difficult to distinguish.</p>
         <p>What was not observed in the batch reassembly were errors caused by retrotransposon sequences. In soybean, many of the potential retrotransposons have not been characterized although a number of studies are underway to identify repetitive sequences in soybean (Marek et al. unpublished results) <abbrgrp><abbr bid="B39">39</abbr></abbrgrp>. This analysis, with one exception, did not identify BACs that contained numerous repetitive sequences; instead they were found to be gene rich. BAC gmw1-45m6 <abbrgrp><abbr bid="B25">25</abbr></abbrgrp> does contain numerous LTR retrotransposons, but re-assembly of this BAC showed few errors. Cytogenetic studies have shown that the high-copy sequences in soybean are highly concentrated to centromeric and pericentromeric regions <abbrgrp><abbr bid="B24">24</abbr><abbr bid="B56">56</abbr></abbrgrp>. In addition, ongoing analysis of repetitive sequence in soybean shows that it is primarily in the centric, telomeric and nucleolar organizing regions of the genome (Gill et al. unpublished results) <abbrgrp><abbr bid="B26">26</abbr></abbrgrp>. Contrary to maize or some species of rice <abbrgrp><abbr bid="B10">10</abbr><abbr bid="B57">57</abbr></abbrgrp>, no evidence for a large burst of retrotransposon activity has been found in soybean. It is likely then, that in the context of WGS assembly, retrotransposon sequences in most cases will not affect assembly of genic regions.</p>
         <p>Preliminary analysis of contigs generated from JGI trace files gives an estimation of what repetitive sequences will need to be screened for during WGS assembly (Figure <figr fid="F4">4</figr>). Even though the 80,000 JGI traces were prescreened against characterized soybean repeats, those trace files that contain a fragment of a repeat are passing through the screening process. Further, there are sufficient sequences that assemble to regenerate the original repetitive sequence into a contig, or at least enough of the sequence to match back to characterized repeats. One previously noted consequence of WGS assembly is that the exclusion of transposable element sequences and repetitive sequences during assembly has the effect of eliminating genes that might be found in these regions <abbrgrp><abbr bid="B45">45</abbr></abbrgrp>. In this case, genic sequences that flank or are contained in repetitive regions may be able to pass through the repeat screening such that they become part of the assembly. A balance between screening for repetitive sequences during WGS assembly while not excluding genic information will need to be found.</p>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>This analysis has shown that the soybean genome is a mosaic of sequence conservation models for a paleopolyploid genome with some regions retaining all duplicate genes while other regions retain only one divergent duplicate gene. With this in mind, a study to determine how paleopolyploidy would affect whole genome shot-gun sequence assembly was undertaken. Our results have shown that even the most conserved homeologous BACs with upwards of 95% sequence identity show no cross-assembly (inclusion of sequence traces from one BAC into the other BAC). In addition, potential sources of assembly error were identified as tandem duplications with greater than 95% sequence identity and large simple sequence repeats.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <sec>
            <st>
               <p>Identification, sequencing and single BAC assembly of duplicate BACs</p>
            </st>
            <p>BACs gmw1-74i13 and gmw1-52d3, corresponding to duplicate loci anchored by N-hydroxycinnamoyl benzoyltransferase (HCBT) genes, were identified, sequenced and annotated by Schlueter <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. Four BACs, gmw1-15k6, gmw1-105h23, gmw1-11j16 and gmw1-45m6 anchored by &#969;-6 fatty acid desaturase (FAD2) genes were identified, sequenced and annotated by Schlueter <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. BACs anchored by the RFLP probe A711 with known cytogenetic information <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>, GM_UMb-24d13 and GM_UMb-5f5, were used to construct shotgun libraries for sequencing and assembly as described previously <abbrgrp><abbr bid="B56">56</abbr></abbrgrp>.</p>
            <p>Retained duplicate transcripts corresponding to isoflavone synthase/cellulose synthase, galactinol synthase, raffinose synthase and caffeoyl-CoA o-methyltransferase were identified with TBLASTX (default parameters) using a reference sequence against all soybean ESTs <abbrgrp><abbr bid="B58">58</abbr></abbrgrp>. Identified ESTs were aligned into contigs using Sequencher v.4.5, also with default parameters (Gene Codes Corp., MI). PCR primers were designed to distinguish between copies using Oligo 6.82 (Molecular Biology Insights, Cascade, CO) [see Additional file <supplr sid="S6">6</supplr>]. Multidimensional pools of the Williams 82 <it>G. max </it>BAC library (gmw1) were PCR screened. BAC DNA was isolated using a Plasmid Midi kit (Qiagen, Valencia CA) and reverified with PCR as previously described <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>.</p>
            <suppl id="S6">
               <title>
                  <p>Additional file 6</p>
               </title>
               <text>
                  <p><b>Supplemental Table 1</b>. Contains homeolog-specific primer sequences used to identify BACs for sequencing. Both forward and reverse primers as well as their size and the BAC they identified are shown. Primers for BACs gmw1-52d3 and gmw1-74i13 are found in <abbrgrp><abbr bid="B8">8</abbr></abbrgrp> and primers for gmw1-105h23, gmw1-15k6 and gmw1-11j16 are found in <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>.</p>
               </text>
               <file name="1471-2164-8-330-S6.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
            <p>BACs gmw1-13o17 and gmw1-8g7 were subcloned and assembled as described in Schlueter <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. Subclones were sequenced at the Iowa State DNA Sequencing and Synthesis Facility (Ames, Iowa). Sequence for BACs gmw2-133d1, gmw1-93l19, gmw1-5g16, gmw1-103e11, gmw1-58k3, gmw1-57d24 and gmw1-27d20 was generated at the University of Oklahoma using conditions previously described <abbrgrp><abbr bid="B59">59</abbr><abbr bid="B60">60</abbr><abbr bid="B61">61</abbr><abbr bid="B62">62</abbr><abbr bid="B63">63</abbr></abbrgrp>. Accession numbers for all sequenced BACs can be found in Table <tblr tid="T1">1</tblr>.</p>
         </sec>
         <sec>
            <st>
               <p>Mapping of duplicate BACs</p>
            </st>
            <p>BACs were mapped using two methods. First, already mapped EST-based SNPs were identified by BLASTN of annotated genes from each BAC against mapped ESTs <abbrgrp><abbr bid="B10">10</abbr></abbrgrp>. Only ESTs that match to BAC-derived genes with an e-value of 0.0 (near identical match) were considered. In addition, each EST was aligned to the BAC to confirm that it corresponded to one homeolog (or paralog) versus the other. Secondly, each BAC that was not previously mapped was scanned for di- and tri-nucleotide repeats using Sputnik (Espresso Software Development, Seattle WA). Primer pairs flanking the potential SSR markers were designed using Oligo 6.82 (Molecular Biology Insights) and tested against various soybean parents of mapping populations. PCR reactions were 10 &#956;l in volume and contained 1 &#215; PCR buffer, 1.5 mM magnesium chloride, 5 mM dNTPs, 0.5 &#956;M each primer, 50 ng <it>Glycine max </it>parental DNA, and 0.025 U of Taq DNA polymerase (Invitrogen). PCR cycling conditions were 94&#176;C for 2 min, 35 cycles of 94&#176;C for 45 sec, 60&#176;C for 30 sec, 72&#176;C for 45 sec, followed by a final extension of 72&#176;C for 3 min. Resulting bands were run on either a 3% agarose 1 &#215; TAE (Tris, Acetic Acid, EDTA) gel for larger (greater than 250 bp) products or 6% polyacrylamide 0.5 &#215; PBE gel for smaller fragments. Polymorphic SSRs from each BAC were mapped in the <it>Glycine max </it>A81-356022 X <it>Glycine soja </it>PI 468.916 population <abbrgrp><abbr bid="B64">64</abbr><abbr bid="B13">13</abbr></abbrgrp>. Genetic map positions of these SSRs were determined using MapMaker/Exp 3.0 with a minimum lod score of 3.0 <abbrgrp><abbr bid="B64">64</abbr><abbr bid="B65">65</abbr></abbrgrp>. Sequences for these SSRs are available [see Additional file <supplr sid="S7">7</supplr>].</p>
            <suppl id="S7">
               <title>
                  <p>Additional file 7</p>
               </title>
               <text>
                  <p><b>Supplemental Table 2</b>. Contains primers that amplify simple sequence repeats for mapping designed from homeologous BACs. Primers for BACs gmw1-52d3 and gmw1-74i13 are found in <abbrgrp><abbr bid="B8">8</abbr></abbrgrp> and primers for gmw1-105h23, gmw1-15k6 and gmw1-11j16 are found in <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>.</p>
               </text>
               <file name="1471-2164-8-330-S7.pdf">
                  <p>Click here for file</p>
               </file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Annotation of BACs</p>
            </st>
            <p>Gene prediction was done using a combination of ab initio and EST-alignment based methods as previously detailed <abbrgrp><abbr bid="B8">8</abbr><abbr bid="B25">25</abbr></abbrgrp>. Annotation was completed using yrGATE and viewed as part of the xGDB system <abbrgrp><abbr bid="B66">66</abbr><abbr bid="B67">67</abbr></abbrgrp>. A database with annotations was created called GmaxGDB <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>. Each predicted gene was subjected to a BLASTP query of the NCBI nr database with default parameters to assign a putative function. An e-value threshold of 1<sup>e-10 </sup>was used to assign putative function.</p>
         </sec>
         <sec>
            <st>
               <p>Determination of homeologs and divergence estimates</p>
            </st>
            <p>Alignment of homeologous BACs used shuffle-LAGAN <abbrgrp><abbr bid="B68">68</abbr></abbrgrp> with default parameters anchored by predicted gene structures producing a VISTA plot <abbrgrp><abbr bid="B69">69</abbr></abbrgrp>. The nucleotide and protein percent identity and similarity of homeologs were calculated using WATER, a pairwise alignment program (gap penalty of 10; extension penalty of 0.2; EMBOSS)<abbrgrp><abbr bid="B70">70</abbr></abbrgrp>. Synonymous and nonsynonymous distances were calculated using PAML, default parameters <abbrgrp><abbr bid="B71">71</abbr></abbrgrp>. Coalescence estimates were calculated as in <abbrgrp><abbr bid="B20">20</abbr></abbrgrp>.</p>
         </sec>
         <sec>
            <st>
               <p>Batch sequence assembly and quantification of assemblies</p>
            </st>
            <p>Trace files for all of the assembled BACs were combined into a single assembly utilizing 36,978 sequence reads. Base calling and sequence assemblies were performed using Phred <abbrgrp><abbr bid="B31">31</abbr><abbr bid="B32">32</abbr></abbrgrp> and Phrap <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>, respectively. Assemblies were viewed using the Consed viewer and Cross-Match <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>. All assemblies were run with standard Phred/Phrap parameters unless otherwise noted in the text or table. Briefly, parameters that were varied were: 1) revise_greedy, which splits initial contig assemblies at weak joins (regions that may be misassembled due to high sequence identity) and then attempts to reattach them for a higher overall alignment score; 2) forcelevel, which reduces the stringency during the final contig merge pass; and 3) minmatch, which is the minimum length of a matching word in sequence comparisons during assembly. Further explanation of each parameter is found in the Phrap documentation <abbrgrp><abbr bid="B33">33</abbr></abbrgrp>.</p>
            <p>Previously characterized repetitive sequences from soybean available at the time of assembly were included in prescreening during assembly (Marek et al. unpublished results) <abbrgrp><abbr bid="B39">39</abbr></abbrgrp>. Quantification of assemblies was done using Vmatch for large-scale sequence matching (a large-scale global sequence alignment)<abbrgrp><abbr bid="B35">35</abbr></abbrgrp>. This program returns the percent nucleotide identity as well as the start and stop position for each contig alignment to allow for the calculation of percent coverage. Only contigs that contained greater than 100 traces were included in the analysis.</p>
            <p>Trace files from the soybean whole-genome shotgun sequencing effort were downloaded from the NCBI trace archive <abbrgrp><abbr bid="B72">72</abbr></abbrgrp>. These files are reads all uploaded from August 9&#8211;10, 2006 (ti's range from 1397334945 &#8211; 1399236113), for a total of 80,000 sequencing reads. To determine the sequence composition of the JGI-only assemblies, contigs containing greater than 15 traces were blasted against the nr database to assign a putative annotation. These contigs were assumed to represent what will be observed at a high frequency in the whole-genome assemblies.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>List of abbreviations</p>
         </st>
         <p>BAC &#8211; bacterial artificial chromosome; WGS &#8211; whole genome shotgun; SSR &#8211; simple sequence repeat; RFLP &#8211; restriction fragment length polymorphism; Ks &#8211; synonymous substitution; Ka &#8211; nonsynonymous substitution; Mya &#8211; million years ago; bp &#8211; base pair</p>
      </sec>
      <sec>
         <st>
            <p>Competing interests</p>
         </st>
         <p>The author(s) declares that there are no competing interests.</p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>JAS designed this study, sequenced BACs, annotated BACs, designed primers for mapping of BACs, performed sequence alignments and divergence estimates, carried out all of the batch sequence assemblies and quantification of those assemblies and drafted the manuscript. JYL identified and sequenced BACs anchored by the RFLP clones A711 and participated in drafting the manuscript. SDS developed and set up the GmaxGDB database that was utilized for annotation of BACs and aided in the quantification of assemblies. IFVS, SD, JY and MO participated in sequencing of BACs. BAR coordinated sequencing of BACs and helped to draft the manuscript. RTN participated in annotating BACs. BES carried out sequencing of BACs. SAJ and RCS helped to design this study as well as draft the manuscript. All authors read and approved the final manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>The authors would like to thank Mary Duke and Xiaofen Liu for their sequencing expertise. We would also like to thank Jody Hayes, Terry Olsen and Michelle Griffin for their skills in mapping SSR markers and Greg Peiffer for his assistance in identifying, sub-cloning and gap-closing of BACs. J.A. Schlueter was supported by a grant from the United Soybean Board during part of this research. Names are necessary to report factually on the available data; however, the USDA neither guarantees nor warrants the standard of the product, and the use of the name by the USDA implies no approval of the product to the exclusion of others that may also be suitable. This article is a contribution of the Corn Insect and Crop Genetics Research Unit (USDA-ARS).</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>Stomatal size in fossil plants: evidence for polyploidy in majority of angiosperms</p>
            </title>
            <aug>
               <au>
                  <snm>Masterson</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>1994</pubdate>
            <volume>264</volume>
            <fpage>421</fpage>
            <lpage>424</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.264.5157.421</pubid>
                  <pubid idtype="pmpid" link="fulltext">17836906</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>Polyploidy and genome evolution in plants</p>
            </title>
            <aug>
               <au>
                  <snm>Adams</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Wendel</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Current Opin Plant Biol</source>
            <pubdate>2005</pubdate>
            <volume>8</volume>
            <fpage>135</fpage>
            <lpage>141</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1016/j.pbi.2005.01.001</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>Plant conserved non-coding sequences and paralogue evolution</p>
            </title>
            <aug>
               <au>
                  <snm>Lockton</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Gaut</snm>
                  <fnm>BS</fnm>
               </au>
            </aug>
            <source>Trends in Genet</source>
            <pubdate>2005</pubdate>
            <volume>21</volume>
            <fpage>80</fpage>
            <lpage>86</lpage>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Evolution of genome size: new approaches to an old problem</p>
            </title>
            <aug>
               <au>
                  <snm>Petrov</snm>
                  <fnm>DA</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2001</pubdate>
            <volume>17</volume>
            <fpage>23</fpage>
            <lpage>28</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0168-9525(00)02157-0</pubid>
                  <pubid idtype="pmpid" link="fulltext">11163918</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>A complex history of rearrangement in an orthologous region of the maize, sorghum, and rice genomes</p>
            </title>
            <aug>
               <au>
                  <snm>Ilic</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>SanMiguel</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Bennetzen</snm>
                  <fnm>JL</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci</source>
            <pubdate>2003</pubdate>
            <volume>100</volume>
            <fpage>12265</fpage>
            <lpage>12270</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">218747</pubid>
                  <pubid idtype="pmpid" link="fulltext">14530400</pubid>
                  <pubid idtype="doi">10.1073/pnas.1434476100</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Genome size reduction through illegitimate recombination counteracts genome expansion in Arabidopsis</p>
            </title>
            <aug>
               <au>
                  <snm>Devos</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Brown</snm>
                  <fnm>JKM</fnm>
               </au>
               <au>
                  <snm>Bennetzen</snm>
                  <fnm>JL</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <fpage>1075</fpage>
            <lpage>1079</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">186626</pubid>
                  <pubid idtype="pmpid" link="fulltext">12097344</pubid>
                  <pubid idtype="doi">10.1101/gr.132102</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>DNA rearrangement in orthologous Orp regions of the maize, rice and sorghum genomes</p>
            </title>
            <aug>
               <au>
                  <snm>Ma</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>SanMiguel</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Lai</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Messing</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Bennetzen</snm>
                  <fnm>JL</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2005</pubdate>
            <volume>170</volume>
            <fpage>1209</fpage>
            <lpage>1220</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1451190</pubid>
                  <pubid idtype="pmpid" link="fulltext">15834137</pubid>
                  <pubid idtype="doi">10.1534/genetics.105.040915</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Sequence conservation of homeologous BACs and expression of homeologous genes in soybean (Glycine max L Merr)</p>
            </title>
            <aug>
               <au>
                  <snm>Schlueter</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Scheffler</snm>
                  <fnm>BE</fnm>
               </au>
               <au>
                  <snm>Schlueter</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2006</pubdate>
            <volume>174</volume>
            <fpage>1017</fpage>
            <lpage>1028</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1602103</pubid>
                  <pubid idtype="pmpid" link="fulltext">16888343</pubid>
                  <pubid idtype="doi">10.1534/genetics.105.055020</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Genome duplication, fractionation and the origin of regulatory novelty</p>
            </title>
            <aug>
               <au>
                  <snm>Langham</snm>
                  <fnm>RJ</fnm>
               </au>
               <au>
                  <snm>Walsh</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Dunn</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Ko</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Goff</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Freeling</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2004</pubdate>
            <volume>166</volume>
            <fpage>935</fpage>
            <lpage>945</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1470742</pubid>
                  <pubid idtype="pmpid" link="fulltext">15020478</pubid>
                  <pubid idtype="doi">10.1534/genetics.166.2.935</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>Uneven chromosome contraction and expansion in the maize genome</p>
            </title>
            <aug>
               <au>
                  <snm>Bruggmann</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Bharti</snm>
                  <fnm>AK</fnm>
               </au>
               <au>
                  <snm>Gundlach</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Lai</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Pontaroli</snm>
                  <fnm>AC</fnm>
               </au>
               <au>
                  <snm>Wei</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Haberer</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Fuks</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Du</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Raymond</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Estep</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Bennetzen</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Chan</snm>
                  <fnm>AP</fnm>
               </au>
               <au>
                  <snm>Rabinowicz</snm>
                  <fnm>PD</fnm>
               </au>
               <au>
                  <snm>Quackenbush</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Barbazuk</snm>
                  <fnm>WB</fnm>
               </au>
               <au>
                  <snm>Wing</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Birren</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Nusbaum</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Rounsley</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Mayer</snm>
                  <fnm>KFX</fnm>
               </au>
               <au>
                  <snm>Messing</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2006</pubdate>
            <volume>16</volume>
            <fpage>1241</fpage>
            <lpage>1251</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1581433</pubid>
                  <pubid idtype="pmpid" link="fulltext">16902087</pubid>
                  <pubid idtype="doi">10.1101/gr.5338906</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>Incongruent patterns of local and global genome size evolution in cotton</p>
            </title>
            <aug>
               <au>
                  <snm>Grover</snm>
                  <fnm>CE</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Wing</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Paterson</snm>
                  <fnm>AH</fnm>
               </au>
               <au>
                  <snm>Wendel</snm>
                  <fnm>JF</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2004</pubdate>
            <volume>14</volume>
            <fpage>1474</fpage>
            <lpage>1482</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">509256</pubid>
                  <pubid idtype="pmpid" link="fulltext">15256507</pubid>
                  <pubid idtype="doi">10.1101/gr.2673204</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Genome duplication in soybean (<it>Glycine </it>subgenus <it>soja</it>)</p>
            </title>
            <aug>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Polzin</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Labate</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Specht</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Brummer</snm>
                  <fnm>EC</fnm>
               </au>
               <au>
                  <snm>Olson</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Concibido</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Wilcox</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Tamulonis</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kochert</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Boerma</snm>
                  <fnm>HR</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>1996</pubdate>
            <volume>144</volume>
            <fpage>329</fpage>
            <lpage>338</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1207505</pubid>
                  <pubid idtype="pmpid" link="fulltext">8878696</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Mapping duplicate genes in soybean</p>
            </title>
            <aug>
               <au>
                  <snm>Lee</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Bush</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Specht</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
            </aug>
            <source>Genome</source>
            <pubdate>1999</pubdate>
            <volume>42</volume>
            <fpage>829</fpage>
            <lpage>836</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1139/gen-42-5-829</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Genome organization in dicots. II. <it>Arabidopsis </it>as a 'bridging species' to resolve genome evolution events among legumes</p>
            </title>
            <aug>
               <au>
                  <snm>Lee</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Grant</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Vallejos</snm>
                  <fnm>CE</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
            </aug>
            <source>Theor Appl Genet</source>
            <pubdate>2001</pubdate>
            <volume>103</volume>
            <fpage>765</fpage>
            <lpage>773</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1007/s001220100658</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>Soybean genomics survey: BAC-end sequences near RFLP and SSR markers</p>
            </title>
            <aug>
               <au>
                  <snm>Marek</snm>
                  <fnm>LF</fnm>
               </au>
               <au>
                  <snm>Mudge</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Darnielle</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Grant</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Hanson</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Paz</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Huihuang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Denny</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Larson</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Foster-Hartnett</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Cooper</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Danesh</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Larsen</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Schmidt</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Staggs</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Crow</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Retzel</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>ND</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
            </aug>
            <source>Genome</source>
            <pubdate>2001</pubdate>
            <volume>44</volume>
            <fpage>572</fpage>
            <lpage>581</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1139/gen-44-4-572</pubid>
                  <pubid idtype="pmpid" link="fulltext">11550890</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>Comparative genomic analysis of sequences sampled from a small region on soybean <it>(Glycine max) </it>molecular linkage group G</p>
            </title>
            <aug>
               <au>
                  <snm>Foster-Hartnett</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Mudge</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Larsen</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Danesh</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Yan</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Denny</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Penuela</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>ND</fnm>
               </au>
            </aug>
            <source>Genome</source>
            <pubdate>2002</pubdate>
            <volume>45</volume>
            <fpage>634</fpage>
            <lpage>645</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1139/g02-027</pubid>
                  <pubid idtype="pmpid" link="fulltext">12175066</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>Estimates of conserved microsynteny among the genomes of <it>Glycine max, Medicago truncatula </it>and <it>Arabidopsis thaliana</it></p>
            </title>
            <aug>
               <au>
                  <snm>Yan</snm>
                  <fnm>HH</fnm>
               </au>
               <au>
                  <snm>Mudge</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>D-J</fnm>
               </au>
               <au>
                  <snm>Larsen</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Cook</snm>
                  <fnm>DR</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>ND</fnm>
               </au>
            </aug>
            <source>Theor Appl Genet</source>
            <pubdate>2003</pubdate>
            <volume>106</volume>
            <fpage>1256</fpage>
            <lpage>1265</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">12748777</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Comparative physical mapping reveals features of microsynteny between <it>Glycine max, Medicago truncatula</it>, and <it>Arabidopsis thaliana</it></p>
            </title>
            <aug>
               <au>
                  <snm>Yan</snm>
                  <fnm>HH</fnm>
               </au>
               <au>
                  <snm>Mudge</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>D-J</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Cook</snm>
                  <fnm>DR</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>ND</fnm>
               </au>
            </aug>
            <source>Genome</source>
            <pubdate>2004</pubdate>
            <volume>47</volume>
            <fpage>141</fpage>
            <lpage>155</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1139/g03-106</pubid>
                  <pubid idtype="pmpid" link="fulltext">15060611</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Widespread paleopolyploidy in model plant species inferred from age distributions of duplicate genes</p>
            </title>
            <aug>
               <au>
                  <snm>Blanc</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Wolfe</snm>
                  <fnm>KH</fnm>
               </au>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2004</pubdate>
            <volume>16</volume>
            <fpage>1667</fpage>
            <lpage>1678</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">514152</pubid>
                  <pubid idtype="pmpid" link="fulltext">15208399</pubid>
                  <pubid idtype="doi">10.1105/tpc.021345</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Mining EST databases to resolve evolutionary events in major crop species</p>
            </title>
            <aug>
               <au>
                  <snm>Schlueter</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Dixon</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Granger</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Grant</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Clark</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Doyle</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
            </aug>
            <source>Genome</source>
            <pubdate>2004</pubdate>
            <volume>47</volume>
            <fpage>868</fpage>
            <lpage>876</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1139/g04-047</pubid>
                  <pubid idtype="pmpid" link="fulltext">15499401</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>Diagnosing duplications, can it be done?</p>
            </title>
            <aug>
               <au>
                  <snm>Durand</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Hoberman</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2006</pubdate>
            <volume>22</volume>
            <fpage>156</fpage>
            <lpage>164</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1016/j.tig.2006.01.002</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>Chromosome numbers in the Phaseoleae (Fabaceae:Faboideae) and their relation to taxonomy</p>
            </title>
            <aug>
               <au>
                  <snm>Lackey</snm>
                  <fnm>JA</fnm>
               </au>
            </aug>
            <source>Am J Bot</source>
            <pubdate>1980</pubdate>
            <volume>67</volume>
            <fpage>595</fpage>
            <lpage>602</lpage>
         </bibl>
         <bibl id="B23">
            <title>
               <p>BAC FISH reveals segmental duplications within the Glycine max (soybean) genome</p>
            </title>
            <aug>
               <au>
                  <snm>Pagel</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Walling</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Jackson</snm>
                  <fnm>SA</fnm>
               </au>
            </aug>
            <source>Genome</source>
            <pubdate>2004</pubdate>
            <volume>47</volume>
            <fpage>764</fpage>
            <lpage>768</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1139/g04-025</pubid>
                  <pubid idtype="pmpid" link="fulltext">15284882</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Chromosome-level homeology in paleopolyploid soybean (<it>Glycine max</it>) revealed through integration of genetic and chromosome maps</p>
            </title>
            <aug>
               <au>
                  <snm>Walling</snm>
                  <fnm>JG</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Mudge</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Jackson</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2006</pubdate>
            <volume>172</volume>
            <fpage>1893</fpage>
            <lpage>1900</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1456260</pubid>
                  <pubid idtype="pmpid" link="fulltext">16361231</pubid>
                  <pubid idtype="doi">10.1534/genetics.105.051466</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>The FAD2 family of soybean: insights into the structural and functional divergence of a paleopolyploid genome</p>
            </title>
            <aug>
               <au>
                  <snm>Schlueter</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Scheffler</snm>
                  <fnm>BE</fnm>
               </au>
               <au>
                  <snm>Roe</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Schlueter</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
            </aug>
            <source>The Plant Genome, a Suppl. to Crop Sci</source>
            <pubdate>2007</pubdate>
            <volume>47</volume>
            <issue>S1</issue>
            <url>http://www.crops.org/genome/</url>
            <note>doi:10.2135/cropsci2005.07.0206tpg</note>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Toward a reference sequence of the soybean genome: a multiagency effort</p>
            </title>
            <aug>
               <au>
                  <snm>Jackson</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Rokhsar</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Stacey</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Schmutz</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Grimwood</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>The Plant Genome, a Suppl. to Crop Sci</source>
            <pubdate>2006</pubdate>
            <volume>46</volume>
            <issue>S1</issue>
            <url>http://www.crops.org/genome/</url>
            <note>doi:10.2135/cropsci2005.07.0206tpg</note>
         </bibl>
         <bibl id="B27">
            <title>
               <p>A soybean transcript map: gene distribution, haplotype and SNP analysis</p>
            </title>
            <aug>
               <au>
                  <snm>Choi</snm>
                  <fnm>I-Y</fnm>
               </au>
               <au>
                  <snm>Hyten</snm>
                  <fnm>DL</fnm>
               </au>
               <au>
                  <snm>Matukumalli</snm>
                  <fnm>LK</fnm>
               </au>
               <au>
                  <snm>Song</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Chaky</snm>
                  <fnm>JM</fnm>
               </au>
               <au>
                  <snm>Quigley</snm>
                  <fnm>CV</fnm>
               </au>
               <au>
                  <snm>Chase</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Lark</snm>
                  <fnm>KG</fnm>
               </au>
               <au>
                  <snm>Reiter</snm>
                  <fnm>RS</fnm>
               </au>
               <au>
                  <snm>Yoon</snm>
                  <fnm>M-S</fnm>
               </au>
               <au>
                  <snm>Hwang</snm>
                  <fnm>E-Y</fnm>
               </au>
               <au>
                  <snm>Yi</snm>
                  <fnm>S-I</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>ND</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>van Tassell</snm>
                  <fnm>CP</fnm>
               </au>
               <au>
                  <snm>Specht</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Cregan</snm>
                  <fnm>PB</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2007</pubdate>
            <volume>176</volume>
            <fpage>685</fpage>
            <lpage>696</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1534/genetics.107.070821</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Legume genomes: more than peas in a pod</p>
            </title>
            <aug>
               <au>
                  <snm>Young</snm>
                  <fnm>ND</fnm>
               </au>
               <au>
                  <snm>Mudge</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ellis</snm>
                  <fnm>THN</fnm>
               </au>
            </aug>
            <source>Curr Opin Plant Biol</source>
            <pubdate>2003</pubdate>
            <volume>6</volume>
            <fpage>199</fpage>
            <lpage>204</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S1369-5266(03)00006-2</pubid>
                  <pubid idtype="pmpid" link="fulltext">12667879</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Highly syntenic regions in the genomes of soybean, <it>Medicago truncatula </it>and <it>Arabidopsis thaliana</it></p>
            </title>
            <aug>
               <au>
                  <snm>Mudge</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Cannon</snm>
                  <fnm>SB</fnm>
               </au>
               <au>
                  <snm>Kalo</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Oldroyd</snm>
                  <fnm>GED</fnm>
               </au>
               <au>
                  <snm>Roe</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Town</snm>
                  <fnm>CD</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>ND</fnm>
               </au>
            </aug>
            <source>BMC Plant Biol</source>
            <pubdate>2005</pubdate>
            <volume>5</volume>
            <fpage>15</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1201151</pubid>
                  <pubid idtype="pmpid" link="fulltext">16102170</pubid>
                  <pubid idtype="doi">10.1186/1471-2229-5-15</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <url>http://soybase.org/publication_data/Schlueter/GMaxGDB.html</url>
         </bibl>
         <bibl id="B31">
            <title>
               <p>Basecalling of automated sequencer traces using phred. II. Error probabilities</p>
            </title>
            <aug>
               <au>
                  <snm>Ewing</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>186</fpage>
            <lpage>194</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521922</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Basecalling of automated sequencer traces using phred. I. Accuracy assessment</p>
            </title>
            <aug>
               <au>
                  <snm>Ewing</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Hillier</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Wendl</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>175</fpage>
            <lpage>185</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521921</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>Phrap documentation</p>
            </title>
            <aug>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <pubdate>1999</pubdate>
            <url>http://www.phrap.org/phrap.docs/phrap.html</url>
         </bibl>
         <bibl id="B34">
            <title>
               <p>Consed: a graphical tool for sequence finishing</p>
            </title>
            <aug>
               <au>
                  <snm>Gordon</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Abajian</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <fpage>195</fpage>
            <lpage>202</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">9521923</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <url>http://www.vmatch.de</url>
         </bibl>
         <bibl id="B36">
            <url>http://www.plantgdb.org/PlantGDB-cgi/GeneSeqer/PlantGDBgs.cgi</url>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Genes encoding pentatricopeptide (PPR) proteins are not conserved in location in plant genomes and may be subject to diversifying selection</p>
            </title>
            <aug>
               <au>
                  <snm>Geddy</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Brown</snm>
                  <fnm>GG</fnm>
               </au>
            </aug>
            <source>BMC Genomics</source>
            <pubdate>2007</pubdate>
            <volume>8</volume>
            <fpage>130</fpage>
            <lpage>142</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1186/1471-2164-8-130</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>Combining evidence using p-values: application to sequence homology searches</p>
            </title>
            <aug>
               <au>
                  <snm>Bailey</snm>
                  <fnm>TL</fnm>
               </au>
               <au>
                  <snm>Gribskov</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>1998</pubdate>
            <volume>14</volume>
            <fpage>48</fpage>
            <lpage>54</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/bioinformatics/14.1.48</pubid>
                  <pubid idtype="pmpid" link="fulltext">9520501</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <url>http://www.soymap.org/data/misc/soy_repeats.fasta</url>
         </bibl>
         <bibl id="B40">
            <title>
               <p>Whole-genome shotgun assembly and analysis of the genome of <it>Fugu rubripes</it></p>
            </title>
            <aug>
               <au>
                  <snm>Aparicio</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Chapman</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Stupka</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Putnam</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Chia</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Dehal</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Christoffels</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Rash</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Hoon</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Smit</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Gelpke</snm>
                  <fnm>MDS</fnm>
               </au>
               <au>
                  <snm>Roach</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Oh</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Ho</snm>
                  <fnm>IY</fnm>
               </au>
               <au>
                  <snm>Wong</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Detter</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Verhoef</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Predki</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Tay</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lucas</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Richardson</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>SF</fnm>
               </au>
               <au>
                  <snm>Clark</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Edwards</snm>
                  <fnm>YJK</fnm>
               </au>
               <au>
                  <snm>Doggett</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Zharkikh</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Tavtigian</snm>
                  <fnm>SV</fnm>
               </au>
               <au>
                  <snm>Pruss</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Barnstead</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Evans</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Baden</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Powell</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Glusman</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Rowen</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Hood</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Tan</snm>
                  <fnm>YH</fnm>
               </au>
               <au>
                  <snm>Elgar</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Hawkins</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Venkatesh</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Rokhsar</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Brenner</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2002</pubdate>
            <volume>297</volume>
            <fpage>1301</fpage>
            <lpage>1310</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1072104</pubid>
                  <pubid idtype="pmpid" link="fulltext">12142439</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B41">
            <title>
               <p>A comparison of whole-genome shotgun-derived mouse chromosome 16 and the human genome</p>
            </title>
            <aug>
               <au>
                  <snm>Mural</snm>
                  <fnm>RJ</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Myers</snm>
                  <fnm>EW</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>HO</fnm>
               </au>
               <au>
                  <snm>Miklos</snm>
                  <fnm>GL</fnm>
               </au>
               <au>
                  <snm>Wides</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Halpern</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>PW</fnm>
               </au>
               <au>
                  <snm>Sutton</snm>
                  <fnm>GG</fnm>
               </au>
               <au>
                  <snm>Nadeau</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Holt</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Kodira</snm>
                  <fnm>CD</fnm>
               </au>
               <au>
                  <snm>Lu</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Deng</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Evangelista</snm>
                  <fnm>CC</fnm>
               </au>
               <au>
                  <snm>Gan</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Heiman</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Merkulov</snm>
                  <fnm>GV</fnm>
               </au>
               <au>
                  <snm>Milshina</snm>
                  <fnm>NV</fnm>
               </au>
               <au>
                  <snm>Naik</snm>
                  <fnm>AK</fnm>
               </au>
               <au>
                  <snm>Qi</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Shue</snm>
                  <fnm>BC</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Yan</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Ye</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Yooseph</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Zhao</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Zhu</snm>
                  <fnm>SC</fnm>
               </au>
               <au>
                  <snm>Biddick</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Bolanos</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Delcher</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Dew</snm>
                  <fnm>IM</fnm>
               </au>
               <au>
                  <snm>Fasulo</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Flanigan</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Huson</snm>
                  <fnm>DH</fnm>
               </au>
               <au>
                  <snm>Kravitz</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Mobarry</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>Reinert</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Remington</snm>
                  <fnm>KA</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>XH</fnm>
               </au>
               <au>
                  <snm>Nusskern</snm>
                  <fnm>DR</fnm>
               </au>
               <au>
                  <snm>Lai</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Lei</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Zhong</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Yao</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Guan</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Ji</snm>
                  <fnm>R-R</fnm>
               </au>
               <au>
                  <snm>Gu</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>Z-Y</fnm>
               </au>
               <au>
                  <snm>Zhong</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Xiao</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Chiang</snm>
                  <fnm>C-C</fnm>
               </au>
               <au>
                  <snm>Yandell</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Wortman</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Amanatides</snm>
                  <fnm>PG</fnm>
               </au>
               <au>
                  <snm>Hladun</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Pratts</snm>
                  <fnm>EC</fnm>
               </au>
               <au>
                  <snm>Johnson</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Dodson</snm>
                  <fnm>KL</fnm>
               </au>
               <au>
                  <snm>Woodford</snm>
                  <fnm>KJ</fnm>
               </au>
               <au>
                  <snm>Evans</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Gropman</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Rusch</snm>
                  <fnm>DB</fnm>
               </au>
               <au>
                  <snm>Venter</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Houck</snm>
                  <fnm>JT</fnm>
               </au>
               <au>
                  <snm>Tompkins</snm>
                  <fnm>DE</fnm>
               </au>
               <au>
                  <snm>Haynes</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Jacob</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Chin</snm>
                  <fnm>SH</fnm>
               </au>
               <au>
                  <snm>Allen</snm>
                  <fnm>DR</fnm>
               </au>
               <au>
                  <snm>Dahlke</snm>
                  <fnm>CE</fnm>
               </au>
               <au>
                  <snm>Sanders</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Levitsky</snm>
                  <fnm>AA</fnm>
               </au>
               <au>
                  <snm>Majoros</snm>
                  <fnm>WH</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Xia</snm>
                  <fnm>AC</fnm>
               </au>
               <au>
                  <snm>Lopez</snm>
                  <fnm>Jr</fnm>
               </au>
               <au>
                  <snm>Donnelly</snm>
                  <fnm>MT</fnm>
               </au>
               <au>
                  <snm>Newman</snm>
                  <fnm>MH</fnm>
               </au>
               <au>
                  <snm>Glodek</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Kraft</snm>
                  <fnm>CL</fnm>
               </au>
               <au>
                  <snm>Nodell</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Ali</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>An</snm>
                  <fnm>H-J</fnm>
               </au>
               <au>
                  <snm>Baldwin-Pitts</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Beeson</snm>
                  <fnm>KY</fnm>
               </au>
               <au>
                  <snm>Cai</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Carnes</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Carver</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Caulk</snm>
                  <fnm>PM</fnm>
               </au>
               <au>
                  <snm>Center</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>Y-H</fnm>
               </au>
               <au>
                  <snm>Cheng</snm>
                  <fnm>M-L</fnm>
               </au>
               <au>
                  <snm>Coyne</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Crowder</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Danaher</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Davenport</snm>
                  <fnm>LB</fnm>
               </au>
               <au>
                  <snm>Desilets</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Dietz</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Doup</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Dullaghan</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Ferriera</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Fosler</snm>
                  <fnm>CR</fnm>
               </au>
               <au>
                  <snm>Gire</snm>
                  <fnm>HC</fnm>
               </au>
               <au>
                  <snm>Gluecksmann</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Gocayne</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Gray</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Hart</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Haynes</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Hoover</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Howland</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Ibegwam</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Jalali</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Johns</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Kline</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Ma</snm>
                  <fnm>DS</fnm>
               </au>
               <au>
                  <snm>MacCawley</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Magoon</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mann</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>May</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>McIntosh</snm>
                  <fnm>TC</fnm>
               </au>
               <au>
                  <snm>Mehta</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Moy</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Moy</snm>
                  <fnm>MC</fnm>
               </au>
               <au>
                  <snm>Murphy</snm>
                  <fnm>BJ</fnm>
               </au>
               <au>
                  <snm>Murphy</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Nelson</snm>
                  <fnm>KA</fnm>
               </au>
               <au>
                  <snm>Nuri</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Parker</snm>
                  <fnm>KA</fnm>
               </au>
               <au>
                  <snm>Prudhomme</snm>
                  <fnm>AC</fnm>
               </au>
               <au>
                  <snm>Puri</snm>
                  <fnm>VN</fnm>
               </au>
               <au>
                  <snm>Qureshi</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Raley</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Reardon</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Regier</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Rogers</snm>
                  <fnm>Y-HC</fnm>
               </au>
               <au>
                  <snm>Romblad</snm>
                  <fnm>DL</fnm>
               </au>
               <au>
                  <snm>Schutz</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Scott</snm>
                  <fnm>JL</fnm>
               </au>
               <au>
                  <snm>Scott</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Sitter</snm>
                  <fnm>CD</fnm>
               </au>
               <au>
                  <snm>Smallwood</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Sprague</snm>
                  <fnm>AC</fnm>
               </au>
               <au>
                  <snm>Stewart</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Strong</snm>
                  <fnm>RV</fnm>
               </au>
               <au>
                  <snm>Suh</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Sylvester</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Thomas</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Tint</snm>
                  <fnm>NN</fnm>
               </au>
               <au>
                  <snm>Tsonis</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Williams</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Williams</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Windsor</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Wolfe</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>MM</fnm>
               </au>
               <au>
                  <snm>Zaveri</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Chaturvedi</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Gabrielian</snm>
                  <fnm>AE</fnm>
               </au>
               <au>
                  <snm>Ke</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Sun</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Subramanian</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Venter</snm>
                  <fnm>JC</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2002</pubdate>
            <volume>296</volume>
            <fpage>1661</fpage>
            <lpage>1671</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1069193</pubid>
                  <pubid idtype="pmpid" link="fulltext">12040188</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B42">
            <title>
               <p>Analysis of segmental duplications and genome assembly in the mouse</p>
            </title>
            <aug>
               <au>
                  <snm>Bailey</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Church</snm>
                  <fnm>DM</fnm>
               </au>
               <au>
                  <snm>Ventura</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Rocchi</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Eichler</snm>
                  <fnm>EE</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2004</pubdate>
            <volume>14</volume>
            <fpage>789</fpage>
            <lpage>801</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">479105</pubid>
                  <pubid idtype="pmpid" link="fulltext">15123579</pubid>
                  <pubid idtype="doi">10.1101/gr.2238404</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B43">
            <title>
               <p>The sequence of the human genome</p>
            </title>
            <aug>
               <au>
                  <snm>Venter</snm>
                  <fnm>JC</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Myers</snm>
                  <fnm>EW</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>PW</fnm>
               </au>
               <au>
                  <snm>Mural</snm>
                  <fnm>RJ</fnm>
               </au>
               <au>
                  <snm>Sutton</snm>
                  <fnm>GG</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>HO</fnm>
               </au>
               <au>
                  <snm>Yandell</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Evans</snm>
                  <fnm>CA</fnm>
               </au>
               <au>
                  <snm>Holt</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Gocayne</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Amanatides</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Ballew</snm>
                  <fnm>RM</fnm>
               </au>
               <au>
                  <snm>Huson</snm>
                  <fnm>DH</fnm>
               </au>
               <au>
                  <snm>Wortman</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Kodira</snm>
                  <fnm>CD</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>XH</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Skupski</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Subramanian</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Thomas</snm>
                  <fnm>PD</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Miklos</snm>
                  <fnm>GLG</fnm>
               </au>
               <au>
                  <snm>Nelson</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Broder</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Clark</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Nadeau</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>McKusick</snm>
                  <fnm>VA</fnm>
               </au>
               <au>
                  <snm>Zinder</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Levine</snm>
                  <fnm>AJ</fnm>
               </au>
               <au>
                  <snm>Roberts</snm>
                  <fnm>RJ</fnm>
               </au>
               <au>
                  <snm>Simon</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Slayman</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Hunkapiller</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Bolanos</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Delcher</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Dew</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Fasulo</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Flanigan</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Florea</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Halpern</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Hannenhalli</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Kravitz</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Levy</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Mobarry</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Reinert</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Remington</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Abu-Threideh</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Beasley</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Biddick</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Bonazzi</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Brandon</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Cargill</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Chandramouliswaran</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Charlab</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Chaturvedi</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Deng</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Di Francesco</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Dunn</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Eilbeck</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Evangelista</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Gabrielian</snm>
                  <fnm>AE</fnm>
               </au>
               <au>
                  <snm>Gan</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Ge</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Gong</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Gu</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Guan</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Heiman</snm>
                  <fnm>TJ</fnm>
               </au>
               <au>
                  <snm>Higgins</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Ji</snm>
                  <fnm>R-R</fnm>
               </au>
               <au>
                  <snm>Ke</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Ketchum</snm>
                  <fnm>KA</fnm>
               </au>
               <au>
                  <snm>Lai</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Lei</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Liang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Lin</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Lu</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Merkulov</snm>
                  <fnm>GV</fnm>
               </au>
               <au>
                  <snm>Milshina</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Moore</snm>
                  <fnm>HM</fnm>
               </au>
               <au>
                  <snm>Naik</snm>
                  <fnm>AK</fnm>
               </au>
               <au>
                  <snm>Narayan</snm>
                  <fnm>VA</fnm>
               </au>
               <au>
                  <snm>Neelam</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Nusskern</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Rusch</snm>
                  <fnm>DB</fnm>
               </au>
               <au>
                  <snm>Salzberg</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Shao</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Shue</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Sun</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>ZY</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wei</snm>
                  <fnm>J-H</fnm>
               </au>
               <au>
                  <snm>Wides</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Xiao</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Yan</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Yao</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Ye</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhan</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Zhao</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Zhong</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Zhong</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Zhu</snm>
                  <fnm>SC</fnm>
               </au>
               <au>
                  <snm>Zhao</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Gilbert</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Baumhueter</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Spier</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Carter</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Cravchik</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Woodage</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Ali</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>An</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Awe</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Baldwin</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Baden</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Barnstead</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Barrow</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Beeson</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Busam</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Carver</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Center</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Cheng</snm>
                  <fnm>ML</fnm>
               </au>
               <au>
                  <snm>Curry</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Danaher</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Davenport</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Desilets</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Dietz</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Dodson</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Doup</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Ferriera</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Garg</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Gluecksmann</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Hart</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Haynes</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Haynes</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Heiner</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Hladun</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Hostin</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Houck</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Howland</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Ibegwam</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Johnson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kalush</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Kline</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Koduru</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Love</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mann</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>May</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>McCawley</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>McIntosh</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>McMullen</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Moy</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Moy</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Murphy</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Nelson</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Pfannkoch</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Pratts</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Puri</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Qureshi</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Reardon</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Rodriguez</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Rogers</snm>
                  <fnm>Y-H</fnm>
               </au>
               <au>
                  <snm>Romblad</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Ruhfel</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Scott</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Sitter</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Smallwood</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Stewart</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Strong</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Suh</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Thomas</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Tint</snm>
                  <fnm>NN</fnm>
               </au>
               <au>
                  <snm>Tse</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Vech</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Wetter</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Williams</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Williams</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Windsor</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Winn-Deen</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Wolfe</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Zaveri</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zaveri</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Abril</snm>
                  <fnm>JF</fnm>
               </au>
               <au>
                  <snm>Guigo</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Campbell</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Sjolander</snm>
                  <fnm>KV</fnm>
               </au>
               <au>
                  <snm>Karlak</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Kejariwal</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mi</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Lazareva</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Hatton</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Narechania</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Diemer</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Muruganujan</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Guo</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Sato</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Bafna</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Istrail</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lippert</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Schwartz</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Walenz</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Yooseph</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Allen</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Basu</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Baxendale</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Blick</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Caminha</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Carnes-Stine</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Caulk</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Chiang</snm>
                  <fnm>Y-H</fnm>
               </au>
               <au>
                  <snm>Coyne</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Dahlke</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Mays</snm>
                  <fnm>AD</fnm>
               </au>
               <au>
                  <snm>Dombroski</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Donnelly</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Ely</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Esparham</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Fosler</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Gire</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Glanowski</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Glasser</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Glodek</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Gorokhov</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Graham</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Gropman</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Harris</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Heil</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Henderson</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Hoover</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Jennings</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Jordan</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Jordan</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kasha</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kagan</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Kraft</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Levitsky</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Lewis</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Lopez</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ma</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Majoros</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>McDaniel</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Murphy</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Newman</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Nguyen</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Nguyen</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Nodell</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Pan</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Peck</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Peterson</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Rowe</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Sanders</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Scott</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Simpson</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Smith</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Sprague</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Stockwell</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Turner</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Venter</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Wen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Xia</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Zandieh</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Zhu</snm>
                  <fnm>X</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2001</pubdate>
            <volume>291</volume>
            <fpage>1304</fpage>
            <lpage>1351</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1058040</pubid>
                  <pubid idtype="pmpid" link="fulltext">11181995</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B44">
            <title>
               <p>Whole-genome shotgun assembly and comparison of human genome assemblies</p>
            </title>
            <aug>
               <au>
                  <snm>Istrail</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Sutton</snm>
                  <fnm>GG</fnm>
               </au>
               <au>
                  <snm>Florea</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Halpern</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Mobarry</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>Lippert</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Walenz</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Shatkay</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Dew</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>Flanigan</snm>
                  <fnm>MJ</fnm>
               </au>
               <au>
                  <snm>Edwards</snm>
                  <fnm>NJ</fnm>
               </au>
               <au>
                  <snm>Bolanos</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Fasulo</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Halldorsson</snm>
                  <fnm>BV</fnm>
               </au>
               <au>
                  <snm>Hannenhalli</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Turner</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Yooseph</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Lu</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Nusskern</snm>
                  <fnm>DR</fnm>
               </au>
               <au>
                  <snm>Shue</snm>
                  <fnm>BX</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>XH</fnm>
               </au>
               <au>
                  <snm>Zhong</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Delcher</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Huson</snm>
                  <fnm>DH</fnm>
               </au>
               <au>
                  <snm>Dravitz</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Mouchard</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Reinert</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Remington</snm>
                  <fnm>KA</fnm>
               </au>
               <au>
                  <snm>Clark</snm>
                  <fnm>AG</fnm>
               </au>
               <au>
                  <snm>Waterman</snm>
                  <fnm>MS</fnm>
               </au>
               <au>
                  <snm>Eichler</snm>
                  <fnm>EE</fnm>
               </au>
               <au>
                  <snm>Adams</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Hunkapiller</snm>
                  <fnm>MW</fnm>
               </au>
               <au>
                  <snm>Myers</snm>
                  <fnm>EW</fnm>
               </au>
               <au>
                  <snm>Venter</snm>
                  <fnm>JC</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci</source>
            <pubdate>2004</pubdate>
            <volume>101</volume>
            <fpage>1916</fpage>
            <lpage>1921</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">357027</pubid>
                  <pubid idtype="pmpid" link="fulltext">14769938</pubid>
                  <pubid idtype="doi">10.1073/pnas.0307971100</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B45">
            <title>
               <p>Shotgun sequence assembly and recent segmental duplications within the human genome</p>
            </title>
            <aug>
               <au>
                  <snm>She</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Jiang</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Clark</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Cheng</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Tuzun</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Church</snm>
                  <fnm>DM</fnm>
               </au>
               <au>
                  <snm>Sutton</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Halpern</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Eichler</snm>
                  <fnm>EE</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2004</pubdate>
            <volume>431</volume>
            <fpage>927</fpage>
            <lpage>930</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature03062</pubid>
                  <pubid idtype="pmpid" link="fulltext">15496912</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B46">
            <title>
               <p>Genome assembly comparison identifies structural variants in the human genome</p>
            </title>
            <aug>
               <au>
                  <snm>Khaja</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Macdonald</snm>
                  <fnm>JR</fnm>
               </au>
               <au>
                  <snm>He</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Joseph-George</snm>
                  <fnm>AM</fnm>
               </au>
               <au>
                  <snm>Wei</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Rafiq</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Qian</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Shago</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Pantano</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Aburatani</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Redon</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Hurles</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Armengol</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Estivill</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Mural</snm>
                  <fnm>RJ</fnm>
               </au>
               <au>
                  <snm>Lee</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Scherer</snm>
                  <fnm>SW</fnm>
               </au>
               <au>
                  <snm>Feuk</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>Nat Genet</source>
            <pubdate>2006</pubdate>
            <volume>38</volume>
            <fpage>1413</fpage>
            <lpage>1418</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/ng1921</pubid>
                  <pubid idtype="pmpid" link="fulltext">17115057</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B47">
            <title>
               <p>Whole genome computational comparative genomics: A fruitful approach for ascertaining Alu insertion polymorphisms</p>
            </title>
            <aug>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Song</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Gonder</snm>
                  <fnm>MK</fnm>
               </au>
               <au>
                  <snm>Azrak</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Ray</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Batzer</snm>
                  <fnm>MA</fnm>
               </au>
               <au>
                  <snm>Tishkoff</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Liang</snm>
                  <fnm>P</fnm>
               </au>
            </aug>
            <source>Gene</source>
            <pubdate>2006</pubdate>
            <volume>365</volume>
            <fpage>11</fpage>
            <lpage>20</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1847407</pubid>
                  <pubid idtype="pmpid" link="fulltext">16376498</pubid>
                  <pubid idtype="doi">10.1016/j.gene.2005.09.031</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B48">
            <title>
               <p>A draft sequence of the rice genome (<it>Oryza sativa </it>L. ssp. <it>indica</it>)</p>
            </title>
            <aug>
               <au>
                  <snm>Yu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Hu</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wong</snm>
                  <fnm>GK-S</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Deng</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Dai</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Zhou</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Cao</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Sun</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Tang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Huang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Lin</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Ye</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Tong</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Cong</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Geng</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Han</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Hu</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Huang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Qi</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Lu</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Wu</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Zhu</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Ni</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Han</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Dong</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Ren</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Feng</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Cui</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Zhai</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>He</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Xu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Dong</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zeng</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Tao</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Ye</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Tan</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ren</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>He</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Tian</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Tian</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Xia</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Bao</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Gao</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Cao</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhao</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Hu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Xiong</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Mao</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Zhou</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Zhu</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Hao</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Guo</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Tao</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhu</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Yuan</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2002</pubdate>
            <volume>296</volume>
            <fpage>79</fpage>
            <lpage>92</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1068037</pubid>
                  <pubid idtype="pmpid" link="fulltext">11935017</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B49">
            <title>
               <p>A draft sequence of the rice genome (<it>Oryza sativa </it>L. ssp. <it>japonica</it>)</p>
            </title>
            <aug>
               <au>
                  <snm>Goff</snm>
                  <fnm>SA</fnm>
               </au>
               <au>
                  <snm>Ricke</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Lan</snm>
                  <fnm>T-H</fnm>
               </au>
               <au>
                  <snm>Presting</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Dunn</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Glazebrook</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Sessions</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Oeller</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Varma</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Hadley</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Hutchison</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Martin</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Katagiri</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Lange</snm>
                  <fnm>BM</fnm>
               </au>
               <au>
                  <snm>Moughamer</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Xia</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Budworth</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Zhong</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Miguel</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Paszkowski</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Colbert</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Sun</snm>
                  <fnm>W-L</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Cooper</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Park</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Wood</snm>
                  <fnm>TC</fnm>
               </au>
               <au>
                  <snm>Mao</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Quail</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Wing</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Dean</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Yu</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Zharkikh</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Shen</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Sahasrabudhe</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Thomas</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Cannings</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Gutin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Pruss</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Reid</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Tavtigian</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Mitchell</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Eldredge</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Scholl</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>RM</fnm>
               </au>
               <au>
                  <snm>Bhatnagar</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Adey</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Rubano</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Tusneem</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Robinson</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Feldhaus</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Macalma</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Oliphant</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Briggs</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2002</pubdate>
            <volume>296</volume>
            <fpage>92</fpage>
            <lpage>100</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1068275</pubid>
                  <pubid idtype="pmpid" link="fulltext">11935018</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B50">
            <title>
               <p>Comparing the whole-genome-shotgun and map-based sequences of the rice genome</p>
            </title>
            <aug>
               <au>
                  <snm>Yu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ni</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Wong</snm>
                  <fnm>GK-S</fnm>
               </au>
            </aug>
            <source>Trends Plant Sci</source>
            <pubdate>2006</pubdate>
            <volume>11</volume>
            <fpage>387</fpage>
            <lpage>391</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/j.tplants.2006.06.005</pubid>
                  <pubid idtype="pmpid" link="fulltext">16843033</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B51">
            <title>
               <p>Paleopolyploidy and gene duplication in soybean and other legumes</p>
            </title>
            <aug>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Schlueter</snm>
                  <fnm>JA</fnm>
               </au>
               <au>
                  <snm>Doyle</snm>
                  <fnm>JJ</fnm>
               </au>
            </aug>
            <source>Curr Opin Plant Biol</source>
            <pubdate>2006</pubdate>
            <volume>9</volume>
            <fpage>104</fpage>
            <lpage>109</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1016/j.pbi.2006.01.007</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B52">
            <title>
               <p>Analysis of the genome sequence of the flowering plant <it>Arabidopsis thaliana</it></p>
            </title>
            <aug>
               <au>
                  <cnm>The <it>Arabidopsis </it>Genome Initiative</cnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2000</pubdate>
            <volume>408</volume>
            <fpage>796</fpage>
            <lpage>815</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/35048692</pubid>
                  <pubid idtype="pmpid" link="fulltext">11130711</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B53">
            <title>
               <p>Ancestral genome duplication in rice</p>
            </title>
            <aug>
               <au>
                  <snm>Guyot</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Keller</snm>
                  <fnm>B</fnm>
               </au>
            </aug>
            <source>Genome</source>
            <pubdate>2004</pubdate>
            <volume>47</volume>
            <fpage>610</fpage>
            <lpage>614</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1139/g04-016</pubid>
                  <pubid idtype="pmpid" link="fulltext">15190378</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B54">
            <title>
               <p>Buffering of crucial functions by paleologous duplicated gene may contribute cyclicality to angiosperm genome duplication</p>
            </title>
            <aug>
               <au>
                  <snm>Chapman</snm>
                  <fnm>BA</fnm>
               </au>
               <au>
                  <snm>Bowers</snm>
                  <fnm>JE</fnm>
               </au>
               <au>
                  <snm>Feltus</snm>
                  <fnm>FA</fnm>
               </au>
               <au>
                  <snm>Paterson</snm>
                  <fnm>AH</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci</source>
            <pubdate>2006</pubdate>
            <volume>103</volume>
            <fpage>2730</fpage>
            <lpage>2735</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1413778</pubid>
                  <pubid idtype="pmpid" link="fulltext">16467140</pubid>
                  <pubid idtype="doi">10.1073/pnas.0507782103</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B55">
            <title>
               <p>The genome of black cottonwood, <it>Populus trichocarpa </it>(Torr &amp; Gray)</p>
            </title>
            <aug>
               <au>
                  <snm>Tuskan</snm>
                  <fnm>GA</fnm>
               </au>
               <au>
                  <snm>DiFazio</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Jansson</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Bohlmann</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Grigoriev</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Hellsten</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Putnam</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Ralph</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Rombauts</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Salamov</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Schein</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Sterck</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Aerts</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Bhalerao</snm>
                  <fnm>RR</fnm>
               </au>
               <au>
                  <snm>Bhalerao</snm>
                  <fnm>RP</fnm>
               </au>
               <au>
                  <snm>Blaudez</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Boerjan</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Brun</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Brunner</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Busov</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Campbell</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Carlson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Chalot</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Chapman</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Chen</snm>
                  <fnm>G-L</fnm>
               </au>
               <au>
                  <snm>Cooper</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Coutinho</snm>
                  <fnm>PM</fnm>
               </au>
               <au>
                  <snm>Couturier</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Covert</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Cronk</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Cunningham</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Davis</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Degroeve</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Dejardin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>dePamphilis</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Detter</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Dirks</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Dubchak</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Duplessis</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Ehlting</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ellis</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Gendler</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Goodstein</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Gribskov</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Grimwood</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Groover</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Gunter</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Hamberger</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Heinze</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Helariutta</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Henrissat</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Holligan</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Holt</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Huang</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Islam-Faridi</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Jones-Rhoades</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Jorgensen</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Joshi</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Kangasjarvi</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Karlsson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Kelleher</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Kirkpatrick</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Kirst</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Kohler</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Kalluri</snm>
                  <fnm>U</fnm>
               </au>
               <au>
                  <snm>Larimer</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Leebens-Mack</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Leple</snm>
                  <fnm>J-C</fnm>
               </au>
               <au>
                  <snm>Locascio</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Lou</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Lucas</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Martin</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Montanini</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Napoli</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Nelson</snm>
                  <fnm>DR</fnm>
               </au>
               <au>
                  <snm>Nelson</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Nieminen</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Nilsson</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Pereda</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Peter</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Philippe</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Pilate</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Poliakov</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Razumovskaya</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Richardson</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Rinaldi</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Ritland</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Rouze</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Ryaboy</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Schmutz</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Schrader</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Segerman</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Shin</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Siddiqui</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Sterky</snm>
                  <fnm>F</fnm>
               </au>
               <au>
                  <snm>Terry</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Tsai</snm>
                  <fnm>C-J</fnm>
               </au>
               <au>
                  <snm>Uberbacher</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Unneberg</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Vahala</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wall</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Wessler</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Yin</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Douglas</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Marra</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Sandberg</snm>
                  <fnm>G</fnm>
               </au>
               <au>
                  <snm>Van de Peer</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Rokhsar</snm>
                  <fnm>D</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2006</pubdate>
            <volume>313</volume>
            <fpage>1596</fpage>
            <lpage>1604</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1128691</pubid>
                  <pubid idtype="pmpid" link="fulltext">16973872</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B56">
            <title>
               <p>Molecular and cytogenetic characterization of gene-poor, heterochromatic regions of <it>Glycine max </it>L. Merr</p>
            </title>
            <aug>
               <au>
                  <snm>Lin</snm>
                  <fnm>J-Y</fnm>
               </au>
               <au>
                  <snm>Hass-Jacobus</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>SanMiguel</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Walling</snm>
                  <fnm>JG</fnm>
               </au>
               <au>
                  <snm>Yuan</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Doyle</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
               <au>
                  <snm>Young</snm>
                  <fnm>ND</fnm>
               </au>
               <au>
                  <snm>Jackson</snm>
                  <fnm>SA</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2005</pubdate>
            <volume>170</volume>
            <fpage>1221</fpage>
            <lpage>1230</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1451161</pubid>
                  <pubid idtype="pmpid" link="fulltext">15879505</pubid>
                  <pubid idtype="doi">10.1534/genetics.105.041616</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B57">
            <title>
               <p>Doubling genome size without polyploidization: dynamics of retrotransposition-driven genomic expansions in <it>Oryza australiensis</it>, a wild relative of rice</p>
            </title>
            <aug>
               <au>
                  <snm>Piegu</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Guyot</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Picault</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Roulin</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Sanyal</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Kim</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Collura</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Brar</snm>
                  <fnm>DS</fnm>
               </au>
               <au>
                  <snm>Jackson</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Wing</snm>
                  <fnm>RA</fnm>
               </au>
               <au>
                  <snm>Panaud</snm>
                  <fnm>O</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2006</pubdate>
            <volume>16</volume>
            <fpage>1262</fpage>
            <lpage>1269</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1581435</pubid>
                  <pubid idtype="pmpid" link="fulltext">16963705</pubid>
                  <pubid idtype="doi">10.1101/gr.5290206</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B58">
            <title>
               <p>Basic local alignment search tool</p>
            </title>
            <aug>
               <au>
                  <snm>Altschul</snm>
                  <fnm>SF</fnm>
               </au>
               <au>
                  <snm>Gish</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Myers</snm>
                  <fnm>EW</fnm>
               </au>
               <au>
                  <snm>Lipman</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>1990</pubdate>
            <volume>215</volume>
            <fpage>403</fpage>
            <lpage>410</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">2231712</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B59">
            <title>
               <p>Shotgun cloning as the strategy of choice to generate templates for high-throughput dideoxynucleotide sequencing</p>
            </title>
            <aug>
               <au>
                  <snm>Bodenteich</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Chissoe</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>YF</fnm>
               </au>
               <au>
                  <snm>Roe</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>Automated DNA sequencing and analysis techniques</source>
            <publisher>Academic Press, London</publisher>
            <editor>Venter JC</editor>
            <pubdate>1993</pubdate>
            <fpage>42</fpage>
            <lpage>50</lpage>
         </bibl>
         <bibl id="B60">
            <title>
               <p>The complete nucleotide sequence of the SacBII domain of the P1 pAD10-SacBII Cloning vector and three cosmid cloning vectors: pTCF, svPHEP, and LAWRIST16</p>
            </title>
            <aug>
               <au>
                  <snm>Pan</snm>
                  <fnm>HQ</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>YP</fnm>
               </au>
               <au>
                  <snm>Chissoe</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Bodenteich</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Iyer</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Clifton</snm>
                  <fnm>SW</fnm>
               </au>
               <au>
                  <snm>Crabtree</snm>
                  <fnm>JS</fnm>
               </au>
               <au>
                  <snm>Roe</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>GATA</source>
            <pubdate>1994</pubdate>
            <volume>11</volume>
            <fpage>181</fpage>
            <lpage>186</lpage>
         </bibl>
         <bibl id="B61">
            <aug>
               <au>
                  <snm>Roe</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Crabtree</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Khan</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>DNA isolation and sequencing: essential techniques series</source>
            <publisher>J. Wiley and Sons, NY</publisher>
            <pubdate>1996</pubdate>
         </bibl>
         <bibl id="B62">
            <title>
               <p>Sequence and analysis of the human ABL gene, the BCR gene, and regions involved in the Philadelphia chromosomal translocation</p>
            </title>
            <aug>
               <au>
                  <snm>Chissoe</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Bodenteich</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>YF</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>YP</fnm>
               </au>
               <au>
                  <snm>Burian</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Clifton</snm>
                  <fnm>SW</fnm>
               </au>
               <au>
                  <snm>Crabtree</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Freeman</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Iyer</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Yichen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Hei-Jen</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Qua-Qin</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Sarhan</snm>
                  <fnm>OH</fnm>
               </au>
               <au>
                  <snm>Toth</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Zhili</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Guozhong</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Heisterkamp</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Groffen</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Roe</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>Genomics</source>
            <pubdate>1995</pubdate>
            <volume>27</volume>
            <fpage>67</fpage>
            <lpage>82</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1006/geno.1995.1008</pubid>
                  <pubid idtype="pmpid" link="fulltext">7665185</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B63">
            <title>
               <p>Shotgun library construction for DNA sequencing</p>
            </title>
            <aug>
               <au>
                  <snm>Roe</snm>
                  <fnm>BA</fnm>
               </au>
            </aug>
            <source>Methods in molecular biology, vol 255: bacterial artificial chromosomes, volume 1: library construction, physical mapping, and sequencing</source>
            <publisher>Humana Press Inc., Totowa, NJ</publisher>
            <editor>Zhao X, Stodolsky M</editor>
            <pubdate>2004</pubdate>
            <fpage>171</fpage>
            <lpage>187</lpage>
         </bibl>
         <bibl id="B64">
            <title>
               <p>RFLP analysis of soybean seed protein and oil content</p>
            </title>
            <aug>
               <au>
                  <snm>Diers</snm>
                  <fnm>BW</fnm>
               </au>
               <au>
                  <snm>Keim</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Fehr</snm>
                  <fnm>WR</fnm>
               </au>
               <au>
                  <snm>Shoemaker</snm>
                  <fnm>RC</fnm>
               </au>
            </aug>
            <source>Theoret Appl Genet</source>
            <pubdate>1992</pubdate>
            <volume>83</volume>
            <fpage>608</fpage>
            <lpage>612</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1007/BF00226905</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B65">
            <title>
               <p>MAPMAKER: an interactive computer package for constructing primary genetic linkage maps of experimental and natural populations</p>
            </title>
            <aug>
               <au>
                  <snm>Lander</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Green</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Abrahamson</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Barlow</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Daly</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Lincoln</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Newberg</snm>
                  <fnm>L</fnm>
               </au>
            </aug>
            <source>Genomics</source>
            <pubdate>1987</pubdate>
            <volume>1</volume>
            <fpage>174</fpage>
            <lpage>181</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/0888-7543(87)90010-3</pubid>
                  <pubid idtype="pmpid" link="fulltext">3692487</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B66">
            <title>
               <p>yrGATE: a web-based gene-structure annotation tool for the identification and dissemination of eukaryotic genes</p>
            </title>
            <aug>
               <au>
                  <snm>Wilkerson</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Schlueter</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Brendel</snm>
                  <fnm>V</fnm>
               </au>
            </aug>
            <source>Genome Biology</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <fpage>R58</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1779557</pubid>
                  <pubid idtype="pmpid" link="fulltext">16859520</pubid>
                  <pubid idtype="doi">10.1186/gb-2006-7-7-r58</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B67">
            <title>
               <p>xGDB: open-source computational infrastructure for the integrated evaluation and analysis of genome features</p>
            </title>
            <aug>
               <au>
                  <snm>Schlueter</snm>
                  <fnm>SD</fnm>
               </au>
               <au>
                  <snm>Wilkerson</snm>
                  <fnm>MD</fnm>
               </au>
               <au>
                  <snm>Dong</snm>
                  <fnm>Q</fnm>
               </au>
               <au>
                  <snm>Brendel</snm>
                  <fnm>V</fnm>
               </au>
            </aug>
            <source>Genome Biology</source>
            <pubdate>2006</pubdate>
            <volume>7</volume>
            <fpage>R111</fpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1794590</pubid>
                  <pubid idtype="pmpid" link="fulltext">17116260</pubid>
                  <pubid idtype="doi">10.1186/gb-2006-7-11-r111</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B68">
            <title>
               <p>Glocal alignment: finding rearrangements during alignment</p>
            </title>
            <aug>
               <au>
                  <snm>Brudno</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Malde</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Poliakov</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Do</snm>
                  <fnm>CB</fnm>
               </au>
               <au>
                  <snm>Couronne</snm>
                  <fnm>O</fnm>
               </au>
               <au>
                  <snm>Dubchak</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Batzoglou</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Bioinformatics</source>
            <pubdate>2003</pubdate>
            <volume>19S1</volume>
            <fpage>i54</fpage>
            <lpage>i62</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1093/bioinformatics/btg1005</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B69">
            <title>
               <p>VISTA: computational tools for comparative genomics</p>
            </title>
            <aug>
               <au>
                  <snm>Frazer</snm>
                  <fnm>KA</fnm>
               </au>
               <au>
                  <snm>Pachter</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Poliakov</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Rubin</snm>
                  <fnm>EM</fnm>
               </au>
               <au>
                  <snm>Dubchak</snm>
                  <fnm>I</fnm>
               </au>
            </aug>
            <source>Nuc Acids Res</source>
            <pubdate>2004</pubdate>
            <volume>32</volume>
            <fpage>W273</fpage>
            <lpage>279</lpage>
            <xrefbib>
               <pubid idtype="doi">10.1093/nar/gkh458</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B70">
            <title>
               <p>EMBOSS: the European molecular biology open software suite</p>
            </title>
            <aug>
               <au>
                  <snm>Rice</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Longden</snm>
                  <fnm>I</fnm>
               </au>
               <au>
                  <snm>Bleasby</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Trends Genet</source>
            <pubdate>2000</pubdate>
            <volume>16</volume>
            <fpage>276</fpage>
            <lpage>277</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0168-9525(00)02024-2</pubid>
                  <pubid idtype="pmpid" link="fulltext">10827456</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B71">
            <title>
               <p>PAML: a program package for phylogenetic analysis by maximum likelihood</p>
            </title>
            <aug>
               <au>
                  <snm>Yang</snm>
                  <fnm>Z</fnm>
               </au>
            </aug>
            <source>Comput Appl Biosci</source>
            <pubdate>1997</pubdate>
            <volume>13</volume>
            <fpage>555</fpage>
            <lpage>6</lpage>
            <xrefbib>
               <pubid idtype="pmpid">9367129</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B72">
            <url>http://www.ncbi.nlm.nih.gov/Traces/trace.cgi?</url>
         </bibl>
      </refgrp>
   </bm>
</art>
