<?xml version='1.0'?>
<!DOCTYPE art SYSTEM 'http://www.biomedcentral.com/xml/article.dtd'>
<art>
   <ui>1471-2164-9-93</ui>
   <ji>1471-2164</ji>
   <fm>
      <dochead>Research article</dochead>
      <bibl>
         <title>
            <p>Gene conversion in the rice genome</p>
         </title>
         <aug>
            <au id="A1" ce="yes">
               <snm>Xu</snm>
               <fnm>Shuqing</fnm>
               <insr iid="I1"/>
               <insr iid="I7"/>
               <insr iid="I8"/>
               <insr iid="I9"/>
               <email>shuqing.xu@env.ethz.ch</email>
            </au>
            <au id="A2" ce="yes">
               <snm>Clark</snm>
               <fnm>Terry</fnm>
               <insr iid="I1"/>
               <insr iid="I2"/>
               <email>kedali@gmail.com</email>
            </au>
            <au id="A3" ce="yes">
               <snm>Zheng</snm>
               <fnm>Hongkun</fnm>
               <insr iid="I1"/>
               <insr iid="I3"/>
               <email>zhenghk@genomics.org.cn</email>
            </au>
            <au id="A4" ce="yes">
               <snm>Vang</snm>
               <fnm>S&#248;ren</fnm>
               <insr iid="I4"/>
               <email>vang@ki.au.dk</email>
            </au>
            <au id="A5">
               <snm>Li</snm>
               <fnm>Ruiqiang</fnm>
               <insr iid="I1"/>
               <insr iid="I3"/>
               <email>lirq@genomics.org.cn</email>
            </au>
            <au id="A6">
               <snm>Wong</snm>
               <mnm>Ka-Shu</mnm>
               <fnm>Gane</fnm>
               <insr iid="I1"/>
               <insr iid="I5"/>
               <email>gane@ualberta.ca</email>
            </au>
            <au id="A7" ca="yes">
               <snm>Wang</snm>
               <fnm>Jun</fnm>
               <insr iid="I1"/>
               <insr iid="I3"/>
               <insr iid="I6"/>
               <email>wangj@genomics.org.cn</email>
            </au>
            <au id="A8" ca="yes">
               <snm>Zheng</snm>
               <fnm>Xiaoguang</fnm>
               <insr iid="I1"/>
               <email>zhengxg@genomics.org.cn</email>
            </au>
         </aug>
         <insg>
            <ins id="I1">
               <p>Beijing Institute of Genomics of Chinese Academy of Sciences, Beijing Genomics Institute, Beijing Proteomics Institute, Beijing 101300, China</p>
            </ins>
            <ins id="I2">
               <p>Department of Electrial Engineering and Computer Science, University of Kansas, Lawrence, KS 66046, USA</p>
            </ins>
            <ins id="I3">
               <p>Department of Biochemistry and Molecular Biology, University of Southern Denmark, DK-5230, Odense M, Denmark</p>
            </ins>
            <ins id="I4">
               <p>Research Unit for Molecular Medicine, Aarhus University Hospital and Faculty of Health Sciences, DK-8200 Aarhus N, Denmark</p>
            </ins>
            <ins id="I5">
               <p>Department of Biological Sciences and Department of Medicine, University of Alberta, Edmonton, Alberta, T6G 2E9, Canada</p>
            </ins>
            <ins id="I6">
               <p>The Institute of Human Genetics, University of Aarhus, DK-8000 Aarhus C, Denmark</p>
            </ins>
            <ins id="I7">
               <p>Kunming Institute of Zoology, Chinese Academy of Sciences, Kunming, 650223, China</p>
            </ins>
            <ins id="I8">
               <p>Graduate University of Chinese Academy of Sciences, Beijing, 100049, China</p>
            </ins>
            <ins id="I9">
               <p>Current address: Institute of Integrative Biology, ETH Zurich, 8092, Switzerland</p>
            </ins>
         </insg>
         <source>BMC Genomics</source>
         <issn>1471-2164</issn>
         <pubdate>2008</pubdate>
         <volume>9</volume>
         <issue>1</issue>
         <fpage>93</fpage>
         <url>http://www.biomedcentral.com/1471-2164/9/93</url>
         <xrefbib>
            <pubidlist>
               <pubid idtype="pmpid">18298833</pubid>
               <pubid idtype="doi">10.1186/1471-2164-9-93</pubid>
            </pubidlist>
         </xrefbib>
      </bibl>
      <history>
         <rec>
            <date>
               <day>16</day>
               <month>9</month>
               <year>2007</year>
            </date>
         </rec>
         <acc>
            <date>
               <day>25</day>
               <month>2</month>
               <year>2008</year>
            </date>
         </acc>
         <pub>
            <date>
               <day>25</day>
               <month>2</month>
               <year>2008</year>
            </date>
         </pub>
      </history>
      <cpyrt>
         <year>2008</year>
         <collab>Xu et al; licensee BioMed Central Ltd.</collab>
         <note>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<url>http://creativecommons.org/licenses/by/2.0</url>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</note>
      </cpyrt>
      <abs>
         <sec>
            <st>
               <p>Abstract</p>
            </st>
            <sec>
               <st>
                  <p>Background</p>
               </st>
               <p>Gene conversion causes a non-reciprocal transfer of genetic information between similar sequences. Gene conversion can both homogenize genes and recruit point mutations thereby shaping the evolution of multigene families. In the rice genome, the large number of duplicated genes increases opportunities for gene conversion.</p>
            </sec>
            <sec>
               <st>
                  <p>Results</p>
               </st>
               <p>To characterize gene conversion in rice, we have defined 626 multigene families in which 377 gene conversions were detected using the GENECONV program. Over 60% of the conversions we detected were between chromosomes. We found that the inter-chromosomal conversions distributed between chromosome 1 and 5, 2 and 6, and 3 and 5 are more frequent than genome average (Z-test, P &lt; 0.05). The frequencies of gene conversion on the same chromosome decreased with the physical distance between gene conversion partners. Ka/Ks analysis indicates that gene conversion is not tightly linked to natural selection in the rice genome. To assess the contribution of segmental duplication on gene conversion statistics, we determined locations of conversion partners with respect to inter-chromosomal segment duplication. The number of conversions associated with segmentation is less than ten percent. Pseudogenes in the rice genome with low similarity to <it>Arabidopsis </it>genes showed greater likelihood for gene conversion than those with high similarity to <it>Arabidopsis </it>genes. Functional annotations suggest that at least 14 multigene families related to disease or bacteria resistance were involved in conversion events.</p>
            </sec>
            <sec>
               <st>
                  <p>Conclusion</p>
               </st>
               <p>The evolution of gene families in the rice genome may have been accelerated by conversion with pseudogenes. Our analysis suggests a possible role for gene conversion in the evolution of pathogen-response genes.</p>
            </sec>
         </sec>
      </abs>
   </fm>
   <bdy>
      <sec>
         <st>
            <p>Background</p>
         </st>
         <p>Gene conversion involves a non-reciprocal transfer of information between two homologous genes where one segment replaces nucleotides in its corresponding homolog. Gene conversion is generally considered a homogenization force on the genome, although it has two distinct consequences. In homogenization, gene conversion causes concerted evolution in gene families through reciprocal exchange of sequence between paralogs <abbrgrp><abbr bid="B1">1</abbr></abbrgrp>. However, diversification can occur, for example, when a pseudogene or otherwise unexpressed gene segment is transferred into another, functioning gene. Alteration of gene function through diversification can have advantageous consequences, such as in immune system diversification involving the major histocompatibility complex genes <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B3">3</abbr><abbr bid="B4">4</abbr></abbrgrp>.</p>
         <p>In eukaryotes, gene conversion has been classified into two types based on the conversion targets; one involves allele conversion and the other involves repeated genes. Conversion between alleles occurs at the same loci on sister-chromatids or between homologous chromosomes. Conversion events between repeated genes can occur at different loci on the same chromatid, sister-chromatids, homologous chromosomes, or non-homologous chromosomes <abbrgrp><abbr bid="B5">5</abbr></abbrgrp>. These events leave signatures in genome sequences that are detectable through specialized statistical analysis. In this study, we use such statistical methods with genome sequence data and annotations to study the gene conversion history of multigene families in the rice genome.</p>
         <p>Genome wide searches for gene conversion events between paralogs have been performed in yeast <abbrgrp><abbr bid="B6">6</abbr></abbrgrp>, <it>Caenorhabditis elegans </it><abbrgrp><abbr bid="B7">7</abbr></abbrgrp>, and mouse and rat <abbrgrp><abbr bid="B8">8</abbr></abbrgrp>. Significant evidence for gene conversion events has been detected on human chromosomes 21 and Y <abbrgrp><abbr bid="B9">9</abbr><abbr bid="B10">10</abbr><abbr bid="B11">11</abbr><abbr bid="B12">12</abbr></abbrgrp>. Analyses of selected regions of the <it>Arabidopsis thaliana </it>genome suggest that the divergence during the process of gene evolution is affected by gene conversion <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B14">14</abbr></abbrgrp>. However, prior to our work, no genome-wide conversion analysis has been reported for plants. As a result, little is known about how gene conversion influences the evolution of multigene families in plant genomes.</p>
         <p>The rice genome has evidence of ancient whole genome duplication, as well as recent chromosomal and segmental duplication <abbrgrp><abbr bid="B15">15</abbr><abbr bid="B16">16</abbr></abbrgrp>. Because of the increase in paralogs through duplication, the rice genome may have undergone potentially many gene-conversion and unequal-crossover events in its evolution. Studies of these events can enhance our understanding of evolutionary processes behind multigene families in the rice genome. Toward this end, we have mined the rice genome database <abbrgrp><abbr bid="B16">16</abbr></abbrgrp> for gene conversion traces.</p>
      </sec>
      <sec>
         <st>
            <p>Results</p>
         </st>
         <sec>
            <st>
               <p>Number and length of gene conversions detected in the rice genome</p>
            </st>
            <p>We analyzed a dataset of 626 multigene families, each family with at least three paralogs. In a total of 5274 genes, we detected 377 gene conversion events involving 513 genes in 189 families. Approximately 66% of these conversions involved sequences shorter than 100 nucleotides (Figure <figr fid="F1">1</figr>). The number of conversions identified by the detection algorithm declines rapidly as sequence length approaches zero. (See Methods for a description of the detection algorithm.) The average length of all conversions is 130 nucleotides and ranges from 4 to 1237 nucleotides. In general, the length distribution of converted regions in the rice genome is similar to those found in other species <abbrgrp><abbr bid="B6">6</abbr><abbr bid="B7">7</abbr></abbrgrp>. Short conversions with fewer than about 10 nucleotides are usually considered to be artifacts (Stanley Sawyer, personal communication). Our analysis included six conversion events involving match lengths with less than 10 nucleotides; although these six events have low reliability, their presence does not influence the interpretation of our results.</p>
            <fig id="F1">
               <title>
                  <p>Figure 1</p>
               </title>
               <caption>
                  <p>Distribution of gene conversion regions in the rice genome</p>
               </caption>
               <text>
                  <p><b>Distribution of gene conversion regions in the rice genome</b>. Sixty-nine percent of all regions are shorter than 100 nucleotides. The number of conversions decreases as conversion length decreases.</p>
               </text>
               <graphic file="1471-2164-9-93-1"/>
            </fig>
            <p>Gene conversion with pseudogenes may accelerate gene family evolution; in this model, pseudogenes are postulated as a source of genetic information. The introduction of genetic material from pseudogenes may lead to higher divergence in orthologs between rice and related species. To test this hypothesis, we established rice gene families as having either low similarity (LS) or high similarity (HS) to <it>Arabidopsis thaliana</it>. HS gene families are defined as having statistically significant sequence similarity to <it>Arabidopsis </it>genes. Conversely, LS gene families have low similarity to <it>Arabidopsis</it>. It follows that LS gene families are more likely to be rice specific.</p>
            <p>We categorized the 377 conversions detected in 50 LS and 327 HS gene families as described in Methods. Among the 377 conversion events, we identified those conversions involving pseudogenes in LS and HS families. The fraction of pseudogenes was approximately 56% in the LS families and 21% in the HS families (Table <tblr tid="T1">1</tblr>).</p>
            <tbl id="T1">
               <title>
                  <p>Table 1</p>
               </title>
               <caption>
                  <p>Genes with low similarity to <it>Arabidopsis </it>were found to have more gene-conversion events than genes with high similarity. * Fisher's Exact Test P value &lt; 0.01.</p>
               </caption>
               <tblbdy cols="4">
                  <r>
                     <c>
                        <p/>
                     </c>
                     <c ca="left">
                        <p>
                           <b>Total</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>with pseudogenes</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>Percent</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="4">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>LS</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>50</p>
                     </c>
                     <c ca="left">
                        <p>28*</p>
                     </c>
                     <c ca="left">
                        <p>56.0%</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>
                           <b>HS</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>327</p>
                     </c>
                     <c ca="left">
                        <p>70</p>
                     </c>
                     <c ca="left">
                        <p>21.4%</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <p>To rule out effects from assembly artifacts on our study, we performed a similar analysis on the <it>japonica </it>rice genome published by The International Rice Genome Sequencing Project (IRGSP) <abbrgrp><abbr bid="B17">17</abbr></abbrgrp>. The gene conversion characteristics were indistinguishable between the two assemblies (data not shown).</p>
         </sec>
         <sec>
            <st>
               <p>Distribution of conversion events on the chromosomes</p>
            </st>
            <p>Our analysis of the rice genome detected 513 genes likely to be involved in 377 conversion events. To determine the distribution of gene conversion across the genome, we mapped the converted genes to chromosomes (Table <tblr tid="T2">2</tblr>). We were also interested in chromosomes with more conversions than the average number of conversions per unit length. To assess this, we estimated that the average number of conversions per million nucleotides for the entire genome was ~1.361. Based on the average frequency of 1.361 conversions per megabase, the number of conversions was found to be relatively uniform as a function of length for each chromosome. In the 377 events, 148 conversion pairings occurred within the same chromosome (~39%) as intra-chromosomal conversions; 229 conversion events occurred between chromosomes (~61%) as inter-chromosomal conversions.</p>
            <tbl id="T2">
               <title>
                  <p>Table 2</p>
               </title>
               <caption>
                  <p>The number of genes involved in conversions on each chromosome compared to the estimated number based on chromosome length. The estimated number is the total number of conversions in the genome divided by the genome sequence length.</p>
               </caption>
               <tblbdy cols="3">
                  <r>
                     <c ca="left">
                        <p>
                           <b>Chromosome</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>Genes with conversions</b>
                        </p>
                     </c>
                     <c ca="left">
                        <p>
                           <b>Estimated genes with conversions</b>
                        </p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr01</p>
                     </c>
                     <c ca="left">
                        <p>70</p>
                     </c>
                     <c ca="left">
                        <p>64.3</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr02</p>
                     </c>
                     <c ca="left">
                        <p>45</p>
                     </c>
                     <c ca="left">
                        <p>51.9</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr03</p>
                     </c>
                     <c ca="left">
                        <p>66</p>
                     </c>
                     <c ca="left">
                        <p>57.0</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr04</p>
                     </c>
                     <c ca="left">
                        <p>37</p>
                     </c>
                     <c ca="left">
                        <p>47.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr05</p>
                     </c>
                     <c ca="left">
                        <p>47</p>
                     </c>
                     <c ca="left">
                        <p>42.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr06</p>
                     </c>
                     <c ca="left">
                        <p>49</p>
                     </c>
                     <c ca="left">
                        <p>44.8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr07</p>
                     </c>
                     <c ca="left">
                        <p>41</p>
                     </c>
                     <c ca="left">
                        <p>39.1</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr08</p>
                     </c>
                     <c ca="left">
                        <p>65</p>
                     </c>
                     <c ca="left">
                        <p>41.4</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr09</p>
                     </c>
                     <c ca="left">
                        <p>27</p>
                     </c>
                     <c ca="left">
                        <p>29.8</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr10</p>
                     </c>
                     <c ca="left">
                        <p>28</p>
                     </c>
                     <c ca="left">
                        <p>30.9</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr11</p>
                     </c>
                     <c ca="left">
                        <p>20</p>
                     </c>
                     <c ca="left">
                        <p>31.5</p>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Chr12</p>
                     </c>
                     <c ca="left">
                        <p>18</p>
                     </c>
                     <c ca="left">
                        <p>32.4</p>
                     </c>
                  </r>
                  <r>
                     <c cspan="3">
                        <hr/>
                     </c>
                  </r>
                  <r>
                     <c ca="left">
                        <p>Total</p>
                     </c>
                     <c ca="left">
                        <p>513</p>
                     </c>
                     <c ca="left">
                        <p>513</p>
                     </c>
                  </r>
               </tblbdy>
            </tbl>
            <p>From a total of 3844 gene pairs in the 626 multigene families, 2903 pairs were located on different chromosomes, with 941 pairs co-located on the same chromosome. It follows that the proportion of inter-chromosomal pairs involved in conversions was ~8% (229/2903), and intra-chromosomal pairs involved in conversions was ~16% (148/941). Although the number of inter-chromosomal conversion events was higher than intra-chromosomal conversion, the inter-chromosomal fraction was lower with respect to the potential for conversion based on total gene pairs. Thus, candidate pairs on the same chromosome apparently result in a higher likelihood for gene conversion. This does not necessarily represent an intrinsic bias for intra-chromosomal gene conversion; alternatively, it may represent an opportunistic positioning for gene conversion to occur.</p>
            <p>The 229 inter-chromosomal conversion events are distributed non-uniformly among the twelve chromosomes of the rice genome. The conversion events are significantly more frequent between chromosomes 1 and 5, 2 and 6, and 3 and 5 than the average (Z-test, P &lt; 0.05). The conversion distributions are shown in Figure <figr fid="F2">2</figr> for each chromosome.</p>
            <fig id="F2">
               <title>
                  <p>Figure 2</p>
               </title>
               <caption>
                  <p>Gene conversion distribution on the twelve rice chromosomes</p>
               </caption>
               <text>
                  <p><b>Gene conversion distribution on the twelve rice chromosomes</b>. The two genes in each gene pair identified in a conversion are connected with a line. The line thickness indicates the frequency of the gene conversion between the corresponding chromosomes. The highest inter-chromosomal conversion frequencies were detected between chromosomes 1 and 5, 2 and 6, and 3 and 5.</p>
               </text>
               <graphic file="1471-2164-9-93-2"/>
            </fig>
            <p>To determine the extent of segmental duplication on the observed conversion events, we compared conversion data with duplicated segments in the Beijing <it>indica </it>assembly <abbrgrp><abbr bid="B16">16</abbr></abbrgrp>. For all 229 inter-chromosome conversion events, only 21 out of 229 (~9%) inter-chromosome conversion events were involved in the segmental duplications.</p>
         </sec>
         <sec>
            <st>
               <p>Conversion bias based on sequence similarity and orientation</p>
            </st>
            <p>To compare the sequence similarity of gene pairs involved in conversions to gene pairs not involved in conversions, we aligned entire gene sequences as described in Methods. The fraction of gene pairs involved in conversion events had significantly higher sequence similarity compared to all gene pairs (Figure <figr fid="F3">3</figr>). To test if the converted regions themselves influenced the higher similarity in the conversion group, we also calculated similarities of genes in conversion pairs, omitting the converted regions from the analysis. No significant difference was found between before and after omitting the converted regions (data not shown); the higher sequence similarity of gene pairs involved in conversion was not only a feature of the converted regions. In fact, most gene pairs not involved in conversions share statistically significant similarities in about 30&#8211;60% of their sequences with an average sequence similarity of 45%. In contrast, gene pairs involved in conversions exhibit a greater sequence similarity in the range of 60&#8211;80%. These results are consistent with findings that gene conversion is favored between similar genes <abbrgrp><abbr bid="B18">18</abbr></abbrgrp>.</p>
            <fig id="F3">
               <title>
                  <p>Figure 3</p>
               </title>
               <caption>
                  <p>Gene conversions are favored between similar genes</p>
               </caption>
               <text>
                  <p><b>Gene conversions are favored between similar genes</b>. Sequence similarities were calculated for homologs involved in gene conversions and for all homologs.</p>
               </text>
               <graphic file="1471-2164-9-93-3"/>
            </fig>
            <p>For the 148 intra-chromosomal conversions, the conversion frequency decreased with the physical distance between gene pairs along the chromosome (Figure <figr fid="F4">4</figr>). The gene pairs separated by less than 5 kb demonstrated the highest conversion frequency; these could be considered closely linked genes. For gene pairs separated by more than ~35 kb, conversion was infrequent.</p>
            <fig id="F4">
               <title>
                  <p>Figure 4</p>
               </title>
               <caption>
                  <p>Intra-chromosomal gene conversions frequencies</p>
               </caption>
               <text>
                  <p><b>Intra-chromosomal gene conversions frequencies</b>. The frequency of an intra-chromosomal conversion decreases as the distance between the gene pair increases.</p>
               </text>
               <graphic file="1471-2164-9-93-4"/>
            </fig>
            <p>The directions between gene pairs were also examined. Among the 3844 gene pairs, 2172 had the same direction and 1672 had reverse directions. In the 377 conversion events, 277 (60%) occurred between gene pairs with the same direction (See details in Additional File <supplr sid="S1">1</supplr>). The proportions of conversions with same-direction gene pairs (227/2172 = ~10%) and reverse-direction gene pairs (150/1672 = ~9%) were similar. The larger number of gene conversion events in the same direction coincides with the larger number of gene pairs in the same direction; however, from our data we cannot determine whether the conversion bias is an intrinsic preference.</p>
            <suppl id="S1">
               <title>
                  <p>Additional file 1</p>
               </title>
               <text>
                  <p>Annotation of genes involved in conversion events in rice genome. Detailed information of the 377 gene conversions in the rice genome including accession number, genomic location, length, direction and functional annotation.</p>
               </text>
               <file name="1471-2164-9-93-S1.xls">
                  <p>Click here for file</p>
               </file>
            </suppl>
         </sec>
         <sec>
            <st>
               <p>Evolutionary selection correlated to gene function</p>
            </st>
            <p>To determine if gene pairs involved in conversions are subject to evolutionary selection pressure, synonymous substitution rates (Ks) and non-synonymous substitution rates (Ka) were used. The Ka/Ks ratio can reflect the selection pressure between gene pairs caused by evolutionary processes. We calculated and compared the Ka/Ks ratios for two groups: (1) the closest homologs in each multigene family where at least one homolog was involved in gene conversion and (2) all close homologs in each multigene family (see Methods). The Ka/Ks profiles for the two groups were indistinguishable (data not shown).</p>
            <p>We assessed the function of genes involved in conversions using the protein <it>nr </it>database at NCBI <abbrgrp><abbr bid="B19">19</abbr></abbrgrp>. Although the function of many genes is presently unknown, we identified approximately14 gene families involved in conversions to be related to disease or bacteria resistance. These include genes coding for phospholipase D, cytochrome P450, receptor-like kinase and receptor kinase-like proteins. Some conversions were also found in related <it>Arabidopsis </it>gene families <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B20">20</abbr></abbrgrp>. (See details in Additional File <supplr sid="S1">1</supplr>). The highest conversion frequency was found in the phospholipase D (AK070203) gene family. Phospholipase D has been identified as an enzyme generating secondary messengers in plants, triggering defense against bacterial attacks <abbrgrp><abbr bid="B21">21</abbr></abbrgrp>.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Discussion</p>
         </st>
         <p>The proliferation of duplications during the evolution of the rice genome may have increased the potential for gene conversion and crossover events within multigene families through an increase in donor sequences. In our analysis of rice, the likelihood for gene conversion was found to be greater between pairs on the same chromosome than pairs on different chromosomes, even though more pairs were found for the latter case. The large number of duplicated repeats between chromosomes provides numerous opportunities for inter-chromosomal gene conversion. That only ~9% of gene conversion occurred between pairs involved in inter-chromosome segmental duplications indicates that the observed conversions were primarily from other sources.</p>
         <p>Our analysis considers fragments with uncharacteristically high similarity as candidates for gene conversion. High-similarity between fragments may also be caused by strong stabilizing selection. However, the fragments identified in gene conversion events are situated in spans of sequence flanked by sequence with low similarity. The low-similarity context suggests gene conversion and unequal crossing over as possible explanations for the high-similarity inner fragments.</p>
         <p>We mapped all identified conversions onto the rice genome sequence (Figure <figr fid="F2">2</figr>). The most frequent conversions were between chromosomes 1 and 5, 2 and 6, and 3 and 5. Our data show a decrease in intra-chromosomal gene conversion frequency as the distance between genes increase. This distance dependence corresponds to previous genome-wide studies of yeast <abbrgrp><abbr bid="B6">6</abbr><abbr bid="B7">7</abbr></abbrgrp>. In <it>C. elegans</it>, a high proportion of conversion was observed between tandemly duplicated members of gene families <abbrgrp><abbr bid="B7">7</abbr></abbrgrp>. The higher conversion frequency between genes with short separation on the same chromosome may be a consequence of a relationship between conversion and recombination. In <it>Arabidopsis</it>, it was found that the upper limit of pairwise distance between genes involved in conversion is 40 kb <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>. This is similar to the value we found in the rice genome (Figure <figr fid="F4">4</figr>).</p>
         <p>Conversions involving pseudogenes could accelerate gene family evolution, and may accelerate divergence of some gene families relative to their orthologs. In this study, we found that pseudogenes are more prone to participate in gene conversion in the LS gene families than in HS gene families in the rice genome. Thus, conversion with pseudogenes in LS gene families may contribute to the acceleration of LS gene evolution. The rationale behind this is linked to the susceptibility of pseudogenes to accumulate mutations more rapidly than expressed genes, which may then be transferred to conversion partners. This may occur where pseudogene fragments are recruited into functional genes. By definition, LS genes have low similarity with <it>Arabidopsis</it>, which means LS gene families are potentially rice-specific. Based on this, we can postulate that inter-conversion with pseudogenes may be a source of rice-specific genes. A similar mechanism is suspected for some human speciation events <abbrgrp><abbr bid="B22">22</abbr></abbrgrp>. Moreover, our findings support the view that pseudogenes contain potential material for new genes <abbrgrp><abbr bid="B23">23</abbr></abbrgrp>.</p>
         <p>The question remains whether genes involved in conversions are subject to selective pressure that differs from non-converted genes. A mechanism has been suggested that favors selection of some gene clusters in the tomato plant exhibiting traces of gene conversion and conferring disease resistance <abbrgrp><abbr bid="B24">24</abbr></abbrgrp>. But does this occur in rice and is it genome wide? We calculated Ka and Ks values and their ratios for groups of gene with and without conversions &#8211; no differences were observed between the two groups. These similar Ka/Ks ratios may indicate that the genes involved in conversions were not subject to significant selective pressure. The indistinguishable Ka/Ks ratios of gene pairs involved in conversion imply that the genome-wide gene conversions were not tightly linked to selection pressure in the rice genome. As suggested by Mondragon-Palomino and Gaut, these indistinguishable Ka/Ks ratios may be a result of both methodological and biological influences <abbrgrp><abbr bid="B13">13</abbr></abbrgrp>. Inter-conversions through recombination and gene conversion may also influence the accuracy of Ka/Ks analysis <abbrgrp><abbr bid="B25">25</abbr></abbrgrp>. Although the co-occurrence of gene conversion and positive selection has been found in some studies, there is evidence that gene conversion is independent of positive selection <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B26">26</abbr></abbrgrp>.</p>
         <p>The diversification within gene families could be caused by conversion with variant paralogs <abbrgrp><abbr bid="B27">27</abbr></abbrgrp>. This mechanism has been widely observed in mammalian immune systems <abbrgrp><abbr bid="B2">2</abbr><abbr bid="B28">28</abbr><abbr bid="B29">29</abbr></abbrgrp>. In tomato and <it>Arabidopsis</it>, gene conversion has been detected in genes related to disease and bacteria resistance <abbrgrp><abbr bid="B13">13</abbr><abbr bid="B24">24</abbr></abbrgrp>. Our genome-wide analysis of rice identified at least fourteen such genes potentially influenced by gene conversion events. Some of these genes have counterparts in <it>Arabidopsis </it><abbrgrp><abbr bid="B13">13</abbr></abbrgrp>, while others were specific to rice. Our results contribute to the view that intergenic gene conversion can create variety within a gene family, providing a mechanism for the adaptive evolution, such as disease resistance <abbrgrp><abbr bid="B3">3</abbr></abbrgrp>. The diversified paralogs conferring disease resistance would be advantageous for adaptive reorganization and response to various diseases or bacteria.</p>
      </sec>
      <sec>
         <st>
            <p>Conclusion</p>
         </st>
         <p>We have detected 377 gene conversion events in the rice genome. The overall characteristics of gene conversion in the rice genome suggest influences by extensive duplication events throughout the evolution of rice. Our data further suggest that conversion with pseudogenes may have accelerated the evolution of multigene families. In particular, the adaptive evolution of disease resistance in rice may have been significantly influenced by gene conversion.</p>
      </sec>
      <sec>
         <st>
            <p>Methods</p>
         </st>
         <sec>
            <st>
               <p>Gene families</p>
            </st>
            <p>The initial 28,469 full-length rice cDNA sequences were downloaded from RIKEN and FAIS centers <abbrgrp><abbr bid="B30">30</abbr></abbrgrp>. We aligned these cDNAs to the <it>Oryza sativa indica </it>genome sequence using BLAT <abbrgrp><abbr bid="B31">31</abbr></abbrgrp>. We removed the following sequences: redundant genes, namely those that are the smaller cDNA of two alignments with overlap of at least 100 bp; unlikely protein coding genes with open reading frames less than 100 amino acids; and those sequences with more than 10% transposon-like content identified by using RepeatMasker with RepBase <abbrgrp><abbr bid="B32">32</abbr></abbrgrp>. Eventually, 13,089 reliable protein-coding genes were obtained <abbrgrp><abbr bid="B33">33</abbr></abbrgrp> and used as consensus sequences.</p>
            <p>Paralogs in the rice genome (Indica 9311) were identified based on similarity with the 13,089 reference protein sequences using BLAST <abbrgrp><abbr bid="B34">34</abbr></abbrgrp>. The pipeline used to identify paralogs is similar to the FGF approach <abbrgrp><abbr bid="B35">35</abbr></abbrgrp>. The reference protein sequence was defined as the consensus sequence for each family. The members of gene families were defined by alignments with at least 80% similarity over 70% of the corresponding consensus sequence. If the subject sequence exhibited significant similarity to more than one consensus protein, we considered only the highest-scoring match. The family members were aligned together with the consensus protein sequence using GeneWise <abbrgrp><abbr bid="B36">36</abbr></abbrgrp>.</p>
            <p>Families with more than two genes were defined as multigene families. In the 626 multigene families, we identified 3824 gene pairs; a gene pair is defined as one gene and its closest homolog in the same family. We defined high-similarity (HS) genes as those with a homolog in <it>Arabidopsis </it>and low-similarity (LS) as those without. LS genes and HS genes were identified based on tblastn searches using an E-value threshold of 10<sup>-7</sup>as previously reported <abbrgrp><abbr bid="B16">16</abbr></abbrgrp>, involving at least 50% of a given <it>Arabidopsis </it>protein or 100 amino acids. The cDNAs were aligned to protein sequences also using GeneWise. Those cDNAs containing multiple stop codons or frame-shift mutations were considered to be pseudogenes.</p>
         </sec>
         <sec>
            <st>
               <p>Detection of Gene Conversion Events</p>
            </st>
            <p>The aligned sequences within the multigene families were used to detect conversion events using the GENECONV program version 1.81 <abbrgrp><abbr bid="B37">37</abbr></abbrgrp>. This program detects pairs of sequences that share unusually long stretches of similarity in regions of overall lower similarity <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. The methods used by GENECONV make it difficult to detect conversion events as candidate region lengths approach zero, i.e., for very short sequences. For example, if a conversion event contains only 3 bp of information, we cannot confidently assert the criterion of unusually long stretches of similarity, a signature of gene conversion. Both global and pairwise P-values were calculated based on 1000 permutations of original data and a BLAST-like searching algorithm.</p>
            <p>We only used P-values from global fragments, which were multiple comparisons corrected for all possible sequence pairs. The g2 option provided by GENECONV was used to allow some accumulation of mutations in conversion regions following a candidate conversion event. With the g2 option, all multigene families that had global P-values less than 0.05 for inner fragments were considered as statistical significance requirement for conversion events; 215 of the detected pairs had P-values less than 0.01, and 162 had with P-value higher than 0.01 but less than 0.05. The inner fragment indicates a possible gene conversion event between ancestors of the two sequences in the alignment where the outer fragments have diverged.</p>
            <p>The lengths of the converted regions were also determined using the multiple-sequence alignment used by GENECONV. We removed the gaps involved in the conversion regions of both paralogs to compensate for multiple-sequence alignment effects thereby improving the length estimate for the conversion regions. The lengths were also checked manually against pairwise alignments using randomly selected pairs without a significant difference with our multiple-sequence alignment analysis.</p>
            <p>We compared all paralogs in each gene family. If the paralogs of a family shared more than 95% similarity, we only considered one of them as a conversion partner with other high-scoring alignments designated as members of the gene family. The goal of this step was to eliminate conversion copies resulting from subfamilies with recent duplications.</p>
         </sec>
         <sec>
            <st>
               <p>Similarity, direction, distance and evolutionary selection analysis</p>
            </st>
            <p>The similarities between gene pairs were estimated based on their cDNA sequences. Sequence alignments and similarity scores were calculated between all paralogs within each multigene family. The genes were mapped onto the genome sequence using TBLASTN; direction and distance between gene pairs were determined from the physical map. The expected number of genes involved in conversion events on each chromosome was estimated based on the length of chromosomes. In computing sequence similarity, we compared the sequences with and without the identified converted region to exclude the contribution of converted sequence to the overall score.</p>
            <p>Ka and Ks values of gene pairs were calculated using the LPB93 method <abbrgrp><abbr bid="B38">38</abbr></abbrgrp>. Ka/Ks ratios were compared between gene pairs for gene-conversion partners consisting of 3824 pairs in 626 multigene families. To increase the calculation sensitivity, gene pairs with Ks > 1 were removed because the Ka/Ks calculations by LPB93 may not be reliable for highly diverged gene pairs. Functional information for gene families involved in gene conversion were obtained from NCBI <abbrgrp><abbr bid="B39">39</abbr></abbrgrp>.</p>
         </sec>
      </sec>
      <sec>
         <st>
            <p>Abbreviations</p>
         </st>
         <p>LS, low similarity to <it>Arabidopsis; </it>HS, high similarity to <it>Arabidopsis; </it>IRGSP, International Rice Genome Sequencing Project.</p>
      </sec>
      <sec>
         <st>
            <p>Authors' contributions</p>
         </st>
         <p>SX and HZ conducted the analysis. SX, HZ, SV and TC wrote the manuscript. GKSW and RL participated in the data analysis. SX, HZ, JW and XZ designed the study. All authors read and approved the final manuscript.</p>
      </sec>
   </bdy>
   <bm>
      <ack>
         <sec>
            <st>
               <p>Acknowledgements</p>
            </st>
            <p>This project was supported by Chinese Academy of Sciences (KSCX2-YW-N-023; GJHZ0518), Ministry of Science and Technology under high-tech program 863 (2006AA02Z334; 2006AA10A121), Beijing Municipal Science and Technology Commission (D07030200740000), and National Natural Science Foundation of China (90608010; 90208019; 90403130; 30221004; 90612019; 30392130). Other support came from Ole R&#248;mer grants from the Danish Natural Science Research Council and the Danish Medical Research Council.</p>
         </sec>
      </ack>
      <refgrp>
         <bibl id="B1">
            <title>
               <p>The effect of gene conversion on the divergence between duplicated genes</p>
            </title>
            <aug>
               <au>
                  <snm>Teshima</snm>
                  <fnm>KM</fnm>
               </au>
               <au>
                  <snm>Innan</snm>
                  <fnm>H</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2004</pubdate>
            <volume>166</volume>
            <issue>3</issue>
            <fpage>1553</fpage>
            <lpage>1560</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1470786</pubid>
                  <pubid idtype="pmpid" link="fulltext">15082568</pubid>
                  <pubid idtype="doi">10.1534/genetics.166.3.1553</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B2">
            <title>
               <p>The Structure of a Mutant H-2-Gene Suggests That the Generation of Polymorphism in H-2 Genes May Occur by Gene Conversion-Like Events</p>
            </title>
            <aug>
               <au>
                  <snm>Weiss</snm>
                  <fnm>EH</fnm>
               </au>
               <au>
                  <snm>Mellor</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Golden</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Fahrner</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Simpson</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Hurst</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Flavell</snm>
                  <fnm>RA</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>1983</pubdate>
            <volume>301</volume>
            <issue>5902</issue>
            <fpage>671</fpage>
            <lpage>674</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/301671a0</pubid>
                  <pubid idtype="pmpid">6828150</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B3">
            <title>
               <p>The gene conversion hypothesis of MHC evolution: a review</p>
            </title>
            <aug>
               <au>
                  <snm>Martinsohn</snm>
                  <fnm>JT</fnm>
               </au>
               <au>
                  <snm>Sousa</snm>
                  <fnm>AB</fnm>
               </au>
               <au>
                  <snm>Guethlein</snm>
                  <fnm>LA</fnm>
               </au>
               <au>
                  <snm>Howard</snm>
                  <fnm>JC</fnm>
               </au>
            </aug>
            <source>Immunogenetics</source>
            <pubdate>1999</pubdate>
            <volume>50</volume>
            <issue>3&#8211;4</issue>
            <fpage>168</fpage>
            <lpage>200</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/s002510050593</pubid>
                  <pubid idtype="pmpid" link="fulltext">10602879</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B4">
            <title>
               <p>Relative roles of mutation and recombination in generating allelic polymorphism at an MHC class II locus in Peromyseus maniculatus</p>
            </title>
            <aug>
               <au>
                  <snm>Richman</snm>
                  <fnm>AD</fnm>
               </au>
               <au>
                  <snm>Herrera</snm>
                  <fnm>LG</fnm>
               </au>
               <au>
                  <snm>Nash</snm>
                  <fnm>D</fnm>
               </au>
               <au>
                  <snm>Schierup</snm>
                  <fnm>MH</fnm>
               </au>
            </aug>
            <source>Genet Res</source>
            <pubdate>2003</pubdate>
            <volume>82</volume>
            <issue>2</issue>
            <fpage>89</fpage>
            <lpage>99</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1017/S0016672303006347</pubid>
                  <pubid idtype="pmpid">14768893</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B5">
            <title>
               <p>Recombination between Repeated Genes in Microorganisms</p>
            </title>
            <aug>
               <au>
                  <snm>Petes</snm>
                  <fnm>TD</fnm>
               </au>
               <au>
                  <snm>Hill</snm>
                  <fnm>CW</fnm>
               </au>
            </aug>
            <source>Annu Rev Genet</source>
            <pubdate>1988</pubdate>
            <volume>22</volume>
            <fpage>147</fpage>
            <lpage>168</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1146/annurev.ge.22.120188.001051</pubid>
                  <pubid idtype="pmpid" link="fulltext">3071247</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B6">
            <title>
               <p>Characterization of the gene conversions between the multigene family members of the yeast genome</p>
            </title>
            <aug>
               <au>
                  <snm>Drouin</snm>
                  <fnm>G</fnm>
               </au>
            </aug>
            <source>J Mol Evol</source>
            <pubdate>2002</pubdate>
            <volume>55</volume>
            <issue>1</issue>
            <fpage>14</fpage>
            <lpage>23</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/s00239-001-0085-y</pubid>
                  <pubid idtype="pmpid" link="fulltext">12165839</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B7">
            <title>
               <p>Gene duplication and gene conversion in the Caenorhabditis elegans genome</p>
            </title>
            <aug>
               <au>
                  <snm>Semple</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Wolfe</snm>
                  <fnm>KH</fnm>
               </au>
            </aug>
            <source>J Mol Evol</source>
            <pubdate>1999</pubdate>
            <volume>48</volume>
            <issue>5</issue>
            <fpage>555</fpage>
            <lpage>564</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/PL00006498</pubid>
                  <pubid idtype="pmpid" link="fulltext">10198121</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B8">
            <title>
               <p>Proceedings of the SMBE Tri-National Young Investigators' Workshop 2005. Genome-wide search of gene conversions in duplicated genes of mouse and rat</p>
            </title>
            <aug>
               <au>
                  <snm>Ezawa</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>S</snm>
                  <fnm>OO</fnm>
               </au>
               <au>
                  <snm>Saitou</snm>
                  <fnm>N</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2006</pubdate>
            <volume>23</volume>
            <issue>5</issue>
            <fpage>927</fpage>
            <lpage>940</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msj093</pubid>
                  <pubid idtype="pmpid" link="fulltext">16407460</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B9">
            <title>
               <p>Estimating the rate of gene conversion on human chromosome 21</p>
            </title>
            <aug>
               <au>
                  <snm>Padhukasahasram</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Marjoram</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Nordborg</snm>
                  <fnm>M</fnm>
               </au>
            </aug>
            <source>Am J Hum Genet</source>
            <pubdate>2004</pubdate>
            <volume>75</volume>
            <issue>3</issue>
            <fpage>386</fpage>
            <lpage>397</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1182018</pubid>
                  <pubid idtype="pmpid" link="fulltext">15250027</pubid>
                  <pubid idtype="doi">10.1086/423451</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B10">
            <title>
               <p>Intense and highly localized gene conversion activity in human meiotic crossover hot spots</p>
            </title>
            <aug>
               <au>
                  <snm>Jeffreys</snm>
                  <fnm>AJ</fnm>
               </au>
               <au>
                  <snm>May</snm>
                  <fnm>CA</fnm>
               </au>
            </aug>
            <source>Nat Genet</source>
            <pubdate>2004</pubdate>
            <volume>36</volume>
            <issue>2</issue>
            <fpage>151</fpage>
            <lpage>156</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/ng1287</pubid>
                  <pubid idtype="pmpid" link="fulltext">14704667</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B11">
            <title>
               <p>Abundant gene conversion between arms of palindromes in human and ape Y chromosomes</p>
            </title>
            <aug>
               <au>
                  <snm>Rozen</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Skaletsky</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Marszalek</snm>
                  <fnm>JD</fnm>
               </au>
               <au>
                  <snm>Minx</snm>
                  <fnm>PJ</fnm>
               </au>
               <au>
                  <snm>Cordum</snm>
                  <fnm>HS</fnm>
               </au>
               <au>
                  <snm>Waterston</snm>
                  <fnm>RH</fnm>
               </au>
               <au>
                  <snm>Wilson</snm>
                  <fnm>RK</fnm>
               </au>
               <au>
                  <snm>Page</snm>
                  <fnm>DC</fnm>
               </au>
            </aug>
            <source>Nature</source>
            <pubdate>2003</pubdate>
            <volume>423</volume>
            <issue>6942</issue>
            <fpage>873</fpage>
            <lpage>876</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature01723</pubid>
                  <pubid idtype="pmpid" link="fulltext">12815433</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B12">
            <title>
               <p>Dynamics of a human interparalog gene conversion hotspot</p>
            </title>
            <aug>
               <au>
                  <snm>Bosch</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Hurles</snm>
                  <fnm>ME</fnm>
               </au>
               <au>
                  <snm>Navarro</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Jobling</snm>
                  <fnm>MA</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2004</pubdate>
            <volume>14</volume>
            <issue>5</issue>
            <fpage>835</fpage>
            <lpage>844</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">479110</pubid>
                  <pubid idtype="pmpid" link="fulltext">15123583</pubid>
                  <pubid idtype="doi">10.1101/gr.2177404</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B13">
            <title>
               <p>Gene conversion and the evolution of three leucine-rich repeat gene families in Arabidopsis thaliana</p>
            </title>
            <aug>
               <au>
                  <snm>Mondragon-Palomino</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Gaut</snm>
                  <fnm>BS</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>2005</pubdate>
            <volume>22</volume>
            <issue>12</issue>
            <fpage>2444</fpage>
            <lpage>2456</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1093/molbev/msi241</pubid>
                  <pubid idtype="pmpid" link="fulltext">16120808</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B14">
            <title>
               <p>Recombination and gene conversion in a 170-kb genomic region of Arabidopsis thaliana</p>
            </title>
            <aug>
               <au>
                  <snm>Haubold</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Kroymann</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ratzka</snm>
                  <fnm>A</fnm>
               </au>
               <au>
                  <snm>Mitchell-Olds</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Wiehe</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2002</pubdate>
            <volume>161</volume>
            <issue>3</issue>
            <fpage>1269</fpage>
            <lpage>1278</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1462186</pubid>
                  <pubid idtype="pmpid" link="fulltext">12136029</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B15">
            <title>
               <p>A draft sequence of the rice genome (Oryza sativa L. ssp indica)</p>
            </title>
            <aug>
               <au>
                  <snm>Yu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Hu</snm>
                  <fnm>SN</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wong</snm>
                  <fnm>GKS</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>SG</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>B</fnm>
               </au>
               <au>
                  <snm>Deng</snm>
                  <fnm>YJ</fnm>
               </au>
               <au>
                  <snm>Dai</snm>
                  <fnm>L</fnm>
               </au>
               <au>
                  <snm>Zhou</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>XQ</fnm>
               </au>
               <etal/>
            </aug>
            <source>Science</source>
            <pubdate>2002</pubdate>
            <volume>296</volume>
            <issue>5565</issue>
            <fpage>79</fpage>
            <lpage>92</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1068037</pubid>
                  <pubid idtype="pmpid" link="fulltext">11935017</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B16">
            <title>
               <p>The Genomes of Oryza sativa: A history of duplications</p>
            </title>
            <aug>
               <au>
                  <snm>Yu</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Lin</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>SG</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Zhou</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ni</snm>
                  <fnm>PX</fnm>
               </au>
               <au>
                  <snm>Dong</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Hu</snm>
                  <fnm>SN</fnm>
               </au>
               <au>
                  <snm>Zeng</snm>
                  <fnm>CQ</fnm>
               </au>
               <etal/>
            </aug>
            <source>PLoS Biol</source>
            <pubdate>2005</pubdate>
            <volume>3</volume>
            <issue>2</issue>
            <fpage>e38</fpage>
            <lpage/>
            <note>Epub 2005 Feb 1.</note>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1371/journal.pbio.0030038</pubid>
                  <pubid idtype="pmpid" link="fulltext">15685292</pubid>
                  <pubid idtype="pmcid">546038</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B17">
            <title>
               <p>The map-based sequence of the rice genome</p>
            </title>
            <source>Nature</source>
            <pubdate>2005</pubdate>
            <volume>436</volume>
            <issue>7052</issue>
            <fpage>793</fpage>
            <lpage>800</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1038/nature03895</pubid>
                  <pubid idtype="pmpid" link="fulltext">16100779</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B18">
            <title>
               <p>Mismatch repair in replication fidelity, genetic recombination, and cancer biology</p>
            </title>
            <aug>
               <au>
                  <snm>Modrich</snm>
                  <fnm>P</fnm>
               </au>
               <au>
                  <snm>Lahue</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Annu Rev Biochem</source>
            <pubdate>1996</pubdate>
            <volume>65</volume>
            <fpage>101</fpage>
            <lpage>133</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1146/annurev.bi.65.070196.000533</pubid>
                  <pubid idtype="pmpid" link="fulltext">8811176</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B19">
            <title>
               <p>Database resources of the National Center for Biotechnology Information</p>
            </title>
            <aug>
               <au>
                  <snm>Wheeler</snm>
                  <fnm>DL</fnm>
               </au>
               <au>
                  <snm>Barrett</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Benson</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Bryant</snm>
                  <fnm>SH</fnm>
               </au>
               <au>
                  <snm>Canese</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Chetvernin</snm>
                  <fnm>V</fnm>
               </au>
               <au>
                  <snm>Church</snm>
                  <fnm>DM</fnm>
               </au>
               <au>
                  <snm>DiCuccio</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Edgar</snm>
                  <fnm>R</fnm>
               </au>
               <au>
                  <snm>Federhen</snm>
                  <fnm>S</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2007</pubdate>
            <issue>35 Database</issue>
            <fpage>D5</fpage>
            <lpage>12</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1781113</pubid>
                  <pubid idtype="pmpid" link="fulltext">17170002</pubid>
                  <pubid idtype="doi">10.1093/nar/gkl1031</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B20">
            <title>
               <p>Substitution rate comparisons between grasses and palms: Synonymous rate differences at the nuclear gene Adh parallel rate differences at the plastid gene rbcL</p>
            </title>
            <aug>
               <au>
                  <snm>Gaut</snm>
                  <fnm>BS</fnm>
               </au>
               <au>
                  <snm>Morton</snm>
                  <fnm>BR</fnm>
               </au>
               <au>
                  <snm>McCaig</snm>
                  <fnm>BC</fnm>
               </au>
               <au>
                  <snm>Clegg</snm>
                  <fnm>MT</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1996</pubdate>
            <volume>93</volume>
            <issue>19</issue>
            <fpage>10274</fpage>
            <lpage>10279</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">38374</pubid>
                  <pubid idtype="pmpid" link="fulltext">8816790</pubid>
                  <pubid idtype="doi">10.1073/pnas.93.19.10274</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B21">
            <title>
               <p>Phospholipid signalling in plant defence</p>
            </title>
            <aug>
               <au>
                  <snm>Laxalt</snm>
                  <fnm>AM</fnm>
               </au>
               <au>
                  <snm>Munnik</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Curr Opin Plant Biol</source>
            <pubdate>2002</pubdate>
            <volume>5</volume>
            <issue>4</issue>
            <fpage>332</fpage>
            <lpage>338</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S1369-5266(02)00268-6</pubid>
                  <pubid idtype="pmpid">12179967</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B22">
            <title>
               <p>A human-specific gene in microglia</p>
            </title>
            <aug>
               <au>
                  <snm>Hayakawa</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Angata</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Lewis</snm>
                  <fnm>AL</fnm>
               </au>
               <au>
                  <snm>Mikkelsen</snm>
                  <fnm>TS</fnm>
               </au>
               <au>
                  <snm>Varki</snm>
                  <fnm>NM</fnm>
               </au>
               <au>
                  <snm>Varki</snm>
                  <fnm>A</fnm>
               </au>
            </aug>
            <source>Science</source>
            <pubdate>2005</pubdate>
            <volume>309</volume>
            <issue>5741</issue>
            <fpage>1693</fpage>
            <lpage>1693</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">16151003</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B23">
            <title>
               <p>Pseudogenes: are they "junk" or functional DNA?</p>
            </title>
            <aug>
               <au>
                  <snm>Balakirev</snm>
                  <fnm>ES</fnm>
               </au>
               <au>
                  <snm>Ayala</snm>
                  <fnm>FJ</fnm>
               </au>
            </aug>
            <source>Annu Rev Genet</source>
            <pubdate>2003</pubdate>
            <volume>37</volume>
            <fpage>123</fpage>
            <lpage>151</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1146/annurev.genet.37.040103.103949</pubid>
                  <pubid idtype="pmpid" link="fulltext">14616058</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B24">
            <title>
               <p>Novel disease resistance specificities result from sequence exchange between tandemly repeated genes at the Cf-4/9 locus of tomato</p>
            </title>
            <aug>
               <au>
                  <snm>Parniske</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>HammondKosack</snm>
                  <fnm>KE</fnm>
               </au>
               <au>
                  <snm>Golstein</snm>
                  <fnm>C</fnm>
               </au>
               <au>
                  <snm>Thomas</snm>
                  <fnm>CM</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>DA</fnm>
               </au>
               <au>
                  <snm>Harrison</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Wulff</snm>
                  <fnm>BBH</fnm>
               </au>
               <au>
                  <snm>Jones</snm>
                  <fnm>JDG</fnm>
               </au>
            </aug>
            <source>Cell</source>
            <pubdate>1997</pubdate>
            <volume>91</volume>
            <issue>6</issue>
            <fpage>821</fpage>
            <lpage>832</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0092-8674(00)80470-5</pubid>
                  <pubid idtype="pmpid" link="fulltext">9413991</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B25">
            <title>
               <p>Accuracy and power of statistical methods for detecting adaptive evolution in protein coding sequences and for identifying positively selected sites</p>
            </title>
            <aug>
               <au>
                  <snm>Wong</snm>
                  <fnm>WSW</fnm>
               </au>
               <au>
                  <snm>Yang</snm>
                  <fnm>ZH</fnm>
               </au>
               <au>
                  <snm>Goldman</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Nielsen</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Genetics</source>
            <pubdate>2004</pubdate>
            <volume>168</volume>
            <issue>2</issue>
            <fpage>1041</fpage>
            <lpage>1051</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1448811</pubid>
                  <pubid idtype="pmpid" link="fulltext">15514074</pubid>
                  <pubid idtype="doi">10.1534/genetics.104.031153</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B26">
            <title>
               <p>Multiple genetic processes result in heterogeneous rates of evolution within the major cluster disease resistance genes in lettuce</p>
            </title>
            <aug>
               <au>
                  <snm>Kuang</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Woo</snm>
                  <fnm>SS</fnm>
               </au>
               <au>
                  <snm>Meyers</snm>
                  <fnm>BC</fnm>
               </au>
               <au>
                  <snm>Nevo</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Michelmore</snm>
                  <fnm>RW</fnm>
               </au>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2004</pubdate>
            <volume>16</volume>
            <issue>11</issue>
            <fpage>2870</fpage>
            <lpage>2894</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">527186</pubid>
                  <pubid idtype="pmpid" link="fulltext">15494555</pubid>
                  <pubid idtype="doi">10.1105/tpc.104.025502</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B27">
            <title>
               <p>Rapid Duplication and Loss of Genes-Coding for the Alpha-Chains of Hemoglobin</p>
            </title>
            <aug>
               <au>
                  <snm>Zimmer</snm>
                  <fnm>EA</fnm>
               </au>
               <au>
                  <snm>Martin</snm>
                  <fnm>SL</fnm>
               </au>
               <au>
                  <snm>Beverley</snm>
                  <fnm>SM</fnm>
               </au>
               <au>
                  <snm>Kan</snm>
                  <fnm>YW</fnm>
               </au>
               <au>
                  <snm>Wilson</snm>
                  <fnm>AC</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1980</pubdate>
            <volume>77</volume>
            <issue>4</issue>
            <fpage>2158</fpage>
            <lpage>2162</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">348671</pubid>
                  <pubid idtype="pmpid">6929543</pubid>
                  <pubid idtype="doi">10.1073/pnas.77.4.2158</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B28">
            <title>
               <p>Role of Diversifying Selection and Gene Conversion in Evolution of Major Histocompatibility Complex Loci</p>
            </title>
            <aug>
               <au>
                  <snm>Ohta</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Proc Natl Acad Sci USA</source>
            <pubdate>1991</pubdate>
            <volume>88</volume>
            <issue>15</issue>
            <fpage>6716</fpage>
            <lpage>6720</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">52159</pubid>
                  <pubid idtype="pmpid" link="fulltext">1862096</pubid>
                  <pubid idtype="doi">10.1073/pnas.88.15.6716</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B29">
            <title>
               <p>Role of gene conversion in generating polymorphisms at major histocompatibility complex loci</p>
            </title>
            <aug>
               <au>
                  <snm>Ohta</snm>
                  <fnm>T</fnm>
               </au>
            </aug>
            <source>Hereditas</source>
            <pubdate>1997</pubdate>
            <volume>127</volume>
            <issue>1&#8211;2</issue>
            <fpage>97</fpage>
            <lpage>103</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1111/j.1601-5223.1997.00097.x</pubid>
                  <pubid idtype="pmpid">9420475</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B30">
            <title>
               <p>Collection, mapping, and annotation of over 28,000 cDNA clones from japonica rice</p>
            </title>
            <aug>
               <au>
                  <snm>Kikuchi</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Satoh</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Nagata</snm>
                  <fnm>T</fnm>
               </au>
               <au>
                  <snm>Kawagashira</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Doi</snm>
                  <fnm>K</fnm>
               </au>
               <au>
                  <snm>Kishimoto</snm>
                  <fnm>N</fnm>
               </au>
               <au>
                  <snm>Yazaki</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Ishikawa</snm>
                  <fnm>M</fnm>
               </au>
               <au>
                  <snm>Yamada</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Ooka</snm>
                  <fnm>H</fnm>
               </au>
               <etal/>
            </aug>
            <source>Science</source>
            <pubdate>2003</pubdate>
            <volume>301</volume>
            <issue>5631</issue>
            <fpage>376</fpage>
            <lpage>379</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1126/science.1081288</pubid>
                  <pubid idtype="pmpid" link="fulltext">12869764</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B31">
            <title>
               <p>BLAT &#8211; the BLAST-like alignment tool</p>
            </title>
            <aug>
               <au>
                  <snm>Kent</snm>
                  <fnm>WJ</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2002</pubdate>
            <volume>12</volume>
            <issue>4</issue>
            <fpage>656</fpage>
            <lpage>664</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">187518</pubid>
                  <pubid idtype="pmpid" link="fulltext">11932250</pubid>
                  <pubid idtype="doi">10.1101/gr.229202. Article published online before March 2002</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B32">
            <title>
               <p>Repeats in genomic DNA: mining and meaning</p>
            </title>
            <aug>
               <au>
                  <snm>Jurka</snm>
                  <fnm>J</fnm>
               </au>
            </aug>
            <source>Curr Opin Struct Biol</source>
            <pubdate>1998</pubdate>
            <volume>8</volume>
            <issue>3</issue>
            <fpage>333</fpage>
            <lpage>337</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1016/S0959-440X(98)80067-5</pubid>
                  <pubid idtype="pmpid" link="fulltext">9666329</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B33">
            <title>
               <p>High rate of chimeric gene origination by retroposition in plant genomes</p>
            </title>
            <aug>
               <au>
                  <snm>Wang</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Zheng</snm>
                  <fnm>HK</fnm>
               </au>
               <au>
                  <snm>Fan</snm>
                  <fnm>CZ</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Shi</snm>
                  <fnm>JJ</fnm>
               </au>
               <au>
                  <snm>Cai</snm>
                  <fnm>ZQ</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>GJ</fnm>
               </au>
               <au>
                  <snm>Liu</snm>
                  <fnm>DY</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>JG</fnm>
               </au>
               <au>
                  <snm>Vang</snm>
                  <fnm>S</fnm>
               </au>
               <etal/>
            </aug>
            <source>Plant Cell</source>
            <pubdate>2006</pubdate>
            <volume>18</volume>
            <issue>8</issue>
            <fpage>1791</fpage>
            <lpage>1802</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1533979</pubid>
                  <pubid idtype="pmpid" link="fulltext">16829590</pubid>
                  <pubid idtype="doi">10.1105/tpc.106.041905</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B34">
            <title>
               <p>Basic local alignment search tool</p>
            </title>
            <aug>
               <au>
                  <snm>Altschul</snm>
                  <fnm>SF</fnm>
               </au>
               <au>
                  <snm>Gish</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Miller</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Myers</snm>
                  <fnm>EW</fnm>
               </au>
               <au>
                  <snm>Lipman</snm>
                  <fnm>DJ</fnm>
               </au>
            </aug>
            <source>J Mol Biol</source>
            <pubdate>1990</pubdate>
            <volume>215</volume>
            <issue>3</issue>
            <fpage>403</fpage>
            <lpage>410</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">2231712</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B35">
            <title>
               <p>FGF: a web tool for Fishing Gene Family in a whole genome database</p>
            </title>
            <aug>
               <au>
                  <snm>Zheng</snm>
                  <fnm>H</fnm>
               </au>
               <au>
                  <snm>Shi</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Fang</snm>
                  <fnm>X</fnm>
               </au>
               <au>
                  <snm>Li</snm>
                  <fnm>Y</fnm>
               </au>
               <au>
                  <snm>Vang</snm>
                  <fnm>S</fnm>
               </au>
               <au>
                  <snm>Fan</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>J</fnm>
               </au>
               <au>
                  <snm>Zhang</snm>
                  <fnm>Z</fnm>
               </au>
               <au>
                  <snm>Wang</snm>
                  <fnm>W</fnm>
               </au>
               <au>
                  <snm>Kristiansen</snm>
                  <fnm>K</fnm>
               </au>
               <etal/>
            </aug>
            <source>Nucleic Acids Res</source>
            <pubdate>2007</pubdate>
            <issue>35 Web Server</issue>
            <fpage>W121</fpage>
            <lpage>125</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">1933194</pubid>
                  <pubid idtype="pmpid" link="fulltext">17584790</pubid>
                  <pubid idtype="doi">10.1093/nar/gkm426</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B36">
            <title>
               <p>Using GeneWise in the Drosophila annotation experiment</p>
            </title>
            <aug>
               <au>
                  <snm>Birney</snm>
                  <fnm>E</fnm>
               </au>
               <au>
                  <snm>Durbin</snm>
                  <fnm>R</fnm>
               </au>
            </aug>
            <source>Genome Res</source>
            <pubdate>2000</pubdate>
            <volume>10</volume>
            <issue>4</issue>
            <fpage>547</fpage>
            <lpage>548</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="pmcid">310858</pubid>
                  <pubid idtype="pmpid" link="fulltext">10779496</pubid>
                  <pubid idtype="doi">10.1101/gr.10.4.547</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B37">
            <title>
               <p>Statistical Tests for Detecting Gene Conversion</p>
            </title>
            <aug>
               <au>
                  <snm>Sawyer</snm>
                  <fnm>S</fnm>
               </au>
            </aug>
            <source>Mol Biol Evol</source>
            <pubdate>1989</pubdate>
            <volume>6</volume>
            <issue>5</issue>
            <fpage>526</fpage>
            <lpage>538</lpage>
            <xrefbib>
               <pubid idtype="pmpid" link="fulltext">2677599</pubid>
            </xrefbib>
         </bibl>
         <bibl id="B38">
            <title>
               <p>Unbiased Estimation of the Rates of Synonymous and Nonsynonymous Substitution</p>
            </title>
            <aug>
               <au>
                  <snm>Li</snm>
                  <fnm>WH</fnm>
               </au>
            </aug>
            <source>J Mol Evol</source>
            <pubdate>1993</pubdate>
            <volume>36</volume>
            <issue>1</issue>
            <fpage>96</fpage>
            <lpage>99</lpage>
            <xrefbib>
               <pubidlist>
                  <pubid idtype="doi">10.1007/BF02407308</pubid>
                  <pubid idtype="pmpid">8433381</pubid>
               </pubidlist>
            </xrefbib>
         </bibl>
         <bibl id="B39">
            <title>
               <p>NCBI</p>
            </title>
            <url>http://www.ncbi.nlm.nih.gov/</url>
         </bibl>
      </refgrp>
   </bm>
</art>
